diff --git "a/trainer_state.json" "b/trainer_state.json" new file mode 100644--- /dev/null +++ "b/trainer_state.json" @@ -0,0 +1,228792 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 2.9998819780479167, + "eval_steps": 500, + "global_step": 38127, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0, + "learning_rate": 0.00029999999949079136, + "loss": 10.8263, + "step": 1 + }, + { + "epoch": 0.0, + "learning_rate": 0.0002999999979631655, + "loss": 9.6257, + "step": 2 + }, + { + "epoch": 0.0, + "learning_rate": 0.0002999999954171225, + "loss": 10.047, + "step": 3 + }, + { + "epoch": 0.0, + "learning_rate": 0.00029999999185266224, + "loss": 10.146, + "step": 4 + }, + { + "epoch": 0.0, + "learning_rate": 0.00029999998726978487, + "loss": 9.148, + "step": 5 + }, + { + "epoch": 0.0, + "learning_rate": 0.0002999999816684903, + "loss": 8.6304, + "step": 6 + }, + { + "epoch": 0.0, + "learning_rate": 0.0002999999750487787, + "loss": 8.3464, + "step": 7 + }, + { + "epoch": 0.0, + "learning_rate": 0.00029999996741064997, + "loss": 8.1256, + "step": 8 + }, + { + "epoch": 0.0, + "learning_rate": 0.00029999995875410433, + "loss": 7.8647, + "step": 9 + }, + { + "epoch": 0.0, + "learning_rate": 0.0002999999490791416, + "loss": 7.6842, + "step": 10 + }, + { + "epoch": 0.0, + "learning_rate": 0.0002999999383857622, + "loss": 7.5368, + "step": 11 + }, + { + "epoch": 0.0, + "learning_rate": 0.00029999992667396587, + "loss": 7.4578, + "step": 12 + }, + { + "epoch": 0.0, + "learning_rate": 0.0002999999139437528, + "loss": 7.3552, + "step": 13 + }, + { + "epoch": 0.0, + "learning_rate": 0.0002999999001951231, + "loss": 7.3954, + "step": 14 + }, + { + "epoch": 0.0, + "learning_rate": 0.0002999998854280769, + "loss": 7.3702, + "step": 15 + }, + { + "epoch": 0.0, + "learning_rate": 0.0002999998696426142, + "loss": 7.3327, + "step": 16 + }, + { + "epoch": 0.0, + "learning_rate": 0.0002999998528387352, + "loss": 7.3107, + "step": 17 + }, + { + "epoch": 0.0, + "learning_rate": 0.00029999983501643996, + "loss": 7.2468, + "step": 18 + }, + { + "epoch": 0.0, + "learning_rate": 0.00029999981617572863, + "loss": 7.2979, + "step": 19 + }, + { + "epoch": 0.0, + "learning_rate": 0.0002999997963166013, + "loss": 7.2101, + "step": 20 + }, + { + "epoch": 0.0, + "learning_rate": 0.0002999997754390582, + "loss": 7.2101, + "step": 21 + }, + { + "epoch": 0.0, + "learning_rate": 0.0002999997535430993, + "loss": 7.1943, + "step": 22 + }, + { + "epoch": 0.0, + "learning_rate": 0.0002999997306287249, + "loss": 7.1691, + "step": 23 + }, + { + "epoch": 0.0, + "learning_rate": 0.00029999970669593513, + "loss": 7.0904, + "step": 24 + }, + { + "epoch": 0.0, + "learning_rate": 0.0002999996817447301, + "loss": 7.097, + "step": 25 + }, + { + "epoch": 0.0, + "learning_rate": 0.00029999965577511, + "loss": 7.1219, + "step": 26 + }, + { + "epoch": 0.0, + "learning_rate": 0.00029999962878707505, + "loss": 7.0476, + "step": 27 + }, + { + "epoch": 0.0, + "learning_rate": 0.00029999960078062535, + "loss": 7.0578, + "step": 28 + }, + { + "epoch": 0.0, + "learning_rate": 0.0002999995717557612, + "loss": 7.0238, + "step": 29 + }, + { + "epoch": 0.0, + "learning_rate": 0.00029999954171248266, + "loss": 6.9804, + "step": 30 + }, + { + "epoch": 0.0, + "learning_rate": 0.00029999951065079, + "loss": 6.997, + "step": 31 + }, + { + "epoch": 0.0, + "learning_rate": 0.00029999947857068353, + "loss": 6.9591, + "step": 32 + }, + { + "epoch": 0.0, + "learning_rate": 0.00029999944547216335, + "loss": 6.9196, + "step": 33 + }, + { + "epoch": 0.0, + "learning_rate": 0.0002999994113552296, + "loss": 6.8851, + "step": 34 + }, + { + "epoch": 0.0, + "learning_rate": 0.0002999993762198828, + "loss": 6.8979, + "step": 35 + }, + { + "epoch": 0.0, + "learning_rate": 0.0002999993400661229, + "loss": 6.788, + "step": 36 + }, + { + "epoch": 0.0, + "learning_rate": 0.0002999993028939503, + "loss": 6.7845, + "step": 37 + }, + { + "epoch": 0.0, + "learning_rate": 0.0002999992647033652, + "loss": 6.7746, + "step": 38 + }, + { + "epoch": 0.0, + "learning_rate": 0.0002999992254943678, + "loss": 6.7175, + "step": 39 + }, + { + "epoch": 0.0, + "learning_rate": 0.0002999991852669585, + "loss": 6.6889, + "step": 40 + }, + { + "epoch": 0.0, + "learning_rate": 0.00029999914402113753, + "loss": 6.6795, + "step": 41 + }, + { + "epoch": 0.0, + "learning_rate": 0.00029999910175690516, + "loss": 6.6665, + "step": 42 + }, + { + "epoch": 0.0, + "learning_rate": 0.0002999990584742616, + "loss": 6.6377, + "step": 43 + }, + { + "epoch": 0.0, + "learning_rate": 0.0002999990141732072, + "loss": 6.5646, + "step": 44 + }, + { + "epoch": 0.0, + "learning_rate": 0.00029999896885374235, + "loss": 6.4904, + "step": 45 + }, + { + "epoch": 0.0, + "learning_rate": 0.00029999892251586724, + "loss": 6.4492, + "step": 46 + }, + { + "epoch": 0.0, + "learning_rate": 0.0002999988751595822, + "loss": 6.4633, + "step": 47 + }, + { + "epoch": 0.0, + "learning_rate": 0.0002999988267848876, + "loss": 6.4431, + "step": 48 + }, + { + "epoch": 0.0, + "learning_rate": 0.00029999877739178376, + "loss": 6.4306, + "step": 49 + }, + { + "epoch": 0.0, + "learning_rate": 0.00029999872698027095, + "loss": 6.4155, + "step": 50 + }, + { + "epoch": 0.0, + "learning_rate": 0.0002999986755503496, + "loss": 6.3593, + "step": 51 + }, + { + "epoch": 0.0, + "learning_rate": 0.00029999862310202, + "loss": 6.3509, + "step": 52 + }, + { + "epoch": 0.0, + "learning_rate": 0.0002999985696352825, + "loss": 6.2662, + "step": 53 + }, + { + "epoch": 0.0, + "learning_rate": 0.00029999851515013755, + "loss": 6.3003, + "step": 54 + }, + { + "epoch": 0.0, + "learning_rate": 0.00029999845964658544, + "loss": 6.2946, + "step": 55 + }, + { + "epoch": 0.0, + "learning_rate": 0.0002999984031246265, + "loss": 6.2259, + "step": 56 + }, + { + "epoch": 0.0, + "learning_rate": 0.00029999834558426124, + "loss": 6.1623, + "step": 57 + }, + { + "epoch": 0.0, + "learning_rate": 0.00029999828702549, + "loss": 6.1292, + "step": 58 + }, + { + "epoch": 0.0, + "learning_rate": 0.00029999822744831316, + "loss": 6.137, + "step": 59 + }, + { + "epoch": 0.0, + "learning_rate": 0.00029999816685273106, + "loss": 6.0887, + "step": 60 + }, + { + "epoch": 0.0, + "learning_rate": 0.00029999810523874426, + "loss": 6.0979, + "step": 61 + }, + { + "epoch": 0.0, + "learning_rate": 0.00029999804260635307, + "loss": 6.0342, + "step": 62 + }, + { + "epoch": 0.0, + "learning_rate": 0.000299997978955558, + "loss": 5.9838, + "step": 63 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029999791428635933, + "loss": 5.9474, + "step": 64 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999978485987577, + "loss": 5.9451, + "step": 65 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999977818927534, + "loss": 5.9931, + "step": 66 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999977141683469, + "loss": 5.8736, + "step": 67 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999976454255388, + "loss": 5.8801, + "step": 68 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029999757566432934, + "loss": 5.8562, + "step": 69 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999975048847192, + "loss": 5.8236, + "step": 70 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029999743308670873, + "loss": 5.8224, + "step": 71 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999973602702985, + "loss": 5.7981, + "step": 72 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029999728643548897, + "loss": 5.7025, + "step": 73 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029999721158228065, + "loss": 5.6899, + "step": 74 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029999713571067396, + "loss": 5.653, + "step": 75 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999970588206696, + "loss": 5.6553, + "step": 76 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029999698091226793, + "loss": 5.5973, + "step": 77 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999969019854695, + "loss": 5.6341, + "step": 78 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029999682204027495, + "loss": 5.6035, + "step": 79 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999967410766848, + "loss": 5.5762, + "step": 80 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999966590946994, + "loss": 5.5966, + "step": 81 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029999657609431957, + "loss": 5.6069, + "step": 82 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029999649207554575, + "loss": 5.51, + "step": 83 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999964070383785, + "loss": 5.5384, + "step": 84 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999963209828184, + "loss": 5.4613, + "step": 85 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999962339088661, + "loss": 5.5278, + "step": 86 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999961458165221, + "loss": 5.4587, + "step": 87 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029999605670578706, + "loss": 5.4138, + "step": 88 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029999596657666165, + "loss": 5.4319, + "step": 89 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029999587542914633, + "loss": 5.3703, + "step": 90 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029999578326324176, + "loss": 5.3929, + "step": 91 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029999569007894863, + "loss": 5.3934, + "step": 92 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029999559587626755, + "loss": 5.3809, + "step": 93 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029999550065519916, + "loss": 5.4258, + "step": 94 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029999540441574406, + "loss": 5.3402, + "step": 95 + }, + { + "epoch": 0.01, + "learning_rate": 0.000299995307157903, + "loss": 5.3044, + "step": 96 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999952088816765, + "loss": 5.387, + "step": 97 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029999510958706534, + "loss": 5.3063, + "step": 98 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999950092740702, + "loss": 5.2135, + "step": 99 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999949079426916, + "loss": 5.219, + "step": 100 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029999480559293046, + "loss": 5.1805, + "step": 101 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999947022247873, + "loss": 5.1834, + "step": 102 + }, + { + "epoch": 0.01, + "learning_rate": 0.000299994597838263, + "loss": 5.2355, + "step": 103 + }, + { + "epoch": 0.01, + "learning_rate": 0.000299994492433358, + "loss": 5.1719, + "step": 104 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029999438601007323, + "loss": 5.1662, + "step": 105 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029999427856840943, + "loss": 5.1674, + "step": 106 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029999417010836716, + "loss": 5.1132, + "step": 107 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999940606299473, + "loss": 5.126, + "step": 108 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029999395013315046, + "loss": 5.1225, + "step": 109 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029999383861797755, + "loss": 5.104, + "step": 110 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029999372608442926, + "loss": 5.0844, + "step": 111 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999936125325063, + "loss": 5.047, + "step": 112 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029999349796220947, + "loss": 5.0473, + "step": 113 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029999338237353965, + "loss": 4.9838, + "step": 114 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029999326576649743, + "loss": 5.0187, + "step": 115 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029999314814108374, + "loss": 4.9802, + "step": 116 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999930294972994, + "loss": 5.0482, + "step": 117 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029999290983514506, + "loss": 5.0848, + "step": 118 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029999278915462176, + "loss": 4.987, + "step": 119 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029999266745573013, + "loss": 5.0122, + "step": 120 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029999254473847103, + "loss": 5.0057, + "step": 121 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999924210028454, + "loss": 4.9281, + "step": 122 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999922962488539, + "loss": 4.9386, + "step": 123 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029999217047649757, + "loss": 4.9355, + "step": 124 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999920436857772, + "loss": 4.8219, + "step": 125 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029999191587669355, + "loss": 4.8698, + "step": 126 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029999178704924755, + "loss": 4.897, + "step": 127 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029999165720344016, + "loss": 4.8923, + "step": 128 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029999152633927213, + "loss": 4.8457, + "step": 129 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029999139445674444, + "loss": 4.8464, + "step": 130 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029999126155585797, + "loss": 4.8345, + "step": 131 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029999112763661357, + "loss": 4.8542, + "step": 132 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999909926990122, + "loss": 4.8239, + "step": 133 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029999085674305473, + "loss": 4.8497, + "step": 134 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999907197687422, + "loss": 4.7598, + "step": 135 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029999058177607537, + "loss": 4.8297, + "step": 136 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999904427650553, + "loss": 4.7698, + "step": 137 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999903027356829, + "loss": 4.781, + "step": 138 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999901616879591, + "loss": 4.7935, + "step": 139 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999900196218849, + "loss": 4.7196, + "step": 140 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999898765374612, + "loss": 4.7244, + "step": 141 + }, + { + "epoch": 0.01, + "learning_rate": 0.000299989732434689, + "loss": 4.6923, + "step": 142 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999895873135693, + "loss": 4.7321, + "step": 143 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029998944117410307, + "loss": 4.6675, + "step": 144 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029998929401629137, + "loss": 4.6667, + "step": 145 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029998914584013507, + "loss": 4.659, + "step": 146 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029998899664563527, + "loss": 4.7102, + "step": 147 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029998884643279294, + "loss": 4.6546, + "step": 148 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999886952016091, + "loss": 4.6442, + "step": 149 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029998854295208477, + "loss": 4.6421, + "step": 150 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029998838968422104, + "loss": 4.6408, + "step": 151 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999882353980189, + "loss": 4.6317, + "step": 152 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999880800934795, + "loss": 4.5644, + "step": 153 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999879237706037, + "loss": 4.6313, + "step": 154 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029998776642939265, + "loss": 4.623, + "step": 155 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999876080698475, + "loss": 4.5865, + "step": 156 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029998744869196925, + "loss": 4.4979, + "step": 157 + }, + { + "epoch": 0.01, + "learning_rate": 0.000299987288295759, + "loss": 4.5336, + "step": 158 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999871268812178, + "loss": 4.5288, + "step": 159 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999869644483468, + "loss": 4.4542, + "step": 160 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999868009971471, + "loss": 4.4658, + "step": 161 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029998663652761975, + "loss": 4.4747, + "step": 162 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999864710397659, + "loss": 4.4708, + "step": 163 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029998630453358674, + "loss": 4.477, + "step": 164 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999861370090833, + "loss": 4.5103, + "step": 165 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999859684662568, + "loss": 4.4611, + "step": 166 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029998579890510825, + "loss": 4.4862, + "step": 167 + }, + { + "epoch": 0.01, + "learning_rate": 0.000299985628325639, + "loss": 4.4651, + "step": 168 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999854567278501, + "loss": 4.4672, + "step": 169 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029998528411174266, + "loss": 4.4404, + "step": 170 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999851104773179, + "loss": 4.4826, + "step": 171 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029998493582457706, + "loss": 4.4619, + "step": 172 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029998476015352123, + "loss": 4.3926, + "step": 173 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029998458346415166, + "loss": 4.385, + "step": 174 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029998440575646954, + "loss": 4.3887, + "step": 175 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029998422703047606, + "loss": 4.4201, + "step": 176 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029998404728617253, + "loss": 4.3839, + "step": 177 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029998386652355997, + "loss": 4.4229, + "step": 178 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999836847426398, + "loss": 4.3861, + "step": 179 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029998350194341313, + "loss": 4.332, + "step": 180 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999833181258813, + "loss": 4.3391, + "step": 181 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999831332900455, + "loss": 4.3121, + "step": 182 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999829474359069, + "loss": 4.3118, + "step": 183 + }, + { + "epoch": 0.01, + "learning_rate": 0.000299982760563467, + "loss": 4.3351, + "step": 184 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029998257267272685, + "loss": 4.3679, + "step": 185 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029998238376368773, + "loss": 4.2416, + "step": 186 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029998219383635107, + "loss": 4.3281, + "step": 187 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029998200289071806, + "loss": 4.278, + "step": 188 + }, + { + "epoch": 0.01, + "learning_rate": 0.00029998181092679, + "loss": 4.2585, + "step": 189 + }, + { + "epoch": 0.01, + "learning_rate": 0.0002999816179445683, + "loss": 4.3055, + "step": 190 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999814239440541, + "loss": 4.1961, + "step": 191 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999812289252488, + "loss": 4.2319, + "step": 192 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999810328881538, + "loss": 4.2092, + "step": 193 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999808358327702, + "loss": 4.3242, + "step": 194 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029998063775909964, + "loss": 4.1855, + "step": 195 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029998043866714323, + "loss": 4.303, + "step": 196 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029998023855690246, + "loss": 4.1591, + "step": 197 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029998003742837863, + "loss": 4.1983, + "step": 198 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999798352815731, + "loss": 4.3276, + "step": 199 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999796321164872, + "loss": 4.2653, + "step": 200 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029997942793312245, + "loss": 4.2074, + "step": 201 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999792227314801, + "loss": 4.2234, + "step": 202 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999790165115616, + "loss": 4.2097, + "step": 203 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999788092733683, + "loss": 4.2144, + "step": 204 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999786010169017, + "loss": 4.1698, + "step": 205 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999783917421632, + "loss": 4.2162, + "step": 206 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029997818144915416, + "loss": 4.1766, + "step": 207 + }, + { + "epoch": 0.02, + "learning_rate": 0.000299977970137876, + "loss": 4.0721, + "step": 208 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029997775780833024, + "loss": 4.1178, + "step": 209 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999775444605182, + "loss": 4.1111, + "step": 210 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029997733009444146, + "loss": 4.1418, + "step": 211 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999771147101014, + "loss": 4.1061, + "step": 212 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999768983074995, + "loss": 4.1108, + "step": 213 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029997668088663714, + "loss": 4.1349, + "step": 214 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029997646244751597, + "loss": 4.0807, + "step": 215 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029997624299013737, + "loss": 4.1052, + "step": 216 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999760225145028, + "loss": 4.118, + "step": 217 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999758010206139, + "loss": 4.1122, + "step": 218 + }, + { + "epoch": 0.02, + "learning_rate": 0.000299975578508472, + "loss": 4.1162, + "step": 219 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999753549780787, + "loss": 4.1254, + "step": 220 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029997513042943544, + "loss": 4.0779, + "step": 221 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999749048625439, + "loss": 4.0547, + "step": 222 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999746782774055, + "loss": 4.081, + "step": 223 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029997445067402175, + "loss": 4.0886, + "step": 224 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999742220523943, + "loss": 4.0712, + "step": 225 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029997399241252465, + "loss": 4.1302, + "step": 226 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999737617544143, + "loss": 3.97, + "step": 227 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999735300780649, + "loss": 4.0399, + "step": 228 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029997329738347796, + "loss": 4.0173, + "step": 229 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029997306367065516, + "loss": 4.026, + "step": 230 + }, + { + "epoch": 0.02, + "learning_rate": 0.000299972828939598, + "loss": 4.0269, + "step": 231 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029997259319030804, + "loss": 4.037, + "step": 232 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999723564227869, + "loss": 3.9136, + "step": 233 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029997211863703636, + "loss": 3.9446, + "step": 234 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999718798330578, + "loss": 3.9837, + "step": 235 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029997164001085297, + "loss": 4.0232, + "step": 236 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029997139917042345, + "loss": 3.9559, + "step": 237 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029997115731177093, + "loss": 3.9762, + "step": 238 + }, + { + "epoch": 0.02, + "learning_rate": 0.000299970914434897, + "loss": 3.9527, + "step": 239 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029997067053980325, + "loss": 3.9775, + "step": 240 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999704256264915, + "loss": 3.9603, + "step": 241 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029997017969496327, + "loss": 3.9555, + "step": 242 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999699327452203, + "loss": 3.9495, + "step": 243 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999696847772642, + "loss": 3.9491, + "step": 244 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029996943579109676, + "loss": 3.9303, + "step": 245 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999691857867196, + "loss": 3.8839, + "step": 246 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999689347641344, + "loss": 3.9252, + "step": 247 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029996868272334293, + "loss": 3.9429, + "step": 248 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999684296643468, + "loss": 3.9003, + "step": 249 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029996817558714786, + "loss": 3.9223, + "step": 250 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029996792049174776, + "loss": 3.9366, + "step": 251 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999676643781482, + "loss": 3.9667, + "step": 252 + }, + { + "epoch": 0.02, + "learning_rate": 0.000299967407246351, + "loss": 3.8674, + "step": 253 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999671490963578, + "loss": 3.8993, + "step": 254 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999668899281705, + "loss": 3.8674, + "step": 255 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029996662974179076, + "loss": 3.8797, + "step": 256 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999663685372203, + "loss": 3.8734, + "step": 257 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029996610631446096, + "loss": 3.8857, + "step": 258 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999658430735146, + "loss": 3.7975, + "step": 259 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999655788143829, + "loss": 3.9391, + "step": 260 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029996531353706764, + "loss": 3.8268, + "step": 261 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029996504724157065, + "loss": 3.8626, + "step": 262 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029996477992789376, + "loss": 3.8168, + "step": 263 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999645115960388, + "loss": 3.8726, + "step": 264 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029996424224600754, + "loss": 3.8246, + "step": 265 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029996397187780186, + "loss": 3.8001, + "step": 266 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029996370049142353, + "loss": 3.7944, + "step": 267 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999634280868744, + "loss": 3.6991, + "step": 268 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999631546641564, + "loss": 3.8191, + "step": 269 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999628802232713, + "loss": 3.7679, + "step": 270 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999626047642211, + "loss": 3.8535, + "step": 271 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999623282870075, + "loss": 3.7943, + "step": 272 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029996205079163243, + "loss": 3.7432, + "step": 273 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029996177227809776, + "loss": 3.7871, + "step": 274 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029996149274640554, + "loss": 3.771, + "step": 275 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029996121219655743, + "loss": 3.7222, + "step": 276 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029996093062855544, + "loss": 3.774, + "step": 277 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029996064804240153, + "loss": 3.6882, + "step": 278 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999603644380976, + "loss": 3.7667, + "step": 279 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999600798156455, + "loss": 3.8107, + "step": 280 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999597941750472, + "loss": 3.7369, + "step": 281 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999595075163047, + "loss": 3.715, + "step": 282 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999592198394199, + "loss": 3.7312, + "step": 283 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029995893114439473, + "loss": 3.7781, + "step": 284 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029995864143123117, + "loss": 3.747, + "step": 285 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999583506999312, + "loss": 3.7143, + "step": 286 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029995805895049674, + "loss": 3.7797, + "step": 287 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999577661829299, + "loss": 3.7805, + "step": 288 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999574723972325, + "loss": 3.788, + "step": 289 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999571775934066, + "loss": 3.7218, + "step": 290 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999568817714543, + "loss": 3.7922, + "step": 291 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029995658493137746, + "loss": 3.691, + "step": 292 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999562870731782, + "loss": 3.6587, + "step": 293 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999559881968585, + "loss": 3.7278, + "step": 294 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999556883024204, + "loss": 3.6881, + "step": 295 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999553873898659, + "loss": 3.7996, + "step": 296 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999550854591971, + "loss": 3.6761, + "step": 297 + }, + { + "epoch": 0.02, + "learning_rate": 0.000299954782510416, + "loss": 3.6604, + "step": 298 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999544785435247, + "loss": 3.622, + "step": 299 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999541735585252, + "loss": 3.7345, + "step": 300 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029995386755541964, + "loss": 3.678, + "step": 301 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999535605342101, + "loss": 3.7082, + "step": 302 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029995325249489857, + "loss": 3.7032, + "step": 303 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029995294343748724, + "loss": 3.6546, + "step": 304 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999526333619782, + "loss": 3.7053, + "step": 305 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029995232226837353, + "loss": 3.6493, + "step": 306 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999520101566753, + "loss": 3.6268, + "step": 307 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999516970268857, + "loss": 3.6729, + "step": 308 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029995138287900684, + "loss": 3.6733, + "step": 309 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999510677130408, + "loss": 3.5923, + "step": 310 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029995075152898976, + "loss": 3.6958, + "step": 311 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029995043432685595, + "loss": 3.6217, + "step": 312 + }, + { + "epoch": 0.02, + "learning_rate": 0.00029995011610664134, + "loss": 3.6087, + "step": 313 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999497968683482, + "loss": 3.6249, + "step": 314 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999494766119787, + "loss": 3.6491, + "step": 315 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999491553375351, + "loss": 3.591, + "step": 316 + }, + { + "epoch": 0.02, + "learning_rate": 0.0002999488330450194, + "loss": 3.6178, + "step": 317 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029994850973443383, + "loss": 3.6651, + "step": 318 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999481854057807, + "loss": 3.5771, + "step": 319 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999478600590621, + "loss": 3.6254, + "step": 320 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029994753369428024, + "loss": 3.5805, + "step": 321 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029994720631143745, + "loss": 3.656, + "step": 322 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029994687791053587, + "loss": 3.6891, + "step": 323 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999465484915777, + "loss": 3.5846, + "step": 324 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999462180545653, + "loss": 3.6018, + "step": 325 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999458865995007, + "loss": 3.5023, + "step": 326 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999455541263863, + "loss": 3.5587, + "step": 327 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999452206352244, + "loss": 3.6164, + "step": 328 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999448861260172, + "loss": 3.5607, + "step": 329 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999445505987669, + "loss": 3.6474, + "step": 330 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029994421405347586, + "loss": 3.5786, + "step": 331 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999438764901464, + "loss": 3.5564, + "step": 332 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999435379087808, + "loss": 3.5337, + "step": 333 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029994319830938123, + "loss": 3.5182, + "step": 334 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999428576919501, + "loss": 3.5075, + "step": 335 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029994251605648973, + "loss": 3.6318, + "step": 336 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029994217340300244, + "loss": 3.6346, + "step": 337 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999418297314905, + "loss": 3.4845, + "step": 338 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029994148504195633, + "loss": 3.5481, + "step": 339 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999411393344022, + "loss": 3.4799, + "step": 340 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029994079260883046, + "loss": 3.5433, + "step": 341 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999404448652435, + "loss": 3.5505, + "step": 342 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999400961036437, + "loss": 3.5395, + "step": 343 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999397463240333, + "loss": 3.5285, + "step": 344 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999393955264149, + "loss": 3.5803, + "step": 345 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999390437107906, + "loss": 3.5289, + "step": 346 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029993869087716307, + "loss": 3.516, + "step": 347 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029993833702553446, + "loss": 3.4995, + "step": 348 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029993798215590734, + "loss": 3.4694, + "step": 349 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029993762626828404, + "loss": 3.5153, + "step": 350 + }, + { + "epoch": 0.03, + "learning_rate": 0.000299937269362667, + "loss": 3.5131, + "step": 351 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029993691143905866, + "loss": 3.4829, + "step": 352 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029993655249746146, + "loss": 3.4813, + "step": 353 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999361925378778, + "loss": 3.5926, + "step": 354 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029993583156031007, + "loss": 3.5124, + "step": 355 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999354695647608, + "loss": 3.4817, + "step": 356 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999351065512325, + "loss": 3.4733, + "step": 357 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999347425197275, + "loss": 3.5251, + "step": 358 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999343774702484, + "loss": 3.5314, + "step": 359 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029993401140279756, + "loss": 3.4583, + "step": 360 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999336443173776, + "loss": 3.4635, + "step": 361 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029993327621399086, + "loss": 3.456, + "step": 362 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999329070926399, + "loss": 3.4824, + "step": 363 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029993253695332733, + "loss": 3.4846, + "step": 364 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999321657960555, + "loss": 3.5, + "step": 365 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029993179362082707, + "loss": 3.4837, + "step": 366 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029993142042764444, + "loss": 3.4955, + "step": 367 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999310462165102, + "loss": 3.5033, + "step": 368 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999306709874269, + "loss": 3.4598, + "step": 369 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999302947403971, + "loss": 3.4585, + "step": 370 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999299174754233, + "loss": 3.4963, + "step": 371 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999295391925082, + "loss": 3.5095, + "step": 372 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999291598916542, + "loss": 3.4137, + "step": 373 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999287795728639, + "loss": 3.4546, + "step": 374 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029992839823614, + "loss": 3.4099, + "step": 375 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029992801588148496, + "loss": 3.4493, + "step": 376 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999276325089015, + "loss": 3.4755, + "step": 377 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029992724811839206, + "loss": 3.4423, + "step": 378 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999268627099594, + "loss": 3.4219, + "step": 379 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029992647628360603, + "loss": 3.4129, + "step": 380 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029992608883933465, + "loss": 3.4411, + "step": 381 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999257003771479, + "loss": 3.4778, + "step": 382 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999253108970484, + "loss": 3.4326, + "step": 383 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029992492039903864, + "loss": 3.3993, + "step": 384 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999245288831215, + "loss": 3.3898, + "step": 385 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029992413634929955, + "loss": 3.4255, + "step": 386 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029992374279757546, + "loss": 3.3929, + "step": 387 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029992334822795185, + "loss": 3.4002, + "step": 388 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999229526404315, + "loss": 3.3688, + "step": 389 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029992255603501696, + "loss": 3.3356, + "step": 390 + }, + { + "epoch": 0.03, + "learning_rate": 0.000299922158411711, + "loss": 3.3853, + "step": 391 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029992175977051633, + "loss": 3.3704, + "step": 392 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999213601114357, + "loss": 3.4197, + "step": 393 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999209594344717, + "loss": 3.3395, + "step": 394 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999205577396272, + "loss": 3.3234, + "step": 395 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029992015502690474, + "loss": 3.3223, + "step": 396 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029991975129630723, + "loss": 3.3458, + "step": 397 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029991934654783736, + "loss": 3.3912, + "step": 398 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029991894078149783, + "loss": 3.3862, + "step": 399 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999185339972914, + "loss": 3.365, + "step": 400 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029991812619522087, + "loss": 3.3797, + "step": 401 + }, + { + "epoch": 0.03, + "learning_rate": 0.000299917717375289, + "loss": 3.3347, + "step": 402 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999173075374986, + "loss": 3.3421, + "step": 403 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999168966818523, + "loss": 3.4062, + "step": 404 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999164848083531, + "loss": 3.3438, + "step": 405 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029991607191700366, + "loss": 3.2981, + "step": 406 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029991565800780687, + "loss": 3.3278, + "step": 407 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029991524308076547, + "loss": 3.3876, + "step": 408 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999148271358823, + "loss": 3.3242, + "step": 409 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999144101731601, + "loss": 3.314, + "step": 410 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029991399219260185, + "loss": 3.3267, + "step": 411 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029991357319421037, + "loss": 3.2674, + "step": 412 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029991315317798843, + "loss": 3.3884, + "step": 413 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999127321439389, + "loss": 3.3839, + "step": 414 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999123100920646, + "loss": 3.3184, + "step": 415 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999118870223685, + "loss": 3.3089, + "step": 416 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999114629348534, + "loss": 3.3404, + "step": 417 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999110378295222, + "loss": 3.3075, + "step": 418 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999106117063778, + "loss": 3.3059, + "step": 419 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999101845654231, + "loss": 3.3482, + "step": 420 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999097564066609, + "loss": 3.3484, + "step": 421 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029990932723009415, + "loss": 3.305, + "step": 422 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029990889703572585, + "loss": 3.3064, + "step": 423 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999084658235589, + "loss": 3.263, + "step": 424 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029990803359359616, + "loss": 3.3036, + "step": 425 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999076003458406, + "loss": 3.2776, + "step": 426 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029990716608029516, + "loss": 3.2948, + "step": 427 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999067307969628, + "loss": 3.2468, + "step": 428 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999062944958464, + "loss": 3.2286, + "step": 429 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029990585717694905, + "loss": 3.2593, + "step": 430 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029990541884027366, + "loss": 3.2648, + "step": 431 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029990497948582316, + "loss": 3.2489, + "step": 432 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999045391136006, + "loss": 3.2649, + "step": 433 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029990409772360897, + "loss": 3.2866, + "step": 434 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999036553158512, + "loss": 3.2414, + "step": 435 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029990321189033033, + "loss": 3.2652, + "step": 436 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999027674470494, + "loss": 3.2923, + "step": 437 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029990232198601137, + "loss": 3.23, + "step": 438 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029990187550721934, + "loss": 3.2453, + "step": 439 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999014280106762, + "loss": 3.2658, + "step": 440 + }, + { + "epoch": 0.03, + "learning_rate": 0.0002999009794963852, + "loss": 3.2777, + "step": 441 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029990052996434923, + "loss": 3.3127, + "step": 442 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029990007941457135, + "loss": 3.3072, + "step": 443 + }, + { + "epoch": 0.03, + "learning_rate": 0.00029989962784705474, + "loss": 3.2399, + "step": 444 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998991752618023, + "loss": 3.2192, + "step": 445 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998987216588172, + "loss": 3.2204, + "step": 446 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029989826703810256, + "loss": 3.283, + "step": 447 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998978113996613, + "loss": 3.2228, + "step": 448 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029989735474349665, + "loss": 3.2552, + "step": 449 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029989689706961175, + "loss": 3.2266, + "step": 450 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998964383780096, + "loss": 3.272, + "step": 451 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029989597866869334, + "loss": 3.2204, + "step": 452 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998955179416661, + "loss": 3.2473, + "step": 453 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029989505619693106, + "loss": 3.1992, + "step": 454 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998945934344912, + "loss": 3.2689, + "step": 455 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029989412965434985, + "loss": 3.2824, + "step": 456 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998936648565101, + "loss": 3.2405, + "step": 457 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998931990409751, + "loss": 3.2571, + "step": 458 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998927322077479, + "loss": 3.1744, + "step": 459 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029989226435683184, + "loss": 3.2192, + "step": 460 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029989179548823, + "loss": 3.1929, + "step": 461 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029989132560194557, + "loss": 3.1559, + "step": 462 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998908546979818, + "loss": 3.2255, + "step": 463 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998903827763418, + "loss": 3.16, + "step": 464 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998899098370288, + "loss": 3.1441, + "step": 465 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998894358800461, + "loss": 3.1374, + "step": 466 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998889609053968, + "loss": 3.2022, + "step": 467 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998884849130842, + "loss": 3.2187, + "step": 468 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998880079031115, + "loss": 3.1887, + "step": 469 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029988752987548185, + "loss": 3.1583, + "step": 470 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998870508301987, + "loss": 3.1046, + "step": 471 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998865707672651, + "loss": 3.1383, + "step": 472 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998860896866845, + "loss": 3.1351, + "step": 473 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029988560758845996, + "loss": 3.1745, + "step": 474 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029988512447259494, + "loss": 3.132, + "step": 475 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998846403390926, + "loss": 3.1297, + "step": 476 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998841551879563, + "loss": 3.1711, + "step": 477 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029988366901918925, + "loss": 3.1424, + "step": 478 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029988318183279484, + "loss": 3.1174, + "step": 479 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998826936287763, + "loss": 3.1397, + "step": 480 + }, + { + "epoch": 0.04, + "learning_rate": 0.000299882204407137, + "loss": 3.1701, + "step": 481 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998817141678802, + "loss": 3.1798, + "step": 482 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029988122291100936, + "loss": 3.1283, + "step": 483 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029988073063652766, + "loss": 3.1025, + "step": 484 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029988023734443857, + "loss": 3.1207, + "step": 485 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029987974303474535, + "loss": 3.1344, + "step": 486 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029987924770745136, + "loss": 3.105, + "step": 487 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029987875136256, + "loss": 3.1359, + "step": 488 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029987825400007467, + "loss": 3.1229, + "step": 489 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998777556199987, + "loss": 3.1058, + "step": 490 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029987725622233544, + "loss": 3.0607, + "step": 491 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998767558070883, + "loss": 3.0856, + "step": 492 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998762543742607, + "loss": 2.9987, + "step": 493 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998757519238561, + "loss": 3.0655, + "step": 494 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029987524845587784, + "loss": 3.1465, + "step": 495 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998747439703293, + "loss": 3.1124, + "step": 496 + }, + { + "epoch": 0.04, + "learning_rate": 0.000299874238467214, + "loss": 3.0728, + "step": 497 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998737319465353, + "loss": 3.1369, + "step": 498 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029987322440829667, + "loss": 3.1197, + "step": 499 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998727158525016, + "loss": 3.0726, + "step": 500 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029987220627915344, + "loss": 3.1129, + "step": 501 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029987169568825576, + "loss": 3.0882, + "step": 502 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029987118407981194, + "loss": 3.028, + "step": 503 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029987067145382547, + "loss": 3.0593, + "step": 504 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029987015781029986, + "loss": 3.0912, + "step": 505 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998696431492386, + "loss": 3.0887, + "step": 506 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998691274706452, + "loss": 3.091, + "step": 507 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029986861077452304, + "loss": 3.054, + "step": 508 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029986809306087575, + "loss": 3.0896, + "step": 509 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029986757432970683, + "loss": 3.0379, + "step": 510 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029986705458101976, + "loss": 3.0625, + "step": 511 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998665338148181, + "loss": 3.033, + "step": 512 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998660120311054, + "loss": 3.0174, + "step": 513 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029986548922988514, + "loss": 3.0736, + "step": 514 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029986496541116095, + "loss": 3.0877, + "step": 515 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029986444057493634, + "loss": 2.9844, + "step": 516 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029986391472121494, + "loss": 3.0893, + "step": 517 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998633878500002, + "loss": 3.0505, + "step": 518 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998628599612957, + "loss": 3.0343, + "step": 519 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998623310551052, + "loss": 3.0546, + "step": 520 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029986180113143203, + "loss": 2.9731, + "step": 521 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998612701902801, + "loss": 3.0947, + "step": 522 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998607382316527, + "loss": 3.0458, + "step": 523 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998602052555537, + "loss": 2.9464, + "step": 524 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998596712619865, + "loss": 3.0588, + "step": 525 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998591362509549, + "loss": 3.0908, + "step": 526 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029985860022246246, + "loss": 2.9842, + "step": 527 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998580631765128, + "loss": 3.1067, + "step": 528 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998575251131096, + "loss": 3.0265, + "step": 529 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029985698603225653, + "loss": 2.9895, + "step": 530 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029985644593395717, + "loss": 3.0481, + "step": 531 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998559048182152, + "loss": 3.009, + "step": 532 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998553626850345, + "loss": 3.0404, + "step": 533 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029985481953441847, + "loss": 3.0198, + "step": 534 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029985427536637093, + "loss": 2.9818, + "step": 535 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998537301808955, + "loss": 2.9981, + "step": 536 + }, + { + "epoch": 0.04, + "learning_rate": 0.000299853183977996, + "loss": 3.0112, + "step": 537 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998526367576761, + "loss": 3.058, + "step": 538 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029985208851993945, + "loss": 2.9824, + "step": 539 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029985153926478985, + "loss": 2.9641, + "step": 540 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029985098899223094, + "loss": 3.0193, + "step": 541 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998504377022665, + "loss": 2.9502, + "step": 542 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029984988539490034, + "loss": 2.9858, + "step": 543 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998493320701361, + "loss": 3.031, + "step": 544 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998487777279777, + "loss": 2.9623, + "step": 545 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029984822236842865, + "loss": 3.0078, + "step": 546 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998476659914929, + "loss": 2.9393, + "step": 547 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998471085971743, + "loss": 2.9405, + "step": 548 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029984655018547643, + "loss": 2.9701, + "step": 549 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029984599075640316, + "loss": 2.9684, + "step": 550 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998454303099583, + "loss": 3.0025, + "step": 551 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998448688461457, + "loss": 3.005, + "step": 552 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029984430636496916, + "loss": 2.9699, + "step": 553 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998437428664324, + "loss": 2.955, + "step": 554 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029984317835053936, + "loss": 2.8974, + "step": 555 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029984261281729385, + "loss": 2.9148, + "step": 556 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029984204626669965, + "loss": 3.0008, + "step": 557 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998414786987606, + "loss": 3.0046, + "step": 558 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029984091011348073, + "loss": 2.9123, + "step": 559 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029984034051086365, + "loss": 2.9313, + "step": 560 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029983976989091343, + "loss": 2.9623, + "step": 561 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998391982536338, + "loss": 2.9309, + "step": 562 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998386255990287, + "loss": 2.9293, + "step": 563 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998380519271021, + "loss": 2.8694, + "step": 564 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029983747723785775, + "loss": 2.8473, + "step": 565 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998369015312996, + "loss": 2.933, + "step": 566 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998363248074316, + "loss": 2.9198, + "step": 567 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029983574706625763, + "loss": 2.9053, + "step": 568 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029983516830778164, + "loss": 2.9249, + "step": 569 + }, + { + "epoch": 0.04, + "learning_rate": 0.00029983458853200754, + "loss": 2.9805, + "step": 570 + }, + { + "epoch": 0.04, + "learning_rate": 0.0002998340077389392, + "loss": 2.965, + "step": 571 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029983342592858076, + "loss": 2.8676, + "step": 572 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029983284310093595, + "loss": 2.9428, + "step": 573 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029983225925600884, + "loss": 2.9323, + "step": 574 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002998316743938034, + "loss": 2.8882, + "step": 575 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002998310885143236, + "loss": 2.9232, + "step": 576 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029983050161757333, + "loss": 2.9208, + "step": 577 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029982991370355665, + "loss": 2.8978, + "step": 578 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002998293247722776, + "loss": 2.8934, + "step": 579 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029982873482374, + "loss": 2.9157, + "step": 580 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029982814385794805, + "loss": 2.9203, + "step": 581 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002998275518749057, + "loss": 2.8976, + "step": 582 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002998269588746169, + "loss": 2.912, + "step": 583 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002998263648570858, + "loss": 2.8397, + "step": 584 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029982576982231634, + "loss": 2.8763, + "step": 585 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002998251737703126, + "loss": 2.8731, + "step": 586 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002998245767010785, + "loss": 2.8994, + "step": 587 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002998239786146183, + "loss": 2.8959, + "step": 588 + }, + { + "epoch": 0.05, + "learning_rate": 0.000299823379510936, + "loss": 2.9344, + "step": 589 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002998227793900355, + "loss": 2.9004, + "step": 590 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029982217825192113, + "loss": 2.9039, + "step": 591 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002998215760965968, + "loss": 2.8548, + "step": 592 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029982097292406663, + "loss": 2.8582, + "step": 593 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002998203687343348, + "loss": 2.8568, + "step": 594 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002998197635274053, + "loss": 2.8544, + "step": 595 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029981915730328227, + "loss": 2.9275, + "step": 596 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002998185500619698, + "loss": 2.8658, + "step": 597 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029981794180347214, + "loss": 2.9085, + "step": 598 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002998173325277933, + "loss": 2.8681, + "step": 599 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029981672223493744, + "loss": 2.807, + "step": 600 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002998161109249087, + "loss": 2.848, + "step": 601 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002998154985977113, + "loss": 2.8962, + "step": 602 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002998148852533492, + "loss": 2.9375, + "step": 603 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029981427089182685, + "loss": 2.8912, + "step": 604 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002998136555131482, + "loss": 2.8608, + "step": 605 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002998130391173175, + "loss": 2.8124, + "step": 606 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029981242170433903, + "loss": 2.7887, + "step": 607 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002998118032742168, + "loss": 2.8788, + "step": 608 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002998111838269551, + "loss": 2.8294, + "step": 609 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002998105633625582, + "loss": 2.8548, + "step": 610 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002998099418810302, + "loss": 2.841, + "step": 611 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029980931938237537, + "loss": 2.9162, + "step": 612 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029980869586659795, + "loss": 2.8521, + "step": 613 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002998080713337021, + "loss": 2.8271, + "step": 614 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002998074457836922, + "loss": 2.84, + "step": 615 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029980681921657235, + "loss": 2.7782, + "step": 616 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002998061916323469, + "loss": 2.7358, + "step": 617 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029980556303102, + "loss": 2.8618, + "step": 618 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002998049334125961, + "loss": 2.8669, + "step": 619 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002998043027770794, + "loss": 2.8121, + "step": 620 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029980367112447404, + "loss": 2.841, + "step": 621 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029980303845478446, + "loss": 2.8193, + "step": 622 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029980240476801495, + "loss": 2.8047, + "step": 623 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029980177006416975, + "loss": 2.7937, + "step": 624 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002998011343432532, + "loss": 2.8147, + "step": 625 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002998004976052696, + "loss": 2.8271, + "step": 626 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029979985985022336, + "loss": 2.7999, + "step": 627 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029979922107811866, + "loss": 2.8938, + "step": 628 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029979858128895994, + "loss": 2.8051, + "step": 629 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002997979404827515, + "loss": 2.8158, + "step": 630 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029979729865949777, + "loss": 2.7271, + "step": 631 + }, + { + "epoch": 0.05, + "learning_rate": 0.000299796655819203, + "loss": 2.8752, + "step": 632 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002997960119618716, + "loss": 2.7863, + "step": 633 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029979536708750796, + "loss": 2.763, + "step": 634 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002997947211961164, + "loss": 2.784, + "step": 635 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002997940742877014, + "loss": 2.8061, + "step": 636 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002997934263622673, + "loss": 2.7848, + "step": 637 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029979277741981847, + "loss": 2.7763, + "step": 638 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029979212746035933, + "loss": 2.8128, + "step": 639 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002997914764838943, + "loss": 2.822, + "step": 640 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029979082449042784, + "loss": 2.7838, + "step": 641 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029979017147996437, + "loss": 2.7593, + "step": 642 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002997895174525082, + "loss": 2.7969, + "step": 643 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029978886240806396, + "loss": 2.8005, + "step": 644 + }, + { + "epoch": 0.05, + "learning_rate": 0.000299788206346636, + "loss": 2.8598, + "step": 645 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029978754926822875, + "loss": 2.8033, + "step": 646 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002997868911728467, + "loss": 2.8566, + "step": 647 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002997862320604943, + "loss": 2.8095, + "step": 648 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002997855719311761, + "loss": 2.8218, + "step": 649 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029978491078489644, + "loss": 2.8158, + "step": 650 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029978424862166, + "loss": 2.8407, + "step": 651 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002997835854414711, + "loss": 2.8192, + "step": 652 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002997829212443343, + "loss": 2.7773, + "step": 653 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029978225603025414, + "loss": 2.766, + "step": 654 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029978158979923516, + "loss": 2.7477, + "step": 655 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002997809225512818, + "loss": 2.789, + "step": 656 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002997802542863986, + "loss": 2.7875, + "step": 657 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029977958500459025, + "loss": 2.7513, + "step": 658 + }, + { + "epoch": 0.05, + "learning_rate": 0.000299778914705861, + "loss": 2.773, + "step": 659 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002997782433902157, + "loss": 2.7224, + "step": 660 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002997775710576587, + "loss": 2.7683, + "step": 661 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029977689770819475, + "loss": 2.7416, + "step": 662 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002997762233418283, + "loss": 2.7285, + "step": 663 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002997755479585639, + "loss": 2.7482, + "step": 664 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029977487155840617, + "loss": 2.749, + "step": 665 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002997741941413598, + "loss": 2.7525, + "step": 666 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029977351570742916, + "loss": 2.756, + "step": 667 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002997728362566191, + "loss": 2.7868, + "step": 668 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002997721557889341, + "loss": 2.7722, + "step": 669 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029977147430437887, + "loss": 2.7262, + "step": 670 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002997707918029579, + "loss": 2.6959, + "step": 671 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029977010828467597, + "loss": 2.7339, + "step": 672 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002997694237495376, + "loss": 2.7857, + "step": 673 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029976873819754753, + "loss": 2.7681, + "step": 674 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002997680516287104, + "loss": 2.8482, + "step": 675 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002997673640430308, + "loss": 2.7562, + "step": 676 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029976667544051345, + "loss": 2.7379, + "step": 677 + }, + { + "epoch": 0.05, + "learning_rate": 0.000299765985821163, + "loss": 2.7353, + "step": 678 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029976529518498416, + "loss": 2.7259, + "step": 679 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029976460353198166, + "loss": 2.6819, + "step": 680 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002997639108621601, + "loss": 2.7155, + "step": 681 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002997632171755243, + "loss": 2.7437, + "step": 682 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029976252247207886, + "loss": 2.7525, + "step": 683 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002997618267518285, + "loss": 2.7651, + "step": 684 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029976113001477803, + "loss": 2.7274, + "step": 685 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029976043226093217, + "loss": 2.7239, + "step": 686 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029975973349029555, + "loss": 2.7285, + "step": 687 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029975903370287304, + "loss": 2.7144, + "step": 688 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002997583328986693, + "loss": 2.7124, + "step": 689 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029975763107768907, + "loss": 2.7374, + "step": 690 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002997569282399372, + "loss": 2.6965, + "step": 691 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002997562243854185, + "loss": 2.6688, + "step": 692 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002997555195141376, + "loss": 2.6655, + "step": 693 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029975481362609944, + "loss": 2.7675, + "step": 694 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029975410672130866, + "loss": 2.6698, + "step": 695 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029975339879977016, + "loss": 2.6249, + "step": 696 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029975268986148876, + "loss": 2.7753, + "step": 697 + }, + { + "epoch": 0.05, + "learning_rate": 0.0002997519799064692, + "loss": 2.6617, + "step": 698 + }, + { + "epoch": 0.05, + "learning_rate": 0.00029975126893471636, + "loss": 2.7121, + "step": 699 + }, + { + "epoch": 0.06, + "learning_rate": 0.000299750556946235, + "loss": 2.703, + "step": 700 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029974984394103005, + "loss": 2.6435, + "step": 701 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029974912991910627, + "loss": 2.7209, + "step": 702 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029974841488046854, + "loss": 2.6562, + "step": 703 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002997476988251217, + "loss": 2.7547, + "step": 704 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029974698175307064, + "loss": 2.725, + "step": 705 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029974626366432023, + "loss": 2.6492, + "step": 706 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002997455445588753, + "loss": 2.7403, + "step": 707 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029974482443674073, + "loss": 2.6681, + "step": 708 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002997441032979215, + "loss": 2.6877, + "step": 709 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029974338114242236, + "loss": 2.6949, + "step": 710 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029974265797024836, + "loss": 2.715, + "step": 711 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002997419337814043, + "loss": 2.7013, + "step": 712 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029974120857589523, + "loss": 2.6937, + "step": 713 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029974048235372597, + "loss": 2.7083, + "step": 714 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002997397551149014, + "loss": 2.6838, + "step": 715 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029973902685942656, + "loss": 2.6127, + "step": 716 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002997382975873064, + "loss": 2.6922, + "step": 717 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029973756729854577, + "loss": 2.671, + "step": 718 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029973683599314975, + "loss": 2.6742, + "step": 719 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002997361036711232, + "loss": 2.6964, + "step": 720 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002997353703324711, + "loss": 2.7109, + "step": 721 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029973463597719854, + "loss": 2.6909, + "step": 722 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029973390060531043, + "loss": 2.6496, + "step": 723 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002997331642168117, + "loss": 2.6552, + "step": 724 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002997324268117075, + "loss": 2.6508, + "step": 725 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002997316883900027, + "loss": 2.6862, + "step": 726 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002997309489517024, + "loss": 2.6635, + "step": 727 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002997302084968115, + "loss": 2.7271, + "step": 728 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002997294670253352, + "loss": 2.7378, + "step": 729 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029972872453727845, + "loss": 2.6311, + "step": 730 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002997279810326462, + "loss": 2.6636, + "step": 731 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029972723651144363, + "loss": 2.6636, + "step": 732 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002997264909736758, + "loss": 2.6617, + "step": 733 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029972574441934765, + "loss": 2.6394, + "step": 734 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029972499684846436, + "loss": 2.6642, + "step": 735 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029972424826103095, + "loss": 2.6409, + "step": 736 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029972349865705256, + "loss": 2.693, + "step": 737 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002997227480365342, + "loss": 2.663, + "step": 738 + }, + { + "epoch": 0.06, + "learning_rate": 0.000299721996399481, + "loss": 2.6709, + "step": 739 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029972124374589806, + "loss": 2.6218, + "step": 740 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029972049007579056, + "loss": 2.6124, + "step": 741 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002997197353891635, + "loss": 2.6537, + "step": 742 + }, + { + "epoch": 0.06, + "learning_rate": 0.000299718979686022, + "loss": 2.6436, + "step": 743 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029971822296637136, + "loss": 2.7085, + "step": 744 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002997174652302166, + "loss": 2.6817, + "step": 745 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002997167064775628, + "loss": 2.6789, + "step": 746 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002997159467084152, + "loss": 2.63, + "step": 747 + }, + { + "epoch": 0.06, + "learning_rate": 0.000299715185922779, + "loss": 2.6452, + "step": 748 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002997144241206593, + "loss": 2.62, + "step": 749 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029971366130206124, + "loss": 2.5923, + "step": 750 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029971289746699004, + "loss": 2.6451, + "step": 751 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002997121326154509, + "loss": 2.686, + "step": 752 + }, + { + "epoch": 0.06, + "learning_rate": 0.000299711366747449, + "loss": 2.6839, + "step": 753 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029971059986298954, + "loss": 2.6962, + "step": 754 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002997098319620777, + "loss": 2.7167, + "step": 755 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002997090630447187, + "loss": 2.6266, + "step": 756 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029970829311091785, + "loss": 2.6245, + "step": 757 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002997075221606802, + "loss": 2.6621, + "step": 758 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029970675019401125, + "loss": 2.6386, + "step": 759 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029970597721091596, + "loss": 2.5819, + "step": 760 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029970520321139974, + "loss": 2.5905, + "step": 761 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002997044281954678, + "loss": 2.5932, + "step": 762 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002997036521631254, + "loss": 2.6202, + "step": 763 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029970287511437777, + "loss": 2.6357, + "step": 764 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029970209704923025, + "loss": 2.6803, + "step": 765 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029970131796768813, + "loss": 2.6636, + "step": 766 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002997005378697567, + "loss": 2.6329, + "step": 767 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002996997567554412, + "loss": 2.6367, + "step": 768 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029969897462474695, + "loss": 2.6472, + "step": 769 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002996981914776793, + "loss": 2.6662, + "step": 770 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002996974073142435, + "loss": 2.6139, + "step": 771 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029969662213444494, + "loss": 2.6069, + "step": 772 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002996958359382889, + "loss": 2.645, + "step": 773 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002996950487257808, + "loss": 2.6586, + "step": 774 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002996942604969259, + "loss": 2.5542, + "step": 775 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029969347125172955, + "loss": 2.5838, + "step": 776 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002996926809901972, + "loss": 2.5294, + "step": 777 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029969188971233407, + "loss": 2.5473, + "step": 778 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002996910974181457, + "loss": 2.619, + "step": 779 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029969030410763737, + "loss": 2.6307, + "step": 780 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002996895097808144, + "loss": 2.5601, + "step": 781 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029968871443768235, + "loss": 2.6346, + "step": 782 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002996879180782465, + "loss": 2.556, + "step": 783 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002996871207025123, + "loss": 2.6346, + "step": 784 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002996863223104852, + "loss": 2.6499, + "step": 785 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029968552290217046, + "loss": 2.5265, + "step": 786 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002996847224775737, + "loss": 2.6261, + "step": 787 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002996839210367003, + "loss": 2.5314, + "step": 788 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002996831185795556, + "loss": 2.5658, + "step": 789 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002996823151061452, + "loss": 2.5705, + "step": 790 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029968151061647444, + "loss": 2.6045, + "step": 791 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002996807051105488, + "loss": 2.5943, + "step": 792 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029967989858837386, + "loss": 2.6569, + "step": 793 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002996790910499549, + "loss": 2.5255, + "step": 794 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002996782824952976, + "loss": 2.5351, + "step": 795 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029967747292440736, + "loss": 2.6453, + "step": 796 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029967666233728964, + "loss": 2.6611, + "step": 797 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029967585073395, + "loss": 2.6491, + "step": 798 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029967503811439386, + "loss": 2.5658, + "step": 799 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002996742244786269, + "loss": 2.5757, + "step": 800 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002996734098266545, + "loss": 2.5302, + "step": 801 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002996725941584823, + "loss": 2.6165, + "step": 802 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002996717774741158, + "loss": 2.6171, + "step": 803 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002996709597735604, + "loss": 2.5399, + "step": 804 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002996701410568219, + "loss": 2.5831, + "step": 805 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002996693213239057, + "loss": 2.6413, + "step": 806 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002996685005748174, + "loss": 2.5815, + "step": 807 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029966767880956253, + "loss": 2.5611, + "step": 808 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002996668560281468, + "loss": 2.5994, + "step": 809 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002996660322305756, + "loss": 2.5329, + "step": 810 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029966520741685475, + "loss": 2.5664, + "step": 811 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029966438158698965, + "loss": 2.5142, + "step": 812 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029966355474098604, + "loss": 2.6147, + "step": 813 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029966272687884945, + "loss": 2.5826, + "step": 814 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002996618980005855, + "loss": 2.5187, + "step": 815 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002996610681062, + "loss": 2.5356, + "step": 816 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002996602371956983, + "loss": 2.5211, + "step": 817 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002996594052690862, + "loss": 2.6099, + "step": 818 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029965857232636936, + "loss": 2.5885, + "step": 819 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002996577383675534, + "loss": 2.5264, + "step": 820 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029965690339264393, + "loss": 2.5787, + "step": 821 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029965606740164674, + "loss": 2.5851, + "step": 822 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029965523039456743, + "loss": 2.5709, + "step": 823 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002996543923714117, + "loss": 2.6202, + "step": 824 + }, + { + "epoch": 0.06, + "learning_rate": 0.0002996535533321852, + "loss": 2.6058, + "step": 825 + }, + { + "epoch": 0.06, + "learning_rate": 0.00029965271327689363, + "loss": 2.5827, + "step": 826 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002996518722055428, + "loss": 2.5765, + "step": 827 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002996510301181383, + "loss": 2.596, + "step": 828 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002996501870146859, + "loss": 2.5547, + "step": 829 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029964934289519133, + "loss": 2.5631, + "step": 830 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002996484977596603, + "loss": 2.6027, + "step": 831 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002996476516080985, + "loss": 2.5882, + "step": 832 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029964680444051175, + "loss": 2.5488, + "step": 833 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002996459562569058, + "loss": 2.6001, + "step": 834 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002996451070572864, + "loss": 2.5521, + "step": 835 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002996442568416592, + "loss": 2.5387, + "step": 836 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029964340561003025, + "loss": 2.5248, + "step": 837 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002996425533624051, + "loss": 2.5476, + "step": 838 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002996417000987895, + "loss": 2.6041, + "step": 839 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002996408458191894, + "loss": 2.5255, + "step": 840 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029963999052361054, + "loss": 2.504, + "step": 841 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029963913421205877, + "loss": 2.5725, + "step": 842 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002996382768845398, + "loss": 2.5711, + "step": 843 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029963741854105945, + "loss": 2.5388, + "step": 844 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002996365591816237, + "loss": 2.5449, + "step": 845 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002996356988062382, + "loss": 2.5452, + "step": 846 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029963483741490897, + "loss": 2.5475, + "step": 847 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029963397500764173, + "loss": 2.5254, + "step": 848 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029963311158444237, + "loss": 2.5781, + "step": 849 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002996322471453168, + "loss": 2.5725, + "step": 850 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029963138169027077, + "loss": 2.5344, + "step": 851 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002996305152193103, + "loss": 2.5037, + "step": 852 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002996296477324412, + "loss": 2.526, + "step": 853 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002996287792296693, + "loss": 2.5008, + "step": 854 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002996279097110006, + "loss": 2.5345, + "step": 855 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029962703917644096, + "loss": 2.5446, + "step": 856 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002996261676259963, + "loss": 2.5178, + "step": 857 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029962529505967253, + "loss": 2.5473, + "step": 858 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029962442147747555, + "loss": 2.5066, + "step": 859 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002996235468794114, + "loss": 2.5714, + "step": 860 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002996226712654859, + "loss": 2.5312, + "step": 861 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029962179463570497, + "loss": 2.5288, + "step": 862 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002996209169900747, + "loss": 2.5205, + "step": 863 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029962003832860093, + "loss": 2.5438, + "step": 864 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029961915865128963, + "loss": 2.4147, + "step": 865 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002996182779581469, + "loss": 2.4565, + "step": 866 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002996173962491786, + "loss": 2.5225, + "step": 867 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002996165135243907, + "loss": 2.5473, + "step": 868 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002996156297837893, + "loss": 2.5291, + "step": 869 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002996147450273803, + "loss": 2.469, + "step": 870 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029961385925516973, + "loss": 2.4727, + "step": 871 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029961297246716364, + "loss": 2.545, + "step": 872 + }, + { + "epoch": 0.07, + "learning_rate": 0.000299612084663368, + "loss": 2.4788, + "step": 873 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029961119584378897, + "loss": 2.4692, + "step": 874 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029961030600843237, + "loss": 2.5087, + "step": 875 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002996094151573044, + "loss": 2.5419, + "step": 876 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002996085232904111, + "loss": 2.4337, + "step": 877 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002996076304077584, + "loss": 2.5069, + "step": 878 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002996067365093525, + "loss": 2.4574, + "step": 879 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002996058415951994, + "loss": 2.5347, + "step": 880 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029960494566530526, + "loss": 2.5104, + "step": 881 + }, + { + "epoch": 0.07, + "learning_rate": 0.000299604048719676, + "loss": 2.4503, + "step": 882 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029960315075831784, + "loss": 2.4959, + "step": 883 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002996022517812369, + "loss": 2.4698, + "step": 884 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002996013517884392, + "loss": 2.5045, + "step": 885 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002996004507799308, + "loss": 2.4809, + "step": 886 + }, + { + "epoch": 0.07, + "learning_rate": 0.000299599548755718, + "loss": 2.503, + "step": 887 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029959864571580677, + "loss": 2.4994, + "step": 888 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029959774166020333, + "loss": 2.5109, + "step": 889 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002995968365889137, + "loss": 2.5131, + "step": 890 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029959593050194415, + "loss": 2.5158, + "step": 891 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029959502339930083, + "loss": 2.4482, + "step": 892 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002995941152809898, + "loss": 2.4369, + "step": 893 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002995932061470173, + "loss": 2.5019, + "step": 894 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029959229599738947, + "loss": 2.5694, + "step": 895 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002995913848321125, + "loss": 2.4724, + "step": 896 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002995904726511926, + "loss": 2.4821, + "step": 897 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002995895594546359, + "loss": 2.4301, + "step": 898 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029958864524244866, + "loss": 2.4892, + "step": 899 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002995877300146371, + "loss": 2.4758, + "step": 900 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002995868137712074, + "loss": 2.5378, + "step": 901 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029958589651216577, + "loss": 2.5377, + "step": 902 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002995849782375184, + "loss": 2.5067, + "step": 903 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029958405894727163, + "loss": 2.4893, + "step": 904 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029958313864143164, + "loss": 2.4583, + "step": 905 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002995822173200047, + "loss": 2.5087, + "step": 906 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029958129498299706, + "loss": 2.4668, + "step": 907 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029958037163041495, + "loss": 2.4651, + "step": 908 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002995794472622646, + "loss": 2.4443, + "step": 909 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029957852187855247, + "loss": 2.4472, + "step": 910 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002995775954792846, + "loss": 2.4927, + "step": 911 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002995766680644675, + "loss": 2.4594, + "step": 912 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029957573963410733, + "loss": 2.4903, + "step": 913 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029957481018821045, + "loss": 2.4069, + "step": 914 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002995738797267831, + "loss": 2.4509, + "step": 915 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029957294824983164, + "loss": 2.4611, + "step": 916 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029957201575736244, + "loss": 2.4849, + "step": 917 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002995710822493818, + "loss": 2.439, + "step": 918 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029957014772589606, + "loss": 2.4639, + "step": 919 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002995692121869115, + "loss": 2.4206, + "step": 920 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029956827563243463, + "loss": 2.4601, + "step": 921 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002995673380624716, + "loss": 2.4707, + "step": 922 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029956639947702896, + "loss": 2.4538, + "step": 923 + }, + { + "epoch": 0.07, + "learning_rate": 0.000299565459876113, + "loss": 2.4373, + "step": 924 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029956451925973004, + "loss": 2.5479, + "step": 925 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002995635776278866, + "loss": 2.403, + "step": 926 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029956263498058896, + "loss": 2.4772, + "step": 927 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002995616913178435, + "loss": 2.4567, + "step": 928 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002995607466396568, + "loss": 2.419, + "step": 929 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029955980094603516, + "loss": 2.5241, + "step": 930 + }, + { + "epoch": 0.07, + "learning_rate": 0.000299558854236985, + "loss": 2.4799, + "step": 931 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002995579065125127, + "loss": 2.4064, + "step": 932 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029955695777262475, + "loss": 2.4598, + "step": 933 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029955600801732766, + "loss": 2.4473, + "step": 934 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029955505724662775, + "loss": 2.4555, + "step": 935 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002995541054605316, + "loss": 2.489, + "step": 936 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002995531526590455, + "loss": 2.468, + "step": 937 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002995521988421761, + "loss": 2.5146, + "step": 938 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002995512440099298, + "loss": 2.4364, + "step": 939 + }, + { + "epoch": 0.07, + "learning_rate": 0.000299550288162313, + "loss": 2.4377, + "step": 940 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029954933129933234, + "loss": 2.4465, + "step": 941 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002995483734209942, + "loss": 2.3763, + "step": 942 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002995474145273052, + "loss": 2.4142, + "step": 943 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002995464546182718, + "loss": 2.4981, + "step": 944 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002995454936939004, + "loss": 2.4564, + "step": 945 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002995445317541977, + "loss": 2.4549, + "step": 946 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029954356879917013, + "loss": 2.4502, + "step": 947 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029954260482882426, + "loss": 2.5091, + "step": 948 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029954163984316663, + "loss": 2.4336, + "step": 949 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029954067384220376, + "loss": 2.4883, + "step": 950 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029953970682594226, + "loss": 2.3717, + "step": 951 + }, + { + "epoch": 0.07, + "learning_rate": 0.0002995387387943887, + "loss": 2.4009, + "step": 952 + }, + { + "epoch": 0.07, + "learning_rate": 0.00029953776974754956, + "loss": 2.4802, + "step": 953 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002995367996854315, + "loss": 2.446, + "step": 954 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029953582860804115, + "loss": 2.4634, + "step": 955 + }, + { + "epoch": 0.08, + "learning_rate": 0.000299534856515385, + "loss": 2.5318, + "step": 956 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002995338834074697, + "loss": 2.4799, + "step": 957 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029953290928430186, + "loss": 2.4091, + "step": 958 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002995319341458881, + "loss": 2.4339, + "step": 959 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029953095799223497, + "loss": 2.4347, + "step": 960 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029952998082334923, + "loss": 2.5073, + "step": 961 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002995290026392374, + "loss": 2.4782, + "step": 962 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002995280234399061, + "loss": 2.4541, + "step": 963 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029952704322536215, + "loss": 2.4737, + "step": 964 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029952606199561203, + "loss": 2.4332, + "step": 965 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002995250797506625, + "loss": 2.4217, + "step": 966 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029952409649052007, + "loss": 2.4552, + "step": 967 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029952311221519167, + "loss": 2.4707, + "step": 968 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002995221269246838, + "loss": 2.4569, + "step": 969 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002995211406190032, + "loss": 2.4627, + "step": 970 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002995201532981566, + "loss": 2.371, + "step": 971 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029951916496215065, + "loss": 2.4857, + "step": 972 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002995181756109921, + "loss": 2.4537, + "step": 973 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002995171852446876, + "loss": 2.3908, + "step": 974 + }, + { + "epoch": 0.08, + "learning_rate": 0.000299516193863244, + "loss": 2.4091, + "step": 975 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029951520146666793, + "loss": 2.4143, + "step": 976 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002995142080549661, + "loss": 2.3941, + "step": 977 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029951321362814534, + "loss": 2.4339, + "step": 978 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029951221818621236, + "loss": 2.4741, + "step": 979 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029951122172917395, + "loss": 2.4196, + "step": 980 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029951022425703683, + "loss": 2.3997, + "step": 981 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002995092257698078, + "loss": 2.4117, + "step": 982 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002995082262674936, + "loss": 2.4115, + "step": 983 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002995072257501011, + "loss": 2.4152, + "step": 984 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029950622421763697, + "loss": 2.496, + "step": 985 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002995052216701082, + "loss": 2.4278, + "step": 986 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002995042181075214, + "loss": 2.4514, + "step": 987 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029950321352988345, + "loss": 2.4254, + "step": 988 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029950220793720125, + "loss": 2.391, + "step": 989 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002995012013294815, + "loss": 2.4277, + "step": 990 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029950019370673106, + "loss": 2.3824, + "step": 991 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002994991850689569, + "loss": 2.4789, + "step": 992 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029949817541616574, + "loss": 2.4771, + "step": 993 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029949716474836444, + "loss": 2.4451, + "step": 994 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002994961530655599, + "loss": 2.4752, + "step": 995 + }, + { + "epoch": 0.08, + "learning_rate": 0.000299495140367759, + "loss": 2.487, + "step": 996 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029949412665496855, + "loss": 2.4093, + "step": 997 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029949311192719555, + "loss": 2.4467, + "step": 998 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002994920961844468, + "loss": 2.3478, + "step": 999 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002994910794267292, + "loss": 2.4378, + "step": 1000 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002994900616540496, + "loss": 2.475, + "step": 1001 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029948904286641507, + "loss": 2.4273, + "step": 1002 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002994880230638324, + "loss": 2.4318, + "step": 1003 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029948700224630853, + "loss": 2.3908, + "step": 1004 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002994859804138504, + "loss": 2.4367, + "step": 1005 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029948495756646507, + "loss": 2.3635, + "step": 1006 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029948393370415926, + "loss": 2.3885, + "step": 1007 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029948290882694003, + "loss": 2.3733, + "step": 1008 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002994818829348144, + "loss": 2.4475, + "step": 1009 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002994808560277892, + "loss": 2.3787, + "step": 1010 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002994798281058716, + "loss": 2.435, + "step": 1011 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002994787991690683, + "loss": 2.4531, + "step": 1012 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029947776921738654, + "loss": 2.38, + "step": 1013 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002994767382508332, + "loss": 2.4337, + "step": 1014 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002994757062694153, + "loss": 2.4192, + "step": 1015 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002994746732731398, + "loss": 2.3856, + "step": 1016 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002994736392620138, + "loss": 2.4188, + "step": 1017 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002994726042360443, + "loss": 2.4096, + "step": 1018 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029947156819523825, + "loss": 2.4401, + "step": 1019 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002994705311396027, + "loss": 2.4234, + "step": 1020 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029946949306914483, + "loss": 2.398, + "step": 1021 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029946845398387155, + "loss": 2.3451, + "step": 1022 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002994674138837899, + "loss": 2.4133, + "step": 1023 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002994663727689071, + "loss": 2.3542, + "step": 1024 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029946533063923, + "loss": 2.3276, + "step": 1025 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029946428749476583, + "loss": 2.3944, + "step": 1026 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029946324333552163, + "loss": 2.4432, + "step": 1027 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002994621981615045, + "loss": 2.3894, + "step": 1028 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002994611519727215, + "loss": 2.4597, + "step": 1029 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029946010476917975, + "loss": 2.4048, + "step": 1030 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002994590565508864, + "loss": 2.4021, + "step": 1031 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029945800731784853, + "loss": 2.383, + "step": 1032 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002994569570700733, + "loss": 2.3822, + "step": 1033 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029945590580756774, + "loss": 2.3227, + "step": 1034 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029945485353033907, + "loss": 2.4405, + "step": 1035 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029945380023839446, + "loss": 2.3948, + "step": 1036 + }, + { + "epoch": 0.08, + "learning_rate": 0.000299452745931741, + "loss": 2.4439, + "step": 1037 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029945169061038583, + "loss": 2.371, + "step": 1038 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002994506342743362, + "loss": 2.3856, + "step": 1039 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029944957692359925, + "loss": 2.3976, + "step": 1040 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029944851855818214, + "loss": 2.4161, + "step": 1041 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029944745917809203, + "loss": 2.4012, + "step": 1042 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029944639878333614, + "loss": 2.3819, + "step": 1043 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029944533737392173, + "loss": 2.3812, + "step": 1044 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029944427494985585, + "loss": 2.4046, + "step": 1045 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029944321151114593, + "loss": 2.3437, + "step": 1046 + }, + { + "epoch": 0.08, + "learning_rate": 0.000299442147057799, + "loss": 2.3255, + "step": 1047 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002994410815898224, + "loss": 2.3473, + "step": 1048 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002994400151072233, + "loss": 2.3679, + "step": 1049 + }, + { + "epoch": 0.08, + "learning_rate": 0.000299438947610009, + "loss": 2.4013, + "step": 1050 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029943787909818666, + "loss": 2.3646, + "step": 1051 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002994368095717636, + "loss": 2.3633, + "step": 1052 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029943573903074705, + "loss": 2.3307, + "step": 1053 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029943466747514434, + "loss": 2.4129, + "step": 1054 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029943359490496274, + "loss": 2.3662, + "step": 1055 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002994325213202094, + "loss": 2.4338, + "step": 1056 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002994314467208918, + "loss": 2.382, + "step": 1057 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002994303711070171, + "loss": 2.4172, + "step": 1058 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002994292944785926, + "loss": 2.3932, + "step": 1059 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002994282168356257, + "loss": 2.3519, + "step": 1060 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002994271381781236, + "loss": 2.3415, + "step": 1061 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002994260585060938, + "loss": 2.3339, + "step": 1062 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029942497781954345, + "loss": 2.3717, + "step": 1063 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029942389611848, + "loss": 2.3452, + "step": 1064 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002994228134029107, + "loss": 2.387, + "step": 1065 + }, + { + "epoch": 0.08, + "learning_rate": 0.000299421729672843, + "loss": 2.4084, + "step": 1066 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029942064492828423, + "loss": 2.378, + "step": 1067 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029941955916924166, + "loss": 2.3161, + "step": 1068 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002994184723957228, + "loss": 2.3644, + "step": 1069 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029941738460773494, + "loss": 2.3616, + "step": 1070 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029941629580528553, + "loss": 2.4232, + "step": 1071 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029941520598838193, + "loss": 2.4228, + "step": 1072 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002994141151570315, + "loss": 2.3709, + "step": 1073 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002994130233112417, + "loss": 2.3049, + "step": 1074 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002994119304510199, + "loss": 2.3026, + "step": 1075 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029941083657637356, + "loss": 2.4302, + "step": 1076 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029940974168731014, + "loss": 2.3535, + "step": 1077 + }, + { + "epoch": 0.08, + "learning_rate": 0.00029940864578383697, + "loss": 2.3673, + "step": 1078 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002994075488659616, + "loss": 2.4297, + "step": 1079 + }, + { + "epoch": 0.08, + "learning_rate": 0.0002994064509336913, + "loss": 2.3842, + "step": 1080 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029940535198703374, + "loss": 2.4028, + "step": 1081 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002994042520259963, + "loss": 2.351, + "step": 1082 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002994031510505864, + "loss": 2.3518, + "step": 1083 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029940204906081156, + "loss": 2.3705, + "step": 1084 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029940094605667924, + "loss": 2.3662, + "step": 1085 + }, + { + "epoch": 0.09, + "learning_rate": 0.000299399842038197, + "loss": 2.3791, + "step": 1086 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029939873700537224, + "loss": 2.3287, + "step": 1087 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002993976309582125, + "loss": 2.3227, + "step": 1088 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029939652389672527, + "loss": 2.382, + "step": 1089 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002993954158209181, + "loss": 2.3469, + "step": 1090 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002993943067307985, + "loss": 2.3566, + "step": 1091 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029939319662637405, + "loss": 2.4023, + "step": 1092 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029939208550765217, + "loss": 2.3514, + "step": 1093 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029939097337464046, + "loss": 2.4021, + "step": 1094 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002993898602273465, + "loss": 2.3949, + "step": 1095 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002993887460657779, + "loss": 2.4319, + "step": 1096 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002993876308899421, + "loss": 2.304, + "step": 1097 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002993865146998467, + "loss": 2.3651, + "step": 1098 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029938539749549935, + "loss": 2.3467, + "step": 1099 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002993842792769075, + "loss": 2.3879, + "step": 1100 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029938316004407897, + "loss": 2.3875, + "step": 1101 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029938203979702115, + "loss": 2.3303, + "step": 1102 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002993809185357417, + "loss": 2.3821, + "step": 1103 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029937979626024823, + "loss": 2.2558, + "step": 1104 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002993786729705485, + "loss": 2.3245, + "step": 1105 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029937754866664985, + "loss": 2.3711, + "step": 1106 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029937642334856016, + "loss": 2.365, + "step": 1107 + }, + { + "epoch": 0.09, + "learning_rate": 0.000299375297016287, + "loss": 2.3451, + "step": 1108 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029937416966983795, + "loss": 2.3633, + "step": 1109 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029937304130922077, + "loss": 2.2995, + "step": 1110 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029937191193444304, + "loss": 2.3672, + "step": 1111 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029937078154551247, + "loss": 2.3361, + "step": 1112 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002993696501424367, + "loss": 2.3314, + "step": 1113 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002993685177252235, + "loss": 2.3841, + "step": 1114 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029936738429388044, + "loss": 2.4108, + "step": 1115 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029936624984841525, + "loss": 2.3474, + "step": 1116 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002993651143888357, + "loss": 2.3531, + "step": 1117 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029936397791514944, + "loss": 2.4115, + "step": 1118 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002993628404273642, + "loss": 2.3839, + "step": 1119 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002993617019254877, + "loss": 2.3253, + "step": 1120 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002993605624095276, + "loss": 2.4003, + "step": 1121 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029935942187949175, + "loss": 2.3408, + "step": 1122 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002993582803353879, + "loss": 2.3725, + "step": 1123 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002993571377772237, + "loss": 2.2697, + "step": 1124 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029935599420500696, + "loss": 2.3347, + "step": 1125 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002993548496187454, + "loss": 2.3484, + "step": 1126 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002993537040184469, + "loss": 2.297, + "step": 1127 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002993525574041192, + "loss": 2.3223, + "step": 1128 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029935140977576996, + "loss": 2.335, + "step": 1129 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029935026113340715, + "loss": 2.3161, + "step": 1130 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029934911147703845, + "loss": 2.3505, + "step": 1131 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029934796080667163, + "loss": 2.3098, + "step": 1132 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029934680912231464, + "loss": 2.3859, + "step": 1133 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029934565642397525, + "loss": 2.3531, + "step": 1134 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029934450271166125, + "loss": 2.3284, + "step": 1135 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002993433479853805, + "loss": 2.3244, + "step": 1136 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002993421922451408, + "loss": 2.3494, + "step": 1137 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002993410354909501, + "loss": 2.3158, + "step": 1138 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002993398777228161, + "loss": 2.3333, + "step": 1139 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002993387189407468, + "loss": 2.3285, + "step": 1140 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029933755914475, + "loss": 2.2959, + "step": 1141 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002993363983348335, + "loss": 2.3677, + "step": 1142 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002993352365110054, + "loss": 2.3779, + "step": 1143 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002993340736732734, + "loss": 2.3492, + "step": 1144 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002993329098216454, + "loss": 2.3765, + "step": 1145 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029933174495612935, + "loss": 2.2705, + "step": 1146 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029933057907673323, + "loss": 2.2813, + "step": 1147 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029932941218346486, + "loss": 2.3203, + "step": 1148 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002993282442763322, + "loss": 2.3697, + "step": 1149 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002993270753553431, + "loss": 2.345, + "step": 1150 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029932590542050563, + "loss": 2.3425, + "step": 1151 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002993247344718277, + "loss": 2.309, + "step": 1152 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029932356250931717, + "loss": 2.3064, + "step": 1153 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002993223895329821, + "loss": 2.3906, + "step": 1154 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002993212155428303, + "loss": 2.3233, + "step": 1155 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029932004053886995, + "loss": 2.2987, + "step": 1156 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029931886452110886, + "loss": 2.3208, + "step": 1157 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029931768748955515, + "loss": 2.3308, + "step": 1158 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002993165094442167, + "loss": 2.2566, + "step": 1159 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002993153303851016, + "loss": 2.2499, + "step": 1160 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029931415031221777, + "loss": 2.3562, + "step": 1161 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002993129692255732, + "loss": 2.4091, + "step": 1162 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029931178712517604, + "loss": 2.2999, + "step": 1163 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029931060401103423, + "loss": 2.3525, + "step": 1164 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002993094198831558, + "loss": 2.345, + "step": 1165 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002993082347415488, + "loss": 2.3671, + "step": 1166 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029930704858622127, + "loss": 2.3732, + "step": 1167 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029930586141718133, + "loss": 2.2735, + "step": 1168 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029930467323443697, + "loss": 2.3849, + "step": 1169 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002993034840379962, + "loss": 2.3249, + "step": 1170 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029930229382786724, + "loss": 2.2889, + "step": 1171 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002993011026040581, + "loss": 2.3531, + "step": 1172 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002992999103665768, + "loss": 2.3658, + "step": 1173 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002992987171154316, + "loss": 2.2872, + "step": 1174 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029929752285063043, + "loss": 2.227, + "step": 1175 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029929632757218146, + "loss": 2.3207, + "step": 1176 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029929513128009285, + "loss": 2.3177, + "step": 1177 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002992939339743726, + "loss": 2.3545, + "step": 1178 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002992927356550291, + "loss": 2.3748, + "step": 1179 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002992915363220701, + "loss": 2.3329, + "step": 1180 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029929033597550416, + "loss": 2.3714, + "step": 1181 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002992891346153391, + "loss": 2.3309, + "step": 1182 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002992879322415832, + "loss": 2.3011, + "step": 1183 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002992867288542447, + "loss": 2.3083, + "step": 1184 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029928552445333167, + "loss": 2.3324, + "step": 1185 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002992843190388522, + "loss": 2.2712, + "step": 1186 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029928311261081473, + "loss": 2.287, + "step": 1187 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002992819051692272, + "loss": 2.3039, + "step": 1188 + }, + { + "epoch": 0.09, + "learning_rate": 0.000299280696714098, + "loss": 2.31, + "step": 1189 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002992794872454352, + "loss": 2.3548, + "step": 1190 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002992782767632471, + "loss": 2.346, + "step": 1191 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029927706526754183, + "loss": 2.3461, + "step": 1192 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002992758527583277, + "loss": 2.3094, + "step": 1193 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002992746392356129, + "loss": 2.3003, + "step": 1194 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029927342469940565, + "loss": 2.2723, + "step": 1195 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029927220914971426, + "loss": 2.3339, + "step": 1196 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029927099258654694, + "loss": 2.2432, + "step": 1197 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029926977500991194, + "loss": 2.2951, + "step": 1198 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029926855641981755, + "loss": 2.3517, + "step": 1199 + }, + { + "epoch": 0.09, + "learning_rate": 0.000299267336816272, + "loss": 2.3117, + "step": 1200 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002992661161992836, + "loss": 2.38, + "step": 1201 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029926489456886076, + "loss": 2.2939, + "step": 1202 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029926367192501153, + "loss": 2.3006, + "step": 1203 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002992624482677444, + "loss": 2.2403, + "step": 1204 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002992612235970676, + "loss": 2.3654, + "step": 1205 + }, + { + "epoch": 0.09, + "learning_rate": 0.00029925999791298945, + "loss": 2.3106, + "step": 1206 + }, + { + "epoch": 0.09, + "learning_rate": 0.0002992587712155183, + "loss": 2.3772, + "step": 1207 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029925754350466243, + "loss": 2.3017, + "step": 1208 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029925631478043026, + "loss": 2.3505, + "step": 1209 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029925508504283004, + "loss": 2.3589, + "step": 1210 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002992538542918702, + "loss": 2.3399, + "step": 1211 + }, + { + "epoch": 0.1, + "learning_rate": 0.000299252622527559, + "loss": 2.303, + "step": 1212 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002992513897499049, + "loss": 2.3314, + "step": 1213 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002992501559589162, + "loss": 2.2983, + "step": 1214 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029924892115460133, + "loss": 2.3586, + "step": 1215 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002992476853369686, + "loss": 2.3238, + "step": 1216 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002992464485060265, + "loss": 2.2895, + "step": 1217 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029924521066178333, + "loss": 2.3198, + "step": 1218 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029924397180424757, + "loss": 2.3352, + "step": 1219 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002992427319334276, + "loss": 2.3122, + "step": 1220 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002992414910493318, + "loss": 2.2916, + "step": 1221 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002992402491519687, + "loss": 2.3309, + "step": 1222 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002992390062413466, + "loss": 2.3214, + "step": 1223 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029923776231747406, + "loss": 2.2273, + "step": 1224 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029923651738035945, + "loss": 2.2507, + "step": 1225 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029923527143001124, + "loss": 2.2916, + "step": 1226 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002992340244664379, + "loss": 2.3058, + "step": 1227 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029923277648964783, + "loss": 2.3431, + "step": 1228 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002992315274996496, + "loss": 2.2535, + "step": 1229 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002992302774964517, + "loss": 2.2523, + "step": 1230 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029922902648006253, + "loss": 2.2878, + "step": 1231 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029922777445049066, + "loss": 2.2703, + "step": 1232 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002992265214077445, + "loss": 2.3091, + "step": 1233 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002992252673518326, + "loss": 2.243, + "step": 1234 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002992240122827635, + "loss": 2.3052, + "step": 1235 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029922275620054573, + "loss": 2.2856, + "step": 1236 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002992214991051878, + "loss": 2.3244, + "step": 1237 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002992202409966982, + "loss": 2.3054, + "step": 1238 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029921898187508554, + "loss": 2.3059, + "step": 1239 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002992177217403583, + "loss": 2.2835, + "step": 1240 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002992164605925251, + "loss": 2.2558, + "step": 1241 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002992151984315944, + "loss": 2.2837, + "step": 1242 + }, + { + "epoch": 0.1, + "learning_rate": 0.000299213935257575, + "loss": 2.2823, + "step": 1243 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002992126710704752, + "loss": 2.2721, + "step": 1244 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029921140587030375, + "loss": 2.3294, + "step": 1245 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002992101396570692, + "loss": 2.2795, + "step": 1246 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029920887243078015, + "loss": 2.2918, + "step": 1247 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002992076041914452, + "loss": 2.2752, + "step": 1248 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029920633493907294, + "loss": 2.3004, + "step": 1249 + }, + { + "epoch": 0.1, + "learning_rate": 0.000299205064673672, + "loss": 2.2249, + "step": 1250 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029920379339525103, + "loss": 2.3005, + "step": 1251 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029920252110381866, + "loss": 2.2747, + "step": 1252 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029920124779938347, + "loss": 2.2074, + "step": 1253 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002991999734819541, + "loss": 2.2401, + "step": 1254 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029919869815153927, + "loss": 2.2449, + "step": 1255 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029919742180814767, + "loss": 2.362, + "step": 1256 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002991961444517879, + "loss": 2.2386, + "step": 1257 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002991948660824686, + "loss": 2.2823, + "step": 1258 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002991935867001985, + "loss": 2.2594, + "step": 1259 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002991923063049863, + "loss": 2.2936, + "step": 1260 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029919102489684064, + "loss": 2.3273, + "step": 1261 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002991897424757703, + "loss": 2.2155, + "step": 1262 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002991884590417839, + "loss": 2.2727, + "step": 1263 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002991871745948902, + "loss": 2.2812, + "step": 1264 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002991858891350979, + "loss": 2.3013, + "step": 1265 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002991846026624158, + "loss": 2.2453, + "step": 1266 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002991833151768525, + "loss": 2.3341, + "step": 1267 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002991820266784169, + "loss": 2.2844, + "step": 1268 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029918073716711757, + "loss": 2.276, + "step": 1269 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002991794466429634, + "loss": 2.2514, + "step": 1270 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002991781551059631, + "loss": 2.2779, + "step": 1271 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002991768625561255, + "loss": 2.2921, + "step": 1272 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002991755689934592, + "loss": 2.3068, + "step": 1273 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002991742744179733, + "loss": 2.2414, + "step": 1274 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002991729788296763, + "loss": 2.2875, + "step": 1275 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029917168222857706, + "loss": 2.3323, + "step": 1276 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002991703846146844, + "loss": 2.2571, + "step": 1277 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029916908598800725, + "loss": 2.286, + "step": 1278 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029916778634855423, + "loss": 2.3245, + "step": 1279 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029916648569633435, + "loss": 2.2922, + "step": 1280 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029916518403135623, + "loss": 2.3175, + "step": 1281 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002991638813536289, + "loss": 2.2577, + "step": 1282 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002991625776631611, + "loss": 2.2547, + "step": 1283 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029916127295996175, + "loss": 2.2539, + "step": 1284 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002991599672440397, + "loss": 2.2686, + "step": 1285 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002991586605154037, + "loss": 2.2998, + "step": 1286 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029915735277406276, + "loss": 2.2583, + "step": 1287 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002991560440200257, + "loss": 2.2717, + "step": 1288 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029915473425330143, + "loss": 2.3273, + "step": 1289 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029915342347389877, + "loss": 2.3117, + "step": 1290 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002991521116818267, + "loss": 2.2886, + "step": 1291 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002991507988770941, + "loss": 2.2959, + "step": 1292 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002991494850597099, + "loss": 2.2705, + "step": 1293 + }, + { + "epoch": 0.1, + "learning_rate": 0.000299148170229683, + "loss": 2.2778, + "step": 1294 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029914685438702237, + "loss": 2.2373, + "step": 1295 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002991455375317368, + "loss": 2.2591, + "step": 1296 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002991442196638354, + "loss": 2.2761, + "step": 1297 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029914290078332707, + "loss": 2.3094, + "step": 1298 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029914158089022075, + "loss": 2.2261, + "step": 1299 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002991402599845254, + "loss": 2.2192, + "step": 1300 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029913893806624996, + "loss": 2.2404, + "step": 1301 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002991376151354034, + "loss": 2.3354, + "step": 1302 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029913629119199476, + "loss": 2.2274, + "step": 1303 + }, + { + "epoch": 0.1, + "learning_rate": 0.000299134966236033, + "loss": 2.249, + "step": 1304 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029913364026752713, + "loss": 2.2798, + "step": 1305 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002991323132864862, + "loss": 2.2279, + "step": 1306 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002991309852929191, + "loss": 2.31, + "step": 1307 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029912965628683486, + "loss": 2.226, + "step": 1308 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029912832626824263, + "loss": 2.2669, + "step": 1309 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029912699523715135, + "loss": 2.2233, + "step": 1310 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029912566319357, + "loss": 2.2139, + "step": 1311 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002991243301375078, + "loss": 2.1867, + "step": 1312 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002991229960689736, + "loss": 2.3259, + "step": 1313 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029912166098797655, + "loss": 2.2711, + "step": 1314 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002991203248945258, + "loss": 2.2433, + "step": 1315 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029911898778863026, + "loss": 2.2516, + "step": 1316 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029911764967029906, + "loss": 2.3148, + "step": 1317 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002991163105395414, + "loss": 2.2438, + "step": 1318 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029911497039636624, + "loss": 2.3155, + "step": 1319 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002991136292407827, + "loss": 2.3223, + "step": 1320 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002991122870727999, + "loss": 2.2481, + "step": 1321 + }, + { + "epoch": 0.1, + "learning_rate": 0.000299110943892427, + "loss": 2.1777, + "step": 1322 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029910959969967304, + "loss": 2.237, + "step": 1323 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002991082544945472, + "loss": 2.2744, + "step": 1324 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002991069082770586, + "loss": 2.3008, + "step": 1325 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029910556104721637, + "loss": 2.2419, + "step": 1326 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002991042128050297, + "loss": 2.256, + "step": 1327 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029910286355050767, + "loss": 2.2861, + "step": 1328 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029910151328365947, + "loss": 2.2915, + "step": 1329 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029910016200449424, + "loss": 2.2158, + "step": 1330 + }, + { + "epoch": 0.1, + "learning_rate": 0.00029909880971302127, + "loss": 2.2429, + "step": 1331 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002990974564092496, + "loss": 2.3137, + "step": 1332 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002990961020931885, + "loss": 2.2434, + "step": 1333 + }, + { + "epoch": 0.1, + "learning_rate": 0.0002990947467648472, + "loss": 2.283, + "step": 1334 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002990933904242348, + "loss": 2.2016, + "step": 1335 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002990920330713605, + "loss": 2.2708, + "step": 1336 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029909067470623366, + "loss": 2.2704, + "step": 1337 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029908931532886333, + "loss": 2.2657, + "step": 1338 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002990879549392589, + "loss": 2.2082, + "step": 1339 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002990865935374295, + "loss": 2.156, + "step": 1340 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002990852311233844, + "loss": 2.2998, + "step": 1341 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029908386769713285, + "loss": 2.2839, + "step": 1342 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002990825032586841, + "loss": 2.238, + "step": 1343 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002990811378080475, + "loss": 2.3014, + "step": 1344 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029907977134523215, + "loss": 2.2402, + "step": 1345 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029907840387024745, + "loss": 2.1791, + "step": 1346 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002990770353831027, + "loss": 2.2696, + "step": 1347 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002990756658838071, + "loss": 2.2638, + "step": 1348 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029907429537237, + "loss": 2.2995, + "step": 1349 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002990729238488007, + "loss": 2.279, + "step": 1350 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029907155131310854, + "loss": 2.2776, + "step": 1351 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029907017776530277, + "loss": 2.2641, + "step": 1352 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002990688032053928, + "loss": 2.2566, + "step": 1353 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002990674276333879, + "loss": 2.1764, + "step": 1354 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002990660510492974, + "loss": 2.249, + "step": 1355 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002990646734531307, + "loss": 2.2813, + "step": 1356 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002990632948448971, + "loss": 2.2117, + "step": 1357 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029906191522460605, + "loss": 2.2857, + "step": 1358 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002990605345922668, + "loss": 2.2811, + "step": 1359 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002990591529478888, + "loss": 2.156, + "step": 1360 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002990577702914814, + "loss": 2.2633, + "step": 1361 + }, + { + "epoch": 0.11, + "learning_rate": 0.000299056386623054, + "loss": 2.2355, + "step": 1362 + }, + { + "epoch": 0.11, + "learning_rate": 0.000299055001942616, + "loss": 2.2899, + "step": 1363 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002990536162501768, + "loss": 2.1595, + "step": 1364 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029905222954574576, + "loss": 2.2554, + "step": 1365 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002990508418293324, + "loss": 2.2497, + "step": 1366 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029904945310094605, + "loss": 2.2659, + "step": 1367 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002990480633605961, + "loss": 2.1866, + "step": 1368 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002990466726082921, + "loss": 2.1895, + "step": 1369 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029904528084404345, + "loss": 2.2193, + "step": 1370 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002990438880678596, + "loss": 2.2468, + "step": 1371 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029904249427975, + "loss": 2.2725, + "step": 1372 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002990410994797241, + "loss": 2.3099, + "step": 1373 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002990397036677914, + "loss": 2.2717, + "step": 1374 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002990383068439613, + "loss": 2.306, + "step": 1375 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029903690900824343, + "loss": 2.2852, + "step": 1376 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002990355101606472, + "loss": 2.2374, + "step": 1377 + }, + { + "epoch": 0.11, + "learning_rate": 0.000299034110301182, + "loss": 2.2756, + "step": 1378 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002990327094298575, + "loss": 2.2199, + "step": 1379 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029903130754668317, + "loss": 2.2428, + "step": 1380 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029902990465166844, + "loss": 2.2253, + "step": 1381 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002990285007448229, + "loss": 2.2212, + "step": 1382 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002990270958261561, + "loss": 2.1472, + "step": 1383 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029902568989567755, + "loss": 2.1944, + "step": 1384 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002990242829533968, + "loss": 2.2057, + "step": 1385 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002990228749993235, + "loss": 2.2136, + "step": 1386 + }, + { + "epoch": 0.11, + "learning_rate": 0.000299021466033467, + "loss": 2.2321, + "step": 1387 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029902005605583705, + "loss": 2.2625, + "step": 1388 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029901864506644315, + "loss": 2.1827, + "step": 1389 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002990172330652949, + "loss": 2.2403, + "step": 1390 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029901582005240177, + "loss": 2.1749, + "step": 1391 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029901440602777353, + "loss": 2.2954, + "step": 1392 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002990129909914197, + "loss": 2.1392, + "step": 1393 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002990115749433499, + "loss": 2.2645, + "step": 1394 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002990101578835737, + "loss": 2.2146, + "step": 1395 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002990087398121008, + "loss": 2.1732, + "step": 1396 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002990073207289408, + "loss": 2.2542, + "step": 1397 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002990059006341033, + "loss": 2.2259, + "step": 1398 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002990044795275979, + "loss": 2.2574, + "step": 1399 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029900305740943446, + "loss": 2.2283, + "step": 1400 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002990016342796224, + "loss": 2.2289, + "step": 1401 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002990002101381714, + "loss": 2.2219, + "step": 1402 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002989987849850913, + "loss": 2.2482, + "step": 1403 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029899735882039165, + "loss": 2.2349, + "step": 1404 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002989959316440821, + "loss": 2.2729, + "step": 1405 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029899450345617244, + "loss": 2.2761, + "step": 1406 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002989930742566724, + "loss": 2.1782, + "step": 1407 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029899164404559146, + "loss": 2.1507, + "step": 1408 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029899021282293956, + "loss": 2.2426, + "step": 1409 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029898878058872634, + "loss": 2.2458, + "step": 1410 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029898734734296154, + "loss": 2.2228, + "step": 1411 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002989859130856548, + "loss": 2.1809, + "step": 1412 + }, + { + "epoch": 0.11, + "learning_rate": 0.000298984477816816, + "loss": 2.2409, + "step": 1413 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002989830415364548, + "loss": 2.1761, + "step": 1414 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002989816042445809, + "loss": 2.2293, + "step": 1415 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029898016594120415, + "loss": 2.2045, + "step": 1416 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029897872662633433, + "loss": 2.2635, + "step": 1417 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029897728629998114, + "loss": 2.2475, + "step": 1418 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002989758449621544, + "loss": 2.2031, + "step": 1419 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002989744026128638, + "loss": 2.1903, + "step": 1420 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002989729592521193, + "loss": 2.2399, + "step": 1421 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002989715148799306, + "loss": 2.2325, + "step": 1422 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029897006949630755, + "loss": 2.2861, + "step": 1423 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002989686231012599, + "loss": 2.2586, + "step": 1424 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002989671756947975, + "loss": 2.2288, + "step": 1425 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029896572727693024, + "loss": 2.2129, + "step": 1426 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029896427784766787, + "loss": 2.2348, + "step": 1427 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029896282740702023, + "loss": 2.2703, + "step": 1428 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002989613759549972, + "loss": 2.2204, + "step": 1429 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029895992349160866, + "loss": 2.223, + "step": 1430 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029895847001686445, + "loss": 2.1746, + "step": 1431 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002989570155307744, + "loss": 2.1627, + "step": 1432 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002989555600333484, + "loss": 2.2254, + "step": 1433 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029895410352459643, + "loss": 2.2195, + "step": 1434 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029895264600452825, + "loss": 2.2381, + "step": 1435 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029895118747315375, + "loss": 2.1993, + "step": 1436 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029894972793048294, + "loss": 2.2728, + "step": 1437 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029894826737652565, + "loss": 2.2043, + "step": 1438 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029894680581129185, + "loss": 2.1461, + "step": 1439 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002989453432347914, + "loss": 2.2156, + "step": 1440 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029894387964703433, + "loss": 2.1993, + "step": 1441 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029894241504803046, + "loss": 2.1735, + "step": 1442 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029894094943778976, + "loss": 2.1631, + "step": 1443 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029893948281632226, + "loss": 2.2642, + "step": 1444 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002989380151836378, + "loss": 2.2007, + "step": 1445 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002989365465397465, + "loss": 2.206, + "step": 1446 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029893507688465816, + "loss": 2.192, + "step": 1447 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029893360621838287, + "loss": 2.188, + "step": 1448 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029893213454093055, + "loss": 2.2701, + "step": 1449 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002989306618523112, + "loss": 2.2279, + "step": 1450 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029892918815253497, + "loss": 2.1853, + "step": 1451 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029892771344161166, + "loss": 2.2011, + "step": 1452 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002989262377195513, + "loss": 2.2103, + "step": 1453 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002989247609863641, + "loss": 2.2034, + "step": 1454 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029892328324205984, + "loss": 2.2322, + "step": 1455 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029892180448664875, + "loss": 2.2289, + "step": 1456 + }, + { + "epoch": 0.11, + "learning_rate": 0.00029892032472014074, + "loss": 2.1437, + "step": 1457 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002989188439425459, + "loss": 2.1984, + "step": 1458 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002989173621538743, + "loss": 2.2417, + "step": 1459 + }, + { + "epoch": 0.11, + "learning_rate": 0.000298915879354136, + "loss": 2.2136, + "step": 1460 + }, + { + "epoch": 0.11, + "learning_rate": 0.0002989143955433411, + "loss": 2.184, + "step": 1461 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002989129107214996, + "loss": 2.2474, + "step": 1462 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002989114248886216, + "loss": 2.2761, + "step": 1463 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002989099380447172, + "loss": 2.2075, + "step": 1464 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029890845018979654, + "loss": 2.1724, + "step": 1465 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002989069613238696, + "loss": 2.2103, + "step": 1466 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002989054714469466, + "loss": 2.2627, + "step": 1467 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002989039805590376, + "loss": 2.1205, + "step": 1468 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002989024886601528, + "loss": 2.2104, + "step": 1469 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029890099575030226, + "loss": 2.2042, + "step": 1470 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029889950182949613, + "loss": 2.166, + "step": 1471 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002988980068977445, + "loss": 2.2088, + "step": 1472 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002988965109550576, + "loss": 2.1938, + "step": 1473 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002988950140014456, + "loss": 2.169, + "step": 1474 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002988935160369186, + "loss": 2.2156, + "step": 1475 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029889201706148676, + "loss": 2.2353, + "step": 1476 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002988905170751603, + "loss": 2.1904, + "step": 1477 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002988890160779494, + "loss": 2.243, + "step": 1478 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029888751406986427, + "loss": 2.1584, + "step": 1479 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029888601105091506, + "loss": 2.2631, + "step": 1480 + }, + { + "epoch": 0.12, + "learning_rate": 0.000298884507021112, + "loss": 2.2254, + "step": 1481 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029888300198046533, + "loss": 2.2107, + "step": 1482 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002988814959289852, + "loss": 2.1813, + "step": 1483 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029887998886668184, + "loss": 2.2832, + "step": 1484 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002988784807935656, + "loss": 2.1508, + "step": 1485 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029887697170964656, + "loss": 2.2261, + "step": 1486 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029887546161493507, + "loss": 2.1346, + "step": 1487 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029887395050944135, + "loss": 2.2042, + "step": 1488 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002988724383931756, + "loss": 2.2109, + "step": 1489 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002988709252661482, + "loss": 2.1533, + "step": 1490 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002988694111283694, + "loss": 2.1824, + "step": 1491 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002988678959798494, + "loss": 2.2079, + "step": 1492 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002988663798205986, + "loss": 2.2151, + "step": 1493 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002988648626506272, + "loss": 2.1928, + "step": 1494 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029886334446994553, + "loss": 2.2146, + "step": 1495 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002988618252785639, + "loss": 2.1861, + "step": 1496 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029886030507649263, + "loss": 2.2149, + "step": 1497 + }, + { + "epoch": 0.12, + "learning_rate": 0.000298858783863742, + "loss": 2.1886, + "step": 1498 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029885726164032245, + "loss": 2.1713, + "step": 1499 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002988557384062442, + "loss": 2.1847, + "step": 1500 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002988542141615176, + "loss": 2.2112, + "step": 1501 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029885268890615305, + "loss": 2.1595, + "step": 1502 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029885116264016093, + "loss": 2.1959, + "step": 1503 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029884963536355155, + "loss": 2.1425, + "step": 1504 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002988481070763352, + "loss": 2.1818, + "step": 1505 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002988465777785224, + "loss": 2.1529, + "step": 1506 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002988450474701235, + "loss": 2.2113, + "step": 1507 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029884351615114887, + "loss": 2.203, + "step": 1508 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029884198382160886, + "loss": 2.1563, + "step": 1509 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029884045048151394, + "loss": 2.1907, + "step": 1510 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002988389161308745, + "loss": 2.1973, + "step": 1511 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029883738076970096, + "loss": 2.2092, + "step": 1512 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029883584439800373, + "loss": 2.1936, + "step": 1513 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029883430701579326, + "loss": 2.212, + "step": 1514 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029883276862307997, + "loss": 2.168, + "step": 1515 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002988312292198743, + "loss": 2.183, + "step": 1516 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002988296888061868, + "loss": 2.2227, + "step": 1517 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029882814738202776, + "loss": 2.2064, + "step": 1518 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029882660494740773, + "loss": 2.2372, + "step": 1519 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029882506150233725, + "loss": 2.1928, + "step": 1520 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029882351704682667, + "loss": 2.1667, + "step": 1521 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002988219715808865, + "loss": 2.1858, + "step": 1522 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029882042510452736, + "loss": 2.2124, + "step": 1523 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029881887761775956, + "loss": 2.194, + "step": 1524 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002988173291205938, + "loss": 2.1799, + "step": 1525 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002988157796130405, + "loss": 2.1445, + "step": 1526 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029881422909511007, + "loss": 2.212, + "step": 1527 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029881267756681323, + "loss": 2.1268, + "step": 1528 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002988111250281604, + "loss": 2.2192, + "step": 1529 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002988095714791622, + "loss": 2.2349, + "step": 1530 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002988080169198291, + "loss": 2.2881, + "step": 1531 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002988064613501717, + "loss": 2.1888, + "step": 1532 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002988049047702005, + "loss": 2.1631, + "step": 1533 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002988033471799262, + "loss": 2.1618, + "step": 1534 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002988017885793592, + "loss": 2.1457, + "step": 1535 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029880022896851017, + "loss": 2.2007, + "step": 1536 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029879866834738977, + "loss": 2.1804, + "step": 1537 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029879710671600854, + "loss": 2.2279, + "step": 1538 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029879554407437694, + "loss": 2.2549, + "step": 1539 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002987939804225058, + "loss": 2.1679, + "step": 1540 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029879241576040563, + "loss": 2.2338, + "step": 1541 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002987908500880871, + "loss": 2.1545, + "step": 1542 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002987892834055608, + "loss": 2.1905, + "step": 1543 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002987877157128373, + "loss": 2.2264, + "step": 1544 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002987861470099274, + "loss": 2.1504, + "step": 1545 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029878457729684164, + "loss": 2.1733, + "step": 1546 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002987830065735907, + "loss": 2.1416, + "step": 1547 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029878143484018526, + "loss": 2.1406, + "step": 1548 + }, + { + "epoch": 0.12, + "learning_rate": 0.000298779862096636, + "loss": 2.1978, + "step": 1549 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029877828834295355, + "loss": 2.2242, + "step": 1550 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029877671357914857, + "loss": 2.179, + "step": 1551 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002987751378052319, + "loss": 2.23, + "step": 1552 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029877356102121414, + "loss": 2.1981, + "step": 1553 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029877198322710594, + "loss": 2.2069, + "step": 1554 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029877040442291813, + "loss": 2.1688, + "step": 1555 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029876882460866134, + "loss": 2.163, + "step": 1556 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029876724378434636, + "loss": 2.1265, + "step": 1557 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029876566194998386, + "loss": 2.1042, + "step": 1558 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029876407910558463, + "loss": 2.2501, + "step": 1559 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029876249525115936, + "loss": 2.191, + "step": 1560 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029876091038671883, + "loss": 2.2461, + "step": 1561 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002987593245122739, + "loss": 2.1558, + "step": 1562 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002987577376278352, + "loss": 2.1951, + "step": 1563 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029875614973341356, + "loss": 2.1827, + "step": 1564 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002987545608290197, + "loss": 2.1871, + "step": 1565 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029875297091466453, + "loss": 2.1709, + "step": 1566 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029875137999035877, + "loss": 2.166, + "step": 1567 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002987497880561132, + "loss": 2.2106, + "step": 1568 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029874819511193864, + "loss": 2.1877, + "step": 1569 + }, + { + "epoch": 0.12, + "learning_rate": 0.000298746601157846, + "loss": 2.1716, + "step": 1570 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002987450061938459, + "loss": 2.2267, + "step": 1571 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002987434102199494, + "loss": 2.2037, + "step": 1572 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002987418132361672, + "loss": 2.105, + "step": 1573 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029874021524251015, + "loss": 2.1917, + "step": 1574 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029873861623898914, + "loss": 2.1727, + "step": 1575 + }, + { + "epoch": 0.12, + "learning_rate": 0.000298737016225615, + "loss": 2.1393, + "step": 1576 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002987354152023986, + "loss": 2.1622, + "step": 1577 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002987338131693508, + "loss": 2.1551, + "step": 1578 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002987322101264825, + "loss": 2.1921, + "step": 1579 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029873060607380457, + "loss": 2.1609, + "step": 1580 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002987290010113279, + "loss": 2.1404, + "step": 1581 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002987273949390634, + "loss": 2.1939, + "step": 1582 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029872578785702193, + "loss": 2.1734, + "step": 1583 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002987241797652145, + "loss": 2.1535, + "step": 1584 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002987225706636519, + "loss": 2.1899, + "step": 1585 + }, + { + "epoch": 0.12, + "learning_rate": 0.0002987209605523451, + "loss": 2.1826, + "step": 1586 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029871934943130504, + "loss": 2.2027, + "step": 1587 + }, + { + "epoch": 0.12, + "learning_rate": 0.00029871773730054277, + "loss": 2.2024, + "step": 1588 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029871612416006903, + "loss": 2.1965, + "step": 1589 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029871451000989494, + "loss": 2.1987, + "step": 1590 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029871289485003134, + "loss": 2.1309, + "step": 1591 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002987112786804893, + "loss": 2.136, + "step": 1592 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002987096615012797, + "loss": 2.1502, + "step": 1593 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002987080433124136, + "loss": 2.1717, + "step": 1594 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029870642411390197, + "loss": 2.1368, + "step": 1595 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002987048039057557, + "loss": 2.1807, + "step": 1596 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029870318268798593, + "loss": 2.0779, + "step": 1597 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029870156046060367, + "loss": 2.1779, + "step": 1598 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029869993722361977, + "loss": 2.1772, + "step": 1599 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002986983129770454, + "loss": 2.1448, + "step": 1600 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002986966877208915, + "loss": 2.217, + "step": 1601 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002986950614551692, + "loss": 2.1402, + "step": 1602 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002986934341798895, + "loss": 2.1366, + "step": 1603 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029869180589506343, + "loss": 2.1701, + "step": 1604 + }, + { + "epoch": 0.13, + "learning_rate": 0.000298690176600702, + "loss": 2.1613, + "step": 1605 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002986885462968164, + "loss": 2.1917, + "step": 1606 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002986869149834176, + "loss": 2.104, + "step": 1607 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029868528266051666, + "loss": 2.1767, + "step": 1608 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029868364932812474, + "loss": 2.1956, + "step": 1609 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029868201498625284, + "loss": 2.1908, + "step": 1610 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029868037963491216, + "loss": 2.0974, + "step": 1611 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002986787432741138, + "loss": 2.1681, + "step": 1612 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002986771059038687, + "loss": 2.1826, + "step": 1613 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029867546752418813, + "loss": 2.2034, + "step": 1614 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029867382813508325, + "loss": 2.1469, + "step": 1615 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029867218773656505, + "loss": 2.1692, + "step": 1616 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029867054632864477, + "loss": 2.1702, + "step": 1617 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029866890391133357, + "loss": 2.1748, + "step": 1618 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002986672604846425, + "loss": 2.0923, + "step": 1619 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002986656160485828, + "loss": 2.0945, + "step": 1620 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002986639706031655, + "loss": 2.1307, + "step": 1621 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029866232414840196, + "loss": 2.1507, + "step": 1622 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029866067668430333, + "loss": 2.1876, + "step": 1623 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002986590282108807, + "loss": 2.2496, + "step": 1624 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002986573787281453, + "loss": 2.1585, + "step": 1625 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029865572823610834, + "loss": 2.1524, + "step": 1626 + }, + { + "epoch": 0.13, + "learning_rate": 0.000298654076734781, + "loss": 2.1303, + "step": 1627 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002986524242241745, + "loss": 2.1074, + "step": 1628 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029865077070430015, + "loss": 2.197, + "step": 1629 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029864911617516905, + "loss": 2.1973, + "step": 1630 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029864746063679247, + "loss": 2.1203, + "step": 1631 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002986458040891817, + "loss": 2.1545, + "step": 1632 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002986441465323479, + "loss": 2.1817, + "step": 1633 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029864248796630246, + "loss": 2.1906, + "step": 1634 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029864082839105646, + "loss": 2.1046, + "step": 1635 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002986391678066213, + "loss": 2.1656, + "step": 1636 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029863750621300823, + "loss": 2.2246, + "step": 1637 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002986358436102285, + "loss": 2.1789, + "step": 1638 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002986341799982934, + "loss": 2.1392, + "step": 1639 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002986325153772142, + "loss": 2.1503, + "step": 1640 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029863084974700234, + "loss": 2.231, + "step": 1641 + }, + { + "epoch": 0.13, + "learning_rate": 0.000298629183107669, + "loss": 2.1608, + "step": 1642 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002986275154592255, + "loss": 2.1695, + "step": 1643 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029862584680168325, + "loss": 2.1409, + "step": 1644 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029862417713505347, + "loss": 2.11, + "step": 1645 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002986225064593475, + "loss": 2.1576, + "step": 1646 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002986208347745768, + "loss": 2.1858, + "step": 1647 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029861916208075265, + "loss": 2.1326, + "step": 1648 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029861748837788635, + "loss": 2.1728, + "step": 1649 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002986158136659894, + "loss": 2.1791, + "step": 1650 + }, + { + "epoch": 0.13, + "learning_rate": 0.000298614137945073, + "loss": 2.1387, + "step": 1651 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029861246121514867, + "loss": 2.1347, + "step": 1652 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029861078347622773, + "loss": 2.212, + "step": 1653 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002986091047283216, + "loss": 2.136, + "step": 1654 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002986074249714416, + "loss": 2.1591, + "step": 1655 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029860574420559924, + "loss": 2.1468, + "step": 1656 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029860406243080586, + "loss": 2.1566, + "step": 1657 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002986023796470729, + "loss": 2.1466, + "step": 1658 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029860069585441185, + "loss": 2.1327, + "step": 1659 + }, + { + "epoch": 0.13, + "learning_rate": 0.000298599011052834, + "loss": 2.1703, + "step": 1660 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002985973252423509, + "loss": 2.1211, + "step": 1661 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029859563842297396, + "loss": 2.0964, + "step": 1662 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029859395059471464, + "loss": 2.1919, + "step": 1663 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002985922617575844, + "loss": 2.1765, + "step": 1664 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002985905719115947, + "loss": 2.0886, + "step": 1665 + }, + { + "epoch": 0.13, + "learning_rate": 0.000298588881056757, + "loss": 2.1489, + "step": 1666 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002985871891930828, + "loss": 2.1171, + "step": 1667 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002985854963205836, + "loss": 2.1176, + "step": 1668 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002985838024392709, + "loss": 2.194, + "step": 1669 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029858210754915614, + "loss": 2.1693, + "step": 1670 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029858041165025084, + "loss": 2.1486, + "step": 1671 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002985787147425666, + "loss": 2.1522, + "step": 1672 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002985770168261148, + "loss": 2.0775, + "step": 1673 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002985753179009071, + "loss": 2.129, + "step": 1674 + }, + { + "epoch": 0.13, + "learning_rate": 0.000298573617966955, + "loss": 2.1159, + "step": 1675 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029857191702426997, + "loss": 2.1265, + "step": 1676 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029857021507286366, + "loss": 2.1547, + "step": 1677 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002985685121127476, + "loss": 2.1417, + "step": 1678 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002985668081439333, + "loss": 2.1155, + "step": 1679 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002985651031664323, + "loss": 2.1564, + "step": 1680 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002985633971802563, + "loss": 2.1448, + "step": 1681 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029856169018541677, + "loss": 2.1477, + "step": 1682 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029855998218192536, + "loss": 2.1409, + "step": 1683 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002985582731697937, + "loss": 2.2081, + "step": 1684 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002985565631490333, + "loss": 2.1486, + "step": 1685 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029855485211965584, + "loss": 2.1437, + "step": 1686 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002985531400816729, + "loss": 2.1065, + "step": 1687 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002985514270350962, + "loss": 2.1489, + "step": 1688 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029854971297993714, + "loss": 2.1137, + "step": 1689 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002985479979162076, + "loss": 2.0653, + "step": 1690 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002985462818439191, + "loss": 2.1414, + "step": 1691 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029854456476308334, + "loss": 2.1617, + "step": 1692 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029854284667371194, + "loss": 2.0816, + "step": 1693 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002985411275758166, + "loss": 2.1953, + "step": 1694 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002985394074694089, + "loss": 2.1632, + "step": 1695 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002985376863545007, + "loss": 2.1247, + "step": 1696 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029853596423110355, + "loss": 2.1243, + "step": 1697 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029853424109922916, + "loss": 2.1436, + "step": 1698 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002985325169588892, + "loss": 2.0919, + "step": 1699 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002985307918100955, + "loss": 2.114, + "step": 1700 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029852906565285963, + "loss": 2.1471, + "step": 1701 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002985273384871934, + "loss": 2.1755, + "step": 1702 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002985256103131085, + "loss": 2.0671, + "step": 1703 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002985238811306167, + "loss": 2.1626, + "step": 1704 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029852215093972964, + "loss": 2.109, + "step": 1705 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029852041974045917, + "loss": 2.1473, + "step": 1706 + }, + { + "epoch": 0.13, + "learning_rate": 0.000298518687532817, + "loss": 2.1695, + "step": 1707 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002985169543168149, + "loss": 2.0578, + "step": 1708 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029851522009246466, + "loss": 2.1915, + "step": 1709 + }, + { + "epoch": 0.13, + "learning_rate": 0.000298513484859778, + "loss": 2.1502, + "step": 1710 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002985117486187668, + "loss": 2.1214, + "step": 1711 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002985100113694427, + "loss": 2.1327, + "step": 1712 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002985082731118176, + "loss": 2.1127, + "step": 1713 + }, + { + "epoch": 0.13, + "learning_rate": 0.00029850653384590333, + "loss": 2.1345, + "step": 1714 + }, + { + "epoch": 0.13, + "learning_rate": 0.0002985047935717116, + "loss": 2.1206, + "step": 1715 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002985030522892543, + "loss": 2.1727, + "step": 1716 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002985013099985432, + "loss": 2.1201, + "step": 1717 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029849956669959017, + "loss": 2.1598, + "step": 1718 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029849782239240705, + "loss": 2.1567, + "step": 1719 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002984960770770056, + "loss": 2.0893, + "step": 1720 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002984943307533978, + "loss": 2.1736, + "step": 1721 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002984925834215954, + "loss": 2.1083, + "step": 1722 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029849083508161036, + "loss": 2.2107, + "step": 1723 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029848908573345444, + "loss": 2.1482, + "step": 1724 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002984873353771396, + "loss": 2.0993, + "step": 1725 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029848558401267765, + "loss": 2.1198, + "step": 1726 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002984838316400806, + "loss": 2.1393, + "step": 1727 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029848207825936023, + "loss": 2.1333, + "step": 1728 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029848032387052843, + "loss": 2.1517, + "step": 1729 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029847856847359727, + "loss": 2.076, + "step": 1730 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002984768120685785, + "loss": 2.1096, + "step": 1731 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002984750546554841, + "loss": 2.0964, + "step": 1732 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002984732962343261, + "loss": 2.1119, + "step": 1733 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002984715368051163, + "loss": 2.1913, + "step": 1734 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002984697763678667, + "loss": 2.0996, + "step": 1735 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029846801492258924, + "loss": 2.1228, + "step": 1736 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002984662524692959, + "loss": 2.1225, + "step": 1737 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002984644890079986, + "loss": 2.0825, + "step": 1738 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002984627245387094, + "loss": 2.1463, + "step": 1739 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002984609590614402, + "loss": 2.1498, + "step": 1740 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029845919257620303, + "loss": 2.1505, + "step": 1741 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029845742508300994, + "loss": 2.1349, + "step": 1742 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029845565658187273, + "loss": 2.0794, + "step": 1743 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002984538870728036, + "loss": 2.1205, + "step": 1744 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002984521165558145, + "loss": 2.144, + "step": 1745 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029845034503091743, + "loss": 2.1375, + "step": 1746 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029844857249812447, + "loss": 2.2027, + "step": 1747 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002984467989574476, + "loss": 2.2231, + "step": 1748 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029844502440889894, + "loss": 2.165, + "step": 1749 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002984432488524904, + "loss": 2.0761, + "step": 1750 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029844147228823417, + "loss": 2.1433, + "step": 1751 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002984396947161422, + "loss": 2.1032, + "step": 1752 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002984379161362267, + "loss": 2.1027, + "step": 1753 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002984361365484996, + "loss": 2.0934, + "step": 1754 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002984343559529731, + "loss": 2.1541, + "step": 1755 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002984325743496592, + "loss": 2.1226, + "step": 1756 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002984307917385701, + "loss": 2.0648, + "step": 1757 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029842900811971775, + "loss": 2.1117, + "step": 1758 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029842722349311435, + "loss": 2.106, + "step": 1759 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029842543785877203, + "loss": 2.0773, + "step": 1760 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029842365121670293, + "loss": 2.167, + "step": 1761 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002984218635669191, + "loss": 2.1321, + "step": 1762 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029842007490943275, + "loss": 2.1468, + "step": 1763 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029841828524425595, + "loss": 2.105, + "step": 1764 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029841649457140095, + "loss": 2.1599, + "step": 1765 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002984147028908798, + "loss": 2.09, + "step": 1766 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002984129102027048, + "loss": 2.1181, + "step": 1767 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029841111650688796, + "loss": 2.1486, + "step": 1768 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029840932180344156, + "loss": 2.1206, + "step": 1769 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029840752609237777, + "loss": 2.1056, + "step": 1770 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002984057293737088, + "loss": 2.1371, + "step": 1771 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029840393164744683, + "loss": 2.1292, + "step": 1772 + }, + { + "epoch": 0.14, + "learning_rate": 0.000298402132913604, + "loss": 2.1206, + "step": 1773 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002984003331721927, + "loss": 2.1644, + "step": 1774 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029839853242322493, + "loss": 2.1951, + "step": 1775 + }, + { + "epoch": 0.14, + "learning_rate": 0.000298396730666713, + "loss": 2.1413, + "step": 1776 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002983949279026692, + "loss": 2.0627, + "step": 1777 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029839312413110577, + "loss": 2.1125, + "step": 1778 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029839131935203484, + "loss": 2.1571, + "step": 1779 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002983895135654688, + "loss": 2.102, + "step": 1780 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002983877067714198, + "loss": 2.1605, + "step": 1781 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002983858989699002, + "loss": 2.1056, + "step": 1782 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029838409016092225, + "loss": 2.1043, + "step": 1783 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002983822803444982, + "loss": 2.1526, + "step": 1784 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002983804695206403, + "loss": 2.1203, + "step": 1785 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029837865768936095, + "loss": 2.1357, + "step": 1786 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002983768448506723, + "loss": 2.074, + "step": 1787 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002983750310045869, + "loss": 2.1207, + "step": 1788 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029837321615111686, + "loss": 2.1483, + "step": 1789 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002983714002902746, + "loss": 2.0702, + "step": 1790 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002983695834220723, + "loss": 2.1475, + "step": 1791 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029836776554652245, + "loss": 2.0906, + "step": 1792 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002983659466636374, + "loss": 2.0866, + "step": 1793 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002983641267734294, + "loss": 2.1692, + "step": 1794 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029836230587591085, + "loss": 2.1635, + "step": 1795 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029836048397109417, + "loss": 2.1463, + "step": 1796 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002983586610589916, + "loss": 2.1025, + "step": 1797 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002983568371396156, + "loss": 2.083, + "step": 1798 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002983550122129786, + "loss": 2.1, + "step": 1799 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002983531862790929, + "loss": 2.1389, + "step": 1800 + }, + { + "epoch": 0.14, + "learning_rate": 0.000298351359337971, + "loss": 2.1027, + "step": 1801 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029834953138962517, + "loss": 2.1155, + "step": 1802 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002983477024340679, + "loss": 2.1127, + "step": 1803 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002983458724713116, + "loss": 2.1712, + "step": 1804 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029834404150136867, + "loss": 2.1102, + "step": 1805 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029834220952425157, + "loss": 2.1189, + "step": 1806 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002983403765399728, + "loss": 2.1613, + "step": 1807 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029833854254854465, + "loss": 2.0533, + "step": 1808 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029833670754997966, + "loss": 2.0744, + "step": 1809 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002983348715442903, + "loss": 2.086, + "step": 1810 + }, + { + "epoch": 0.14, + "learning_rate": 0.000298333034531489, + "loss": 2.1715, + "step": 1811 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002983311965115883, + "loss": 2.0703, + "step": 1812 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029832935748460063, + "loss": 2.1604, + "step": 1813 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002983275174505384, + "loss": 2.1146, + "step": 1814 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029832567640941427, + "loss": 2.1245, + "step": 1815 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002983238343612406, + "loss": 2.1382, + "step": 1816 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029832199130603, + "loss": 2.0584, + "step": 1817 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002983201472437948, + "loss": 2.1155, + "step": 1818 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002983183021745478, + "loss": 2.1389, + "step": 1819 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029831645609830135, + "loss": 2.0812, + "step": 1820 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002983146090150679, + "loss": 2.0847, + "step": 1821 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029831276092486024, + "loss": 2.0771, + "step": 1822 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002983109118276907, + "loss": 2.0103, + "step": 1823 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029830906172357197, + "loss": 2.136, + "step": 1824 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029830721061251646, + "loss": 2.0985, + "step": 1825 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002983053584945369, + "loss": 2.0993, + "step": 1826 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002983035053696458, + "loss": 2.1484, + "step": 1827 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002983016512378557, + "loss": 2.0569, + "step": 1828 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002982997960991793, + "loss": 2.1837, + "step": 1829 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002982979399536291, + "loss": 2.0861, + "step": 1830 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029829608280121763, + "loss": 2.1901, + "step": 1831 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002982942246419577, + "loss": 2.1696, + "step": 1832 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002982923654758618, + "loss": 2.0924, + "step": 1833 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002982905053029425, + "loss": 2.1322, + "step": 1834 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029828864412321257, + "loss": 2.1428, + "step": 1835 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002982867819366846, + "loss": 2.1243, + "step": 1836 + }, + { + "epoch": 0.14, + "learning_rate": 0.00029828491874337115, + "loss": 2.0579, + "step": 1837 + }, + { + "epoch": 0.14, + "learning_rate": 0.000298283054543285, + "loss": 2.0992, + "step": 1838 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002982811893364387, + "loss": 2.0864, + "step": 1839 + }, + { + "epoch": 0.14, + "learning_rate": 0.000298279323122845, + "loss": 2.1639, + "step": 1840 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002982774559025164, + "loss": 2.042, + "step": 1841 + }, + { + "epoch": 0.14, + "learning_rate": 0.0002982755876754658, + "loss": 2.0863, + "step": 1842 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029827371844170575, + "loss": 2.1037, + "step": 1843 + }, + { + "epoch": 0.15, + "learning_rate": 0.000298271848201249, + "loss": 2.1247, + "step": 1844 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029826997695410826, + "loss": 2.1401, + "step": 1845 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029826810470029615, + "loss": 2.099, + "step": 1846 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029826623143982547, + "loss": 2.0617, + "step": 1847 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002982643571727088, + "loss": 2.1113, + "step": 1848 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029826248189895904, + "loss": 2.0926, + "step": 1849 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029826060561858887, + "loss": 2.039, + "step": 1850 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002982587283316109, + "loss": 2.0609, + "step": 1851 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002982568500380381, + "loss": 2.0624, + "step": 1852 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029825497073788306, + "loss": 2.0925, + "step": 1853 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029825309043115855, + "loss": 2.1533, + "step": 1854 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002982512091178774, + "loss": 2.1004, + "step": 1855 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002982493267980523, + "loss": 2.1255, + "step": 1856 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002982474434716962, + "loss": 2.0605, + "step": 1857 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029824555913882166, + "loss": 2.1017, + "step": 1858 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029824367379944165, + "loss": 2.0656, + "step": 1859 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029824178745356886, + "loss": 2.133, + "step": 1860 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002982399001012161, + "loss": 2.1528, + "step": 1861 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002982380117423963, + "loss": 2.0659, + "step": 1862 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029823612237712217, + "loss": 2.1178, + "step": 1863 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002982342320054066, + "loss": 2.0502, + "step": 1864 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002982323406272624, + "loss": 2.1164, + "step": 1865 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029823044824270236, + "loss": 2.197, + "step": 1866 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002982285548517394, + "loss": 2.1077, + "step": 1867 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029822666045438634, + "loss": 2.1033, + "step": 1868 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002982247650506561, + "loss": 2.1061, + "step": 1869 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029822286864056145, + "loss": 2.1054, + "step": 1870 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002982209712241154, + "loss": 2.0998, + "step": 1871 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002982190728013307, + "loss": 2.0731, + "step": 1872 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002982171733722202, + "loss": 2.097, + "step": 1873 + }, + { + "epoch": 0.15, + "learning_rate": 0.000298215272936797, + "loss": 2.0627, + "step": 1874 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002982133714950738, + "loss": 2.0485, + "step": 1875 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002982114690470637, + "loss": 2.0982, + "step": 1876 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029820956559277944, + "loss": 2.1116, + "step": 1877 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029820766113223407, + "loss": 2.0901, + "step": 1878 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029820575566544044, + "loss": 2.1517, + "step": 1879 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002982038491924115, + "loss": 2.0426, + "step": 1880 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029820194171316025, + "loss": 2.1224, + "step": 1881 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029820003322769955, + "loss": 2.1719, + "step": 1882 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029819812373604247, + "loss": 2.1116, + "step": 1883 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029819621323820187, + "loss": 2.1149, + "step": 1884 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029819430173419075, + "loss": 2.0367, + "step": 1885 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002981923892240222, + "loss": 2.1769, + "step": 1886 + }, + { + "epoch": 0.15, + "learning_rate": 0.000298190475707709, + "loss": 2.118, + "step": 1887 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002981885611852643, + "loss": 2.0837, + "step": 1888 + }, + { + "epoch": 0.15, + "learning_rate": 0.000298186645656701, + "loss": 2.1307, + "step": 1889 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002981847291220322, + "loss": 2.1015, + "step": 1890 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029818281158127086, + "loss": 2.1098, + "step": 1891 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029818089303442993, + "loss": 2.0871, + "step": 1892 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029817897348152257, + "loss": 2.1796, + "step": 1893 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029817705292256173, + "loss": 2.113, + "step": 1894 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002981751313575605, + "loss": 2.0994, + "step": 1895 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029817320878653195, + "loss": 2.0587, + "step": 1896 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029817128520948896, + "loss": 2.1509, + "step": 1897 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002981693606264448, + "loss": 2.1152, + "step": 1898 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002981674350374124, + "loss": 2.0958, + "step": 1899 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002981655084424049, + "loss": 2.1211, + "step": 1900 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002981635808414354, + "loss": 2.1006, + "step": 1901 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002981616522345169, + "loss": 2.1289, + "step": 1902 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029815972262166253, + "loss": 2.116, + "step": 1903 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029815779200288543, + "loss": 2.1032, + "step": 1904 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002981558603781987, + "loss": 2.1299, + "step": 1905 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002981539277476154, + "loss": 2.0542, + "step": 1906 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029815199411114873, + "loss": 2.0813, + "step": 1907 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002981500594688117, + "loss": 2.0603, + "step": 1908 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029814812382061764, + "loss": 2.1037, + "step": 1909 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002981461871665795, + "loss": 2.1415, + "step": 1910 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002981442495067105, + "loss": 2.0485, + "step": 1911 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002981423108410238, + "loss": 2.1192, + "step": 1912 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029814037116953257, + "loss": 2.0676, + "step": 1913 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029813843049225, + "loss": 2.1396, + "step": 1914 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002981364888091892, + "loss": 2.0359, + "step": 1915 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002981345461203634, + "loss": 2.0844, + "step": 1916 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002981326024257858, + "loss": 2.0771, + "step": 1917 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029813065772546954, + "loss": 1.9899, + "step": 1918 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002981287120194279, + "loss": 2.1394, + "step": 1919 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029812676530767396, + "loss": 2.1107, + "step": 1920 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029812481759022115, + "loss": 2.1022, + "step": 1921 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029812286886708245, + "loss": 2.0473, + "step": 1922 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002981209191382713, + "loss": 2.0597, + "step": 1923 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029811896840380083, + "loss": 2.0929, + "step": 1924 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029811701666368435, + "loss": 2.0362, + "step": 1925 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029811506391793497, + "loss": 2.0858, + "step": 1926 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029811311016656605, + "loss": 2.0956, + "step": 1927 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002981111554095909, + "loss": 2.1622, + "step": 1928 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002981091996470227, + "loss": 2.0585, + "step": 1929 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002981072428788748, + "loss": 2.0899, + "step": 1930 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029810528510516046, + "loss": 2.1545, + "step": 1931 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029810332632589293, + "loss": 2.122, + "step": 1932 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029810136654108557, + "loss": 2.1382, + "step": 1933 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029809940575075165, + "loss": 2.1048, + "step": 1934 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002980974439549045, + "loss": 2.0918, + "step": 1935 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029809548115355744, + "loss": 2.0786, + "step": 1936 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002980935173467237, + "loss": 2.0457, + "step": 1937 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002980915525344168, + "loss": 2.0637, + "step": 1938 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029808958671664995, + "loss": 2.0678, + "step": 1939 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002980876198934366, + "loss": 2.0648, + "step": 1940 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029808565206478993, + "loss": 2.1495, + "step": 1941 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029808368323072345, + "loss": 2.0806, + "step": 1942 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002980817133912505, + "loss": 2.0858, + "step": 1943 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002980797425463844, + "loss": 2.0444, + "step": 1944 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002980777706961385, + "loss": 2.0482, + "step": 1945 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002980757978405264, + "loss": 2.0571, + "step": 1946 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002980738239795613, + "loss": 2.0845, + "step": 1947 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029807184911325655, + "loss": 2.0928, + "step": 1948 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029806987324162575, + "loss": 2.0836, + "step": 1949 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002980678963646822, + "loss": 2.1321, + "step": 1950 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002980659184824394, + "loss": 2.1398, + "step": 1951 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002980639395949106, + "loss": 2.1146, + "step": 1952 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029806195970210947, + "loss": 2.1719, + "step": 1953 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002980599788040493, + "loss": 2.0902, + "step": 1954 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002980579969007436, + "loss": 2.0675, + "step": 1955 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029805601399220577, + "loss": 2.118, + "step": 1956 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002980540300784493, + "loss": 2.0734, + "step": 1957 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002980520451594877, + "loss": 2.0605, + "step": 1958 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002980500592353344, + "loss": 2.0097, + "step": 1959 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002980480723060029, + "loss": 2.0526, + "step": 1960 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002980460843715067, + "loss": 2.0645, + "step": 1961 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002980440954318593, + "loss": 2.0868, + "step": 1962 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029804210548707414, + "loss": 2.0909, + "step": 1963 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029804011453716487, + "loss": 2.129, + "step": 1964 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029803812258214483, + "loss": 2.0605, + "step": 1965 + }, + { + "epoch": 0.15, + "learning_rate": 0.0002980361296220277, + "loss": 2.0563, + "step": 1966 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029803413565682684, + "loss": 2.0395, + "step": 1967 + }, + { + "epoch": 0.15, + "learning_rate": 0.000298032140686556, + "loss": 2.0976, + "step": 1968 + }, + { + "epoch": 0.15, + "learning_rate": 0.00029803014471122853, + "loss": 2.1083, + "step": 1969 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029802814773085813, + "loss": 2.0368, + "step": 1970 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002980261497454583, + "loss": 2.0448, + "step": 1971 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029802415075504254, + "loss": 2.0911, + "step": 1972 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002980221507596245, + "loss": 2.1286, + "step": 1973 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029802014975921775, + "loss": 2.079, + "step": 1974 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002980181477538359, + "loss": 2.1284, + "step": 1975 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002980161447434925, + "loss": 2.0862, + "step": 1976 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002980141407282011, + "loss": 2.0963, + "step": 1977 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002980121357079754, + "loss": 2.1027, + "step": 1978 + }, + { + "epoch": 0.16, + "learning_rate": 0.000298010129682829, + "loss": 2.0803, + "step": 1979 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002980081226527755, + "loss": 2.1294, + "step": 1980 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029800611461782854, + "loss": 2.0762, + "step": 1981 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002980041055780017, + "loss": 2.1366, + "step": 1982 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029800209553330865, + "loss": 2.0884, + "step": 1983 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029800008448376306, + "loss": 2.1108, + "step": 1984 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029799807242937863, + "loss": 2.0597, + "step": 1985 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002979960593701689, + "loss": 2.0843, + "step": 1986 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029799404530614755, + "loss": 2.0863, + "step": 1987 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002979920302373284, + "loss": 2.0951, + "step": 1988 + }, + { + "epoch": 0.16, + "learning_rate": 0.000297990014163725, + "loss": 2.0718, + "step": 1989 + }, + { + "epoch": 0.16, + "learning_rate": 0.000297987997085351, + "loss": 2.0991, + "step": 1990 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029798597900222023, + "loss": 2.1001, + "step": 1991 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029798395991434634, + "loss": 2.0343, + "step": 1992 + }, + { + "epoch": 0.16, + "learning_rate": 0.000297981939821743, + "loss": 2.0072, + "step": 1993 + }, + { + "epoch": 0.16, + "learning_rate": 0.000297979918724424, + "loss": 2.1331, + "step": 1994 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029797789662240295, + "loss": 2.0478, + "step": 1995 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029797587351569366, + "loss": 2.096, + "step": 1996 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029797384940430984, + "loss": 2.0997, + "step": 1997 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029797182428826526, + "loss": 2.0899, + "step": 1998 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002979697981675737, + "loss": 2.0784, + "step": 1999 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029796777104224877, + "loss": 2.062, + "step": 2000 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002979657429123044, + "loss": 2.1609, + "step": 2001 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029796371377775423, + "loss": 2.0302, + "step": 2002 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002979616836386121, + "loss": 2.0556, + "step": 2003 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029795965249489187, + "loss": 2.1351, + "step": 2004 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002979576203466072, + "loss": 2.0698, + "step": 2005 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029795558719377193, + "loss": 2.0186, + "step": 2006 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002979535530363999, + "loss": 2.1455, + "step": 2007 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002979515178745049, + "loss": 2.097, + "step": 2008 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029794948170810064, + "loss": 2.0649, + "step": 2009 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029794744453720117, + "loss": 2.0702, + "step": 2010 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029794540636182015, + "loss": 2.0724, + "step": 2011 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029794336718197146, + "loss": 2.0918, + "step": 2012 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029794132699766893, + "loss": 2.1205, + "step": 2013 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029793928580892643, + "loss": 2.0488, + "step": 2014 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029793724361575785, + "loss": 2.0626, + "step": 2015 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029793520041817705, + "loss": 2.0544, + "step": 2016 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002979331562161978, + "loss": 2.0483, + "step": 2017 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002979311110098341, + "loss": 2.0416, + "step": 2018 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002979290647990998, + "loss": 2.0207, + "step": 2019 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029792701758400876, + "loss": 2.0848, + "step": 2020 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002979249693645749, + "loss": 2.0843, + "step": 2021 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002979229201408122, + "loss": 2.0351, + "step": 2022 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029792086991273437, + "loss": 2.0054, + "step": 2023 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029791881868035554, + "loss": 2.0135, + "step": 2024 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029791676644368956, + "loss": 2.026, + "step": 2025 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029791471320275036, + "loss": 2.0051, + "step": 2026 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002979126589575519, + "loss": 2.0053, + "step": 2027 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002979106037081081, + "loss": 1.9975, + "step": 2028 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002979085474544329, + "loss": 2.04, + "step": 2029 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002979064901965403, + "loss": 2.1558, + "step": 2030 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029790443193444425, + "loss": 2.0497, + "step": 2031 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029790237266815876, + "loss": 2.0991, + "step": 2032 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029790031239769775, + "loss": 2.0086, + "step": 2033 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029789825112307524, + "loss": 2.076, + "step": 2034 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029789618884430523, + "loss": 2.0976, + "step": 2035 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002978941255614017, + "loss": 2.0804, + "step": 2036 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029789206127437865, + "loss": 2.098, + "step": 2037 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029788999598325016, + "loss": 2.023, + "step": 2038 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002978879296880302, + "loss": 2.0611, + "step": 2039 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002978858623887328, + "loss": 2.0857, + "step": 2040 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029788379408537204, + "loss": 2.0188, + "step": 2041 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002978817247779619, + "loss": 2.0464, + "step": 2042 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029787965446651643, + "loss": 2.0408, + "step": 2043 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029787758315104974, + "loss": 2.0794, + "step": 2044 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029787551083157584, + "loss": 2.1005, + "step": 2045 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002978734375081089, + "loss": 2.1179, + "step": 2046 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029787136318066285, + "loss": 2.0216, + "step": 2047 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029786928784925184, + "loss": 2.0963, + "step": 2048 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029786721151389, + "loss": 2.0275, + "step": 2049 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029786513417459144, + "loss": 2.072, + "step": 2050 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002978630558313701, + "loss": 2.0075, + "step": 2051 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029786097648424025, + "loss": 2.0537, + "step": 2052 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029785889613321605, + "loss": 2.0671, + "step": 2053 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002978568147783115, + "loss": 2.0466, + "step": 2054 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002978547324195407, + "loss": 2.0278, + "step": 2055 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002978526490569179, + "loss": 2.0642, + "step": 2056 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002978505646904572, + "loss": 2.11, + "step": 2057 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002978484793201728, + "loss": 2.0614, + "step": 2058 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029784639294607877, + "loss": 2.0719, + "step": 2059 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029784430556818937, + "loss": 2.1282, + "step": 2060 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029784221718651865, + "loss": 2.0671, + "step": 2061 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002978401278010809, + "loss": 2.0684, + "step": 2062 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002978380374118903, + "loss": 2.075, + "step": 2063 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029783594601896096, + "loss": 2.0885, + "step": 2064 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002978338536223071, + "loss": 2.0645, + "step": 2065 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002978317602219431, + "loss": 2.0678, + "step": 2066 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002978296658178829, + "loss": 1.9937, + "step": 2067 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002978275704101409, + "loss": 2.0585, + "step": 2068 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029782547399873126, + "loss": 2.0658, + "step": 2069 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029782337658366823, + "loss": 2.0577, + "step": 2070 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029782127816496603, + "loss": 2.0205, + "step": 2071 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002978191787426389, + "loss": 2.0324, + "step": 2072 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002978170783167012, + "loss": 2.0606, + "step": 2073 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029781497688716706, + "loss": 2.0331, + "step": 2074 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002978128744540508, + "loss": 2.103, + "step": 2075 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002978107710173667, + "loss": 2.0845, + "step": 2076 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029780866657712904, + "loss": 2.0656, + "step": 2077 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029780656113335204, + "loss": 2.0141, + "step": 2078 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029780445468605013, + "loss": 2.0724, + "step": 2079 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029780234723523753, + "loss": 2.0112, + "step": 2080 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002978002387809285, + "loss": 2.0819, + "step": 2081 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002977981293231375, + "loss": 2.0999, + "step": 2082 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002977960188618787, + "loss": 2.0487, + "step": 2083 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002977939073971665, + "loss": 2.0621, + "step": 2084 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029779179492901524, + "loss": 2.04, + "step": 2085 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029778968145743927, + "loss": 2.1299, + "step": 2086 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002977875669824529, + "loss": 2.0178, + "step": 2087 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002977854515040705, + "loss": 2.1118, + "step": 2088 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002977833350223065, + "loss": 2.0414, + "step": 2089 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002977812175371751, + "loss": 2.121, + "step": 2090 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002977790990486909, + "loss": 2.0813, + "step": 2091 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029777697955686805, + "loss": 2.0198, + "step": 2092 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002977748590617211, + "loss": 2.089, + "step": 2093 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029777273756326445, + "loss": 2.0841, + "step": 2094 + }, + { + "epoch": 0.16, + "learning_rate": 0.0002977706150615124, + "loss": 2.1186, + "step": 2095 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029776849155647945, + "loss": 2.0711, + "step": 2096 + }, + { + "epoch": 0.16, + "learning_rate": 0.00029776636704818, + "loss": 2.082, + "step": 2097 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002977642415366285, + "loss": 2.032, + "step": 2098 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029776211502183925, + "loss": 1.9796, + "step": 2099 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029775998750382685, + "loss": 2.0689, + "step": 2100 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029775785898260564, + "loss": 2.0642, + "step": 2101 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002977557294581901, + "loss": 2.0572, + "step": 2102 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029775359893059473, + "loss": 2.0389, + "step": 2103 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002977514673998339, + "loss": 2.0647, + "step": 2104 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002977493348659222, + "loss": 2.0641, + "step": 2105 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002977472013288741, + "loss": 2.0664, + "step": 2106 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029774506678870394, + "loss": 2.0554, + "step": 2107 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029774293124542635, + "loss": 2.0276, + "step": 2108 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002977407946990558, + "loss": 2.1035, + "step": 2109 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029773865714960673, + "loss": 2.0557, + "step": 2110 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002977365185970937, + "loss": 2.0137, + "step": 2111 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029773437904153136, + "loss": 2.0536, + "step": 2112 + }, + { + "epoch": 0.17, + "learning_rate": 0.000297732238482934, + "loss": 2.074, + "step": 2113 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002977300969213163, + "loss": 2.0864, + "step": 2114 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029772795435669276, + "loss": 2.0714, + "step": 2115 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029772581078907795, + "loss": 2.0288, + "step": 2116 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029772366621848637, + "loss": 2.0503, + "step": 2117 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002977215206449327, + "loss": 2.0838, + "step": 2118 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029771937406843134, + "loss": 2.0481, + "step": 2119 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029771722648899696, + "loss": 2.0937, + "step": 2120 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002977150779066441, + "loss": 2.1101, + "step": 2121 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002977129283213875, + "loss": 2.0104, + "step": 2122 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002977107777332415, + "loss": 2.0527, + "step": 2123 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002977086261422209, + "loss": 2.0377, + "step": 2124 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002977064735483402, + "loss": 2.1298, + "step": 2125 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002977043199516141, + "loss": 1.9907, + "step": 2126 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029770216535205714, + "loss": 2.0703, + "step": 2127 + }, + { + "epoch": 0.17, + "learning_rate": 0.000297700009749684, + "loss": 2.0826, + "step": 2128 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029769785314450934, + "loss": 2.1026, + "step": 2129 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029769569553654774, + "loss": 1.9585, + "step": 2130 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029769353692581384, + "loss": 2.0692, + "step": 2131 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029769137731232233, + "loss": 2.0531, + "step": 2132 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002976892166960879, + "loss": 2.0007, + "step": 2133 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002976870550771252, + "loss": 2.0547, + "step": 2134 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002976848924554489, + "loss": 2.0598, + "step": 2135 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002976827288310736, + "loss": 2.048, + "step": 2136 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002976805642040141, + "loss": 2.0446, + "step": 2137 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002976783985742851, + "loss": 2.0287, + "step": 2138 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002976762319419013, + "loss": 1.9962, + "step": 2139 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029767406430687737, + "loss": 2.0513, + "step": 2140 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029767189566922797, + "loss": 2.0286, + "step": 2141 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029766972602896793, + "loss": 2.0442, + "step": 2142 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029766755538611193, + "loss": 1.9561, + "step": 2143 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002976653837406748, + "loss": 2.0029, + "step": 2144 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029766321109267105, + "loss": 1.9993, + "step": 2145 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002976610374421157, + "loss": 2.0265, + "step": 2146 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029765886278902335, + "loss": 1.993, + "step": 2147 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002976566871334088, + "loss": 2.005, + "step": 2148 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029765451047528683, + "loss": 2.0068, + "step": 2149 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002976523328146723, + "loss": 2.0281, + "step": 2150 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002976501541515798, + "loss": 2.0225, + "step": 2151 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029764797448602427, + "loss": 2.0236, + "step": 2152 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029764579381802046, + "loss": 2.0292, + "step": 2153 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002976436121475832, + "loss": 2.0494, + "step": 2154 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002976414294747273, + "loss": 1.9895, + "step": 2155 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029763924579946757, + "loss": 2.0417, + "step": 2156 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002976370611218188, + "loss": 2.0193, + "step": 2157 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002976348754417959, + "loss": 1.9845, + "step": 2158 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002976326887594137, + "loss": 2.0772, + "step": 2159 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002976305010746869, + "loss": 1.9947, + "step": 2160 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029762831238763055, + "loss": 2.0011, + "step": 2161 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029762612269825943, + "loss": 2.0307, + "step": 2162 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029762393200658834, + "loss": 2.0028, + "step": 2163 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002976217403126323, + "loss": 2.0346, + "step": 2164 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029761954761640605, + "loss": 2.0064, + "step": 2165 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002976173539179246, + "loss": 2.0099, + "step": 2166 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029761515921720267, + "loss": 1.9836, + "step": 2167 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029761296351425536, + "loss": 2.0739, + "step": 2168 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029761076680909747, + "loss": 2.0707, + "step": 2169 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002976085691017439, + "loss": 2.0542, + "step": 2170 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029760637039220964, + "loss": 1.9908, + "step": 2171 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002976041706805096, + "loss": 2.0917, + "step": 2172 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029760196996665863, + "loss": 1.9794, + "step": 2173 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002975997682506718, + "loss": 2.0231, + "step": 2174 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029759756553256395, + "loss": 2.0645, + "step": 2175 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002975953618123501, + "loss": 2.0146, + "step": 2176 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029759315709004515, + "loss": 2.0661, + "step": 2177 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002975909513656642, + "loss": 2.1059, + "step": 2178 + }, + { + "epoch": 0.17, + "learning_rate": 0.000297588744639222, + "loss": 2.0158, + "step": 2179 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029758653691073383, + "loss": 2.0777, + "step": 2180 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002975843281802144, + "loss": 2.0022, + "step": 2181 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029758211844767887, + "loss": 2.065, + "step": 2182 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029757990771314225, + "loss": 2.0385, + "step": 2183 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002975776959766194, + "loss": 2.1027, + "step": 2184 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002975754832381255, + "loss": 2.0524, + "step": 2185 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002975732694976755, + "loss": 2.0303, + "step": 2186 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002975710547552844, + "loss": 2.0443, + "step": 2187 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002975688390109673, + "loss": 2.0221, + "step": 2188 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002975666222647393, + "loss": 2.0339, + "step": 2189 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029756440451661524, + "loss": 2.0506, + "step": 2190 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029756218576661034, + "loss": 2.0456, + "step": 2191 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029755996601473964, + "loss": 2.0234, + "step": 2192 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002975577452610182, + "loss": 2.0346, + "step": 2193 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002975555235054611, + "loss": 1.9801, + "step": 2194 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002975533007480835, + "loss": 2.0117, + "step": 2195 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002975510769889003, + "loss": 2.0455, + "step": 2196 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029754885222792676, + "loss": 2.0469, + "step": 2197 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029754662646517795, + "loss": 2.0352, + "step": 2198 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029754439970066895, + "loss": 2.0883, + "step": 2199 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029754217193441487, + "loss": 2.0761, + "step": 2200 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029753994316643095, + "loss": 2.0705, + "step": 2201 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029753771339673216, + "loss": 2.0135, + "step": 2202 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002975354826253337, + "loss": 2.0529, + "step": 2203 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029753325085225075, + "loss": 2.0421, + "step": 2204 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002975310180774985, + "loss": 2.016, + "step": 2205 + }, + { + "epoch": 0.17, + "learning_rate": 0.000297528784301092, + "loss": 2.0118, + "step": 2206 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002975265495230465, + "loss": 2.0527, + "step": 2207 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002975243137433771, + "loss": 2.0918, + "step": 2208 + }, + { + "epoch": 0.17, + "learning_rate": 0.000297522076962099, + "loss": 2.0351, + "step": 2209 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029751983917922746, + "loss": 2.0207, + "step": 2210 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029751760039477764, + "loss": 1.9672, + "step": 2211 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002975153606087647, + "loss": 2.0564, + "step": 2212 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002975131198212038, + "loss": 2.0539, + "step": 2213 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029751087803211025, + "loss": 2.0942, + "step": 2214 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002975086352414993, + "loss": 2.0008, + "step": 2215 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029750639144938604, + "loss": 2.0416, + "step": 2216 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029750414665578585, + "loss": 2.0801, + "step": 2217 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029750190086071386, + "loss": 2.1112, + "step": 2218 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002974996540641854, + "loss": 2.0678, + "step": 2219 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002974974062662157, + "loss": 2.0654, + "step": 2220 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002974951574668199, + "loss": 1.9966, + "step": 2221 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002974929076660135, + "loss": 2.0512, + "step": 2222 + }, + { + "epoch": 0.17, + "learning_rate": 0.0002974906568638116, + "loss": 1.9626, + "step": 2223 + }, + { + "epoch": 0.17, + "learning_rate": 0.00029748840506022955, + "loss": 2.0349, + "step": 2224 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029748615225528256, + "loss": 2.0563, + "step": 2225 + }, + { + "epoch": 0.18, + "learning_rate": 0.000297483898448986, + "loss": 2.0378, + "step": 2226 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002974816436413552, + "loss": 2.0308, + "step": 2227 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002974793878324054, + "loss": 2.0502, + "step": 2228 + }, + { + "epoch": 0.18, + "learning_rate": 0.000297477131022152, + "loss": 2.0889, + "step": 2229 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029747487321061026, + "loss": 2.0482, + "step": 2230 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029747261439779546, + "loss": 2.0146, + "step": 2231 + }, + { + "epoch": 0.18, + "learning_rate": 0.000297470354583723, + "loss": 1.9986, + "step": 2232 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002974680937684082, + "loss": 2.0331, + "step": 2233 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002974658319518664, + "loss": 2.0258, + "step": 2234 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029746356913411303, + "loss": 2.0237, + "step": 2235 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002974613053151634, + "loss": 1.9972, + "step": 2236 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002974590404950329, + "loss": 2.0583, + "step": 2237 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029745677467373687, + "loss": 2.0153, + "step": 2238 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002974545078512907, + "loss": 2.003, + "step": 2239 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029745224002770976, + "loss": 2.0097, + "step": 2240 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029744997120300954, + "loss": 2.0615, + "step": 2241 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002974477013772054, + "loss": 2.0004, + "step": 2242 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002974454305503127, + "loss": 2.0837, + "step": 2243 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002974431587223469, + "loss": 2.016, + "step": 2244 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002974408858933234, + "loss": 2.0561, + "step": 2245 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029743861206325763, + "loss": 1.9982, + "step": 2246 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002974363372321651, + "loss": 1.9744, + "step": 2247 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002974340614000612, + "loss": 1.9857, + "step": 2248 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002974317845669614, + "loss": 2.0216, + "step": 2249 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029742950673288107, + "loss": 1.9925, + "step": 2250 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029742722789783576, + "loss": 1.9485, + "step": 2251 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029742494806184096, + "loss": 2.0601, + "step": 2252 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029742266722491213, + "loss": 2.0974, + "step": 2253 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029742038538706477, + "loss": 2.0268, + "step": 2254 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029741810254831427, + "loss": 2.009, + "step": 2255 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002974158187086763, + "loss": 2.0584, + "step": 2256 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029741353386816615, + "loss": 1.9799, + "step": 2257 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029741124802679954, + "loss": 2.0101, + "step": 2258 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002974089611845919, + "loss": 1.9844, + "step": 2259 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029740667334155873, + "loss": 1.9978, + "step": 2260 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002974043844977156, + "loss": 2.0596, + "step": 2261 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029740209465307807, + "loss": 1.9981, + "step": 2262 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002973998038076616, + "loss": 2.0235, + "step": 2263 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029739751196148186, + "loss": 2.0412, + "step": 2264 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029739521911455435, + "loss": 2.0586, + "step": 2265 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002973929252668946, + "loss": 2.0472, + "step": 2266 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002973906304185183, + "loss": 1.9671, + "step": 2267 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029738833456944094, + "loss": 2.0461, + "step": 2268 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002973860377196781, + "loss": 2.0701, + "step": 2269 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002973837398692454, + "loss": 2.0441, + "step": 2270 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002973814410181584, + "loss": 2.0637, + "step": 2271 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002973791411664328, + "loss": 1.9487, + "step": 2272 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002973768403140842, + "loss": 2.0448, + "step": 2273 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029737453846112805, + "loss": 1.9852, + "step": 2274 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029737223560758017, + "loss": 1.99, + "step": 2275 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002973699317534562, + "loss": 1.9973, + "step": 2276 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029736762689877165, + "loss": 1.9632, + "step": 2277 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002973653210435423, + "loss": 2.0139, + "step": 2278 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002973630141877837, + "loss": 2.0155, + "step": 2279 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029736070633151155, + "loss": 2.0101, + "step": 2280 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029735839747474155, + "loss": 1.9569, + "step": 2281 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002973560876174893, + "loss": 2.0218, + "step": 2282 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002973537767597706, + "loss": 2.0646, + "step": 2283 + }, + { + "epoch": 0.18, + "learning_rate": 0.000297351464901601, + "loss": 2.0021, + "step": 2284 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029734915204299633, + "loss": 2.0048, + "step": 2285 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002973468381839722, + "loss": 2.0572, + "step": 2286 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002973445233245444, + "loss": 1.9633, + "step": 2287 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029734220746472853, + "loss": 2.0672, + "step": 2288 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029733989060454045, + "loss": 2.0408, + "step": 2289 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029733757274399573, + "loss": 2.0763, + "step": 2290 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002973352538831103, + "loss": 2.014, + "step": 2291 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002973329340218998, + "loss": 1.9616, + "step": 2292 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002973306131603799, + "loss": 1.992, + "step": 2293 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029732829129856646, + "loss": 1.9646, + "step": 2294 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029732596843647525, + "loss": 2.0177, + "step": 2295 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029732364457412205, + "loss": 2.0241, + "step": 2296 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002973213197115225, + "loss": 2.0753, + "step": 2297 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029731899384869255, + "loss": 2.0899, + "step": 2298 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029731666698564797, + "loss": 2.0446, + "step": 2299 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029731433912240444, + "loss": 1.9972, + "step": 2300 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002973120102589779, + "loss": 2.0201, + "step": 2301 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029730968039538407, + "loss": 1.9923, + "step": 2302 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029730734953163884, + "loss": 1.9962, + "step": 2303 + }, + { + "epoch": 0.18, + "learning_rate": 0.000297305017667758, + "loss": 2.023, + "step": 2304 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002973026848037573, + "loss": 2.0546, + "step": 2305 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029730035093965273, + "loss": 2.0335, + "step": 2306 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029729801607546, + "loss": 2.0116, + "step": 2307 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002972956802111951, + "loss": 2.0399, + "step": 2308 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002972933433468738, + "loss": 2.0488, + "step": 2309 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029729100548251194, + "loss": 2.022, + "step": 2310 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002972886666181255, + "loss": 2.0583, + "step": 2311 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029728632675373026, + "loss": 2.0473, + "step": 2312 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029728398588934214, + "loss": 2.0611, + "step": 2313 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029728164402497705, + "loss": 1.9656, + "step": 2314 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029727930116065084, + "loss": 1.9663, + "step": 2315 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029727695729637945, + "loss": 1.9858, + "step": 2316 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002972746124321788, + "loss": 1.9981, + "step": 2317 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029727226656806483, + "loss": 2.0173, + "step": 2318 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029726991970405344, + "loss": 2.0221, + "step": 2319 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029726757184016055, + "loss": 2.0794, + "step": 2320 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002972652229764021, + "loss": 1.9978, + "step": 2321 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002972628731127941, + "loss": 2.0507, + "step": 2322 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002972605222493524, + "loss": 1.9727, + "step": 2323 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029725817038609304, + "loss": 1.9691, + "step": 2324 + }, + { + "epoch": 0.18, + "learning_rate": 0.000297255817523032, + "loss": 2.006, + "step": 2325 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002972534636601852, + "loss": 2.0526, + "step": 2326 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002972511087975686, + "loss": 1.9908, + "step": 2327 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002972487529351983, + "loss": 2.0024, + "step": 2328 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029724639607309016, + "loss": 2.0674, + "step": 2329 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029724403821126033, + "loss": 1.968, + "step": 2330 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002972416793497247, + "loss": 2.0535, + "step": 2331 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002972393194884993, + "loss": 2.0276, + "step": 2332 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002972369586276002, + "loss": 2.0136, + "step": 2333 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002972345967670434, + "loss": 2.0052, + "step": 2334 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029723223390684493, + "loss": 2.0048, + "step": 2335 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029722987004702085, + "loss": 2.0477, + "step": 2336 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029722750518758714, + "loss": 2.0199, + "step": 2337 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029722513932856, + "loss": 1.9927, + "step": 2338 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002972227724699554, + "loss": 2.0408, + "step": 2339 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029722040461178934, + "loss": 2.0293, + "step": 2340 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029721803575407806, + "loss": 2.0718, + "step": 2341 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029721566589683754, + "loss": 2.0359, + "step": 2342 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002972132950400839, + "loss": 1.9944, + "step": 2343 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002972109231838332, + "loss": 1.9929, + "step": 2344 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029720855032810153, + "loss": 1.986, + "step": 2345 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029720617647290514, + "loss": 1.9758, + "step": 2346 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029720380161825995, + "loss": 1.9972, + "step": 2347 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029720142576418224, + "loss": 2.0297, + "step": 2348 + }, + { + "epoch": 0.18, + "learning_rate": 0.00029719904891068805, + "loss": 2.0381, + "step": 2349 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002971966710577936, + "loss": 2.02, + "step": 2350 + }, + { + "epoch": 0.18, + "learning_rate": 0.0002971942922055149, + "loss": 2.0395, + "step": 2351 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029719191235386827, + "loss": 1.9586, + "step": 2352 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002971895315028697, + "loss": 1.9831, + "step": 2353 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002971871496525355, + "loss": 2.0259, + "step": 2354 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029718476680288175, + "loss": 2.096, + "step": 2355 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029718238295392465, + "loss": 1.9924, + "step": 2356 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029717999810568047, + "loss": 2.0112, + "step": 2357 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002971776122581652, + "loss": 2.0257, + "step": 2358 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002971752254113953, + "loss": 1.9993, + "step": 2359 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029717283756538674, + "loss": 2.0093, + "step": 2360 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029717044872015584, + "loss": 2.003, + "step": 2361 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029716805887571875, + "loss": 1.9982, + "step": 2362 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002971656680320919, + "loss": 1.9967, + "step": 2363 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002971632761892913, + "loss": 2.0754, + "step": 2364 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029716088334733325, + "loss": 2.0053, + "step": 2365 + }, + { + "epoch": 0.19, + "learning_rate": 0.000297158489506234, + "loss": 1.9816, + "step": 2366 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029715609466600987, + "loss": 2.0577, + "step": 2367 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029715369882667706, + "loss": 1.9694, + "step": 2368 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002971513019882518, + "loss": 2.0338, + "step": 2369 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002971489041507504, + "loss": 2.0154, + "step": 2370 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002971465053141892, + "loss": 1.9841, + "step": 2371 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029714410547858436, + "loss": 1.9484, + "step": 2372 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002971417046439523, + "loss": 2.0448, + "step": 2373 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029713930281030925, + "loss": 2.0485, + "step": 2374 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002971368999776715, + "loss": 2.0419, + "step": 2375 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002971344961460554, + "loss": 2.0089, + "step": 2376 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029713209131547734, + "loss": 2.0564, + "step": 2377 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029712968548595357, + "loss": 1.9625, + "step": 2378 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029712727865750034, + "loss": 2.0046, + "step": 2379 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029712487083013414, + "loss": 2.027, + "step": 2380 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029712246200387123, + "loss": 1.9644, + "step": 2381 + }, + { + "epoch": 0.19, + "learning_rate": 0.000297120052178728, + "loss": 2.0078, + "step": 2382 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002971176413547208, + "loss": 2.0496, + "step": 2383 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029711522953186604, + "loss": 2.0311, + "step": 2384 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029711281671018, + "loss": 2.0109, + "step": 2385 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029711040288967914, + "loss": 1.9503, + "step": 2386 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029710798807037987, + "loss": 2.0139, + "step": 2387 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002971055722522985, + "loss": 2.0064, + "step": 2388 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002971031554354514, + "loss": 2.0027, + "step": 2389 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002971007376198552, + "loss": 2.0233, + "step": 2390 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029709831880552607, + "loss": 2.0745, + "step": 2391 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029709589899248054, + "loss": 2.0128, + "step": 2392 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029709347818073504, + "loss": 2.0563, + "step": 2393 + }, + { + "epoch": 0.19, + "learning_rate": 0.000297091056370306, + "loss": 1.9942, + "step": 2394 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029708863356120994, + "loss": 2.0181, + "step": 2395 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002970862097534631, + "loss": 2.036, + "step": 2396 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002970837849470821, + "loss": 2.0131, + "step": 2397 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029708135914208335, + "loss": 2.0232, + "step": 2398 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002970789323384834, + "loss": 1.9136, + "step": 2399 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029707650453629866, + "loss": 2.0167, + "step": 2400 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002970740757355456, + "loss": 2.0475, + "step": 2401 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029707164593624074, + "loss": 2.0281, + "step": 2402 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029706921513840054, + "loss": 2.055, + "step": 2403 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002970667833420415, + "loss": 2.0329, + "step": 2404 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002970643505471802, + "loss": 2.0095, + "step": 2405 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002970619167538331, + "loss": 1.9488, + "step": 2406 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002970594819620168, + "loss": 2.058, + "step": 2407 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002970570461717477, + "loss": 1.9563, + "step": 2408 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029705460938304245, + "loss": 1.9938, + "step": 2409 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002970521715959175, + "loss": 1.9573, + "step": 2410 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002970497328103895, + "loss": 2.0006, + "step": 2411 + }, + { + "epoch": 0.19, + "learning_rate": 0.000297047293026475, + "loss": 1.9403, + "step": 2412 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002970448522441904, + "loss": 2.0205, + "step": 2413 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029704241046355254, + "loss": 1.9802, + "step": 2414 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002970399676845778, + "loss": 1.9518, + "step": 2415 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002970375239072828, + "loss": 1.9705, + "step": 2416 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002970350791316842, + "loss": 2.0769, + "step": 2417 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002970326333577985, + "loss": 1.9603, + "step": 2418 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002970301865856424, + "loss": 2.0071, + "step": 2419 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029702773881523246, + "loss": 1.9773, + "step": 2420 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002970252900465853, + "loss": 1.9815, + "step": 2421 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002970228402797176, + "loss": 1.964, + "step": 2422 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029702038951464585, + "loss": 1.9941, + "step": 2423 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002970179377513869, + "loss": 2.0307, + "step": 2424 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002970154849899572, + "loss": 1.9634, + "step": 2425 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029701303123037354, + "loss": 1.9698, + "step": 2426 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002970105764726525, + "loss": 2.0627, + "step": 2427 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029700812071681076, + "loss": 1.9517, + "step": 2428 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029700566396286503, + "loss": 1.9837, + "step": 2429 + }, + { + "epoch": 0.19, + "learning_rate": 0.000297003206210832, + "loss": 1.9546, + "step": 2430 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002970007474607283, + "loss": 2.0251, + "step": 2431 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002969982877125706, + "loss": 2.0164, + "step": 2432 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002969958269663757, + "loss": 2.0477, + "step": 2433 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002969933652221602, + "loss": 1.9873, + "step": 2434 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002969909024799409, + "loss": 2.0496, + "step": 2435 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002969884387397345, + "loss": 1.966, + "step": 2436 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029698597400155773, + "loss": 1.9939, + "step": 2437 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029698350826542726, + "loss": 1.9706, + "step": 2438 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029698104153135993, + "loss": 2.0138, + "step": 2439 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029697857379937237, + "loss": 2.0823, + "step": 2440 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029697610506948145, + "loss": 2.032, + "step": 2441 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002969736353417039, + "loss": 1.9983, + "step": 2442 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029697116461605645, + "loss": 1.9871, + "step": 2443 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029696869289255593, + "loss": 2.0175, + "step": 2444 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029696622017121905, + "loss": 2.0184, + "step": 2445 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002969637464520627, + "loss": 1.9509, + "step": 2446 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029696127173510354, + "loss": 1.9664, + "step": 2447 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029695879602035846, + "loss": 2.0135, + "step": 2448 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029695631930784424, + "loss": 1.9805, + "step": 2449 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029695384159757773, + "loss": 1.9801, + "step": 2450 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029695136288957575, + "loss": 2.001, + "step": 2451 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002969488831838551, + "loss": 1.9125, + "step": 2452 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002969464024804326, + "loss": 1.9304, + "step": 2453 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029694392077932516, + "loss": 2.0199, + "step": 2454 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029694143808054954, + "loss": 1.9943, + "step": 2455 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002969389543841227, + "loss": 2.0079, + "step": 2456 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002969364696900614, + "loss": 1.9573, + "step": 2457 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002969339839983826, + "loss": 1.9591, + "step": 2458 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002969314973091031, + "loss": 1.9963, + "step": 2459 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029692900962223983, + "loss": 1.9902, + "step": 2460 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029692652093780964, + "loss": 1.9797, + "step": 2461 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029692403125582947, + "loss": 2.0361, + "step": 2462 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029692154057631625, + "loss": 2.0035, + "step": 2463 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002969190488992868, + "loss": 1.976, + "step": 2464 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002969165562247581, + "loss": 1.9639, + "step": 2465 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029691406255274706, + "loss": 2.0134, + "step": 2466 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002969115678832706, + "loss": 2.0125, + "step": 2467 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002969090722163457, + "loss": 2.0011, + "step": 2468 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002969065755519892, + "loss": 1.9907, + "step": 2469 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029690407789021816, + "loss": 1.9621, + "step": 2470 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029690157923104954, + "loss": 1.9823, + "step": 2471 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002968990795745002, + "loss": 2.0053, + "step": 2472 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002968965789205872, + "loss": 1.9784, + "step": 2473 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029689407726932746, + "loss": 1.9604, + "step": 2474 + }, + { + "epoch": 0.19, + "learning_rate": 0.00029689157462073806, + "loss": 1.9723, + "step": 2475 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002968890709748359, + "loss": 2.0323, + "step": 2476 + }, + { + "epoch": 0.19, + "learning_rate": 0.000296886566331638, + "loss": 1.9825, + "step": 2477 + }, + { + "epoch": 0.19, + "learning_rate": 0.0002968840606911614, + "loss": 1.9766, + "step": 2478 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002968815540534231, + "loss": 2.0157, + "step": 2479 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029687904641844006, + "loss": 2.0257, + "step": 2480 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029687653778622935, + "loss": 1.9628, + "step": 2481 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029687402815680797, + "loss": 1.9822, + "step": 2482 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002968715175301931, + "loss": 1.9808, + "step": 2483 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029686900590640157, + "loss": 2.0006, + "step": 2484 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002968664932854506, + "loss": 1.9586, + "step": 2485 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002968639796673572, + "loss": 2.0379, + "step": 2486 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029686146505213834, + "loss": 2.0451, + "step": 2487 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002968589494398112, + "loss": 1.9686, + "step": 2488 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002968564328303929, + "loss": 1.993, + "step": 2489 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029685391522390044, + "loss": 1.9356, + "step": 2490 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002968513966203509, + "loss": 1.9931, + "step": 2491 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029684887701976145, + "loss": 2.018, + "step": 2492 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029684635642214914, + "loss": 2.0143, + "step": 2493 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029684383482753114, + "loss": 1.9808, + "step": 2494 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002968413122359245, + "loss": 2.0329, + "step": 2495 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029683878864734644, + "loss": 1.9966, + "step": 2496 + }, + { + "epoch": 0.2, + "learning_rate": 0.000296836264061814, + "loss": 2.0304, + "step": 2497 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029683373847934433, + "loss": 2.0164, + "step": 2498 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002968312118999547, + "loss": 2.0047, + "step": 2499 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029682868432366204, + "loss": 1.9647, + "step": 2500 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002968261557504837, + "loss": 1.9896, + "step": 2501 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002968236261804368, + "loss": 1.974, + "step": 2502 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029682109561353847, + "loss": 1.9904, + "step": 2503 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029681856404980596, + "loss": 1.9792, + "step": 2504 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029681603148925645, + "loss": 1.9467, + "step": 2505 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029681349793190707, + "loss": 2.0217, + "step": 2506 + }, + { + "epoch": 0.2, + "learning_rate": 0.000296810963377775, + "loss": 1.9819, + "step": 2507 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029680842782687757, + "loss": 2.0507, + "step": 2508 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002968058912792319, + "loss": 2.0176, + "step": 2509 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029680335373485526, + "loss": 1.9551, + "step": 2510 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029680081519376487, + "loss": 1.9957, + "step": 2511 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029679827565597794, + "loss": 1.9503, + "step": 2512 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029679573512151177, + "loss": 1.9952, + "step": 2513 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002967931935903835, + "loss": 2.0082, + "step": 2514 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029679065106261046, + "loss": 1.9837, + "step": 2515 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029678810753821, + "loss": 1.9005, + "step": 2516 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002967855630171992, + "loss": 1.9805, + "step": 2517 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002967830174995955, + "loss": 1.9415, + "step": 2518 + }, + { + "epoch": 0.2, + "learning_rate": 0.000296780470985416, + "loss": 1.9818, + "step": 2519 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029677792347467815, + "loss": 1.9898, + "step": 2520 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029677537496739924, + "loss": 2.0611, + "step": 2521 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002967728254635965, + "loss": 2.0332, + "step": 2522 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002967702749632873, + "loss": 2.0409, + "step": 2523 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002967677234664889, + "loss": 2.0123, + "step": 2524 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002967651709732187, + "loss": 1.9757, + "step": 2525 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029676261748349386, + "loss": 2.0135, + "step": 2526 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029676006299733193, + "loss": 1.9917, + "step": 2527 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029675750751475015, + "loss": 1.9844, + "step": 2528 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002967549510357659, + "loss": 1.9988, + "step": 2529 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029675239356039647, + "loss": 1.9922, + "step": 2530 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002967498350886593, + "loss": 1.9973, + "step": 2531 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029674727562057176, + "loss": 1.9918, + "step": 2532 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002967447151561512, + "loss": 2.0375, + "step": 2533 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002967421536954149, + "loss": 1.9893, + "step": 2534 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002967395912383805, + "loss": 2.0233, + "step": 2535 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029673702778506514, + "loss": 1.9874, + "step": 2536 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002967344633354864, + "loss": 2.0068, + "step": 2537 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002967318978896616, + "loss": 1.9428, + "step": 2538 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002967293314476082, + "loss": 1.9384, + "step": 2539 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002967267640093436, + "loss": 2.0032, + "step": 2540 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002967241955748853, + "loss": 1.9615, + "step": 2541 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002967216261442506, + "loss": 1.9926, + "step": 2542 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002967190557174571, + "loss": 2.0212, + "step": 2543 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002967164842945221, + "loss": 2.0617, + "step": 2544 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002967139118754632, + "loss": 1.9932, + "step": 2545 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002967113384602978, + "loss": 2.0165, + "step": 2546 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029670876404904335, + "loss": 1.9844, + "step": 2547 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002967061886417173, + "loss": 1.9715, + "step": 2548 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002967036122383372, + "loss": 1.9296, + "step": 2549 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002967010348389206, + "loss": 1.968, + "step": 2550 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002966984564434849, + "loss": 1.9358, + "step": 2551 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002966958770520477, + "loss": 1.9753, + "step": 2552 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029669329666462635, + "loss": 1.9877, + "step": 2553 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002966907152812385, + "loss": 1.9404, + "step": 2554 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002966881329019017, + "loss": 1.9798, + "step": 2555 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029668554952663333, + "loss": 1.9264, + "step": 2556 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002966829651554511, + "loss": 1.9994, + "step": 2557 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002966803797883724, + "loss": 1.9565, + "step": 2558 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029667779342541496, + "loss": 1.9393, + "step": 2559 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002966752060665962, + "loss": 1.9525, + "step": 2560 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029667261771193374, + "loss": 2.011, + "step": 2561 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029667002836144515, + "loss": 1.9882, + "step": 2562 + }, + { + "epoch": 0.2, + "learning_rate": 0.000296667438015148, + "loss": 1.9444, + "step": 2563 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029666484667305987, + "loss": 1.9326, + "step": 2564 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002966622543351984, + "loss": 2.0187, + "step": 2565 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002966596610015811, + "loss": 1.9994, + "step": 2566 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002966570666722257, + "loss": 2.0058, + "step": 2567 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029665447134714977, + "loss": 1.9339, + "step": 2568 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029665187502637085, + "loss": 2.0132, + "step": 2569 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002966492777099066, + "loss": 1.9707, + "step": 2570 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029664667939777477, + "loss": 2.0033, + "step": 2571 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002966440800899929, + "loss": 1.9503, + "step": 2572 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029664147978657857, + "loss": 1.9888, + "step": 2573 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002966388784875496, + "loss": 1.9797, + "step": 2574 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029663627619292354, + "loss": 1.9514, + "step": 2575 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029663367290271806, + "loss": 1.9843, + "step": 2576 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002966310686169509, + "loss": 1.997, + "step": 2577 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029662846333563966, + "loss": 1.9394, + "step": 2578 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002966258570588021, + "loss": 2.0232, + "step": 2579 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002966232497864559, + "loss": 1.9546, + "step": 2580 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029662064151861865, + "loss": 1.9382, + "step": 2581 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029661803225530825, + "loss": 1.9501, + "step": 2582 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002966154219965423, + "loss": 1.9376, + "step": 2583 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002966128107423386, + "loss": 1.9918, + "step": 2584 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002966101984927147, + "loss": 2.003, + "step": 2585 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029660758524768853, + "loss": 2.0151, + "step": 2586 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029660497100727774, + "loss": 2.0116, + "step": 2587 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002966023557715002, + "loss": 2.0253, + "step": 2588 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002965997395403734, + "loss": 1.9861, + "step": 2589 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002965971223139154, + "loss": 1.9946, + "step": 2590 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029659450409214375, + "loss": 1.9661, + "step": 2591 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002965918848750764, + "loss": 2.0268, + "step": 2592 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029658926466273096, + "loss": 2.0264, + "step": 2593 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002965866434551254, + "loss": 1.9889, + "step": 2594 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002965840212522773, + "loss": 1.9583, + "step": 2595 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002965813980542047, + "loss": 1.9626, + "step": 2596 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002965787738609253, + "loss": 1.9797, + "step": 2597 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029657614867245683, + "loss": 2.0048, + "step": 2598 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029657352248881725, + "loss": 1.9786, + "step": 2599 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002965708953100243, + "loss": 1.9793, + "step": 2600 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029656826713609594, + "loss": 1.9795, + "step": 2601 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029656563796704984, + "loss": 1.9338, + "step": 2602 + }, + { + "epoch": 0.2, + "learning_rate": 0.00029656300780290395, + "loss": 1.9694, + "step": 2603 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002965603766436762, + "loss": 1.9332, + "step": 2604 + }, + { + "epoch": 0.2, + "learning_rate": 0.0002965577444893843, + "loss": 1.984, + "step": 2605 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002965551113400462, + "loss": 1.9802, + "step": 2606 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029655247719567973, + "loss": 2.0248, + "step": 2607 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002965498420563029, + "loss": 2.0189, + "step": 2608 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029654720592193345, + "loss": 2.0246, + "step": 2609 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002965445687925894, + "loss": 1.9814, + "step": 2610 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002965419306682885, + "loss": 1.9878, + "step": 2611 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029653929154904886, + "loss": 1.9755, + "step": 2612 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002965366514348883, + "loss": 1.9527, + "step": 2613 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029653401032582466, + "loss": 2.0234, + "step": 2614 + }, + { + "epoch": 0.21, + "learning_rate": 0.000296531368221876, + "loss": 2.0304, + "step": 2615 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029652872512306023, + "loss": 2.0101, + "step": 2616 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029652608102939524, + "loss": 1.9836, + "step": 2617 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002965234359408991, + "loss": 2.0368, + "step": 2618 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002965207898575896, + "loss": 1.9628, + "step": 2619 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002965181427794848, + "loss": 1.9667, + "step": 2620 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002965154947066027, + "loss": 1.9526, + "step": 2621 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002965128456389612, + "loss": 1.9686, + "step": 2622 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002965101955765784, + "loss": 2.0197, + "step": 2623 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002965075445194722, + "loss": 1.9785, + "step": 2624 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029650489246766054, + "loss": 1.949, + "step": 2625 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002965022394211616, + "loss": 1.9698, + "step": 2626 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002964995853799933, + "loss": 1.8866, + "step": 2627 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029649693034417365, + "loss": 1.9842, + "step": 2628 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002964942743137207, + "loss": 2.0231, + "step": 2629 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002964916172886524, + "loss": 1.9974, + "step": 2630 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002964889592689869, + "loss": 1.9512, + "step": 2631 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002964863002547422, + "loss": 1.9448, + "step": 2632 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002964836402459364, + "loss": 1.938, + "step": 2633 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029648097924258747, + "loss": 1.9669, + "step": 2634 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002964783172447135, + "loss": 1.9492, + "step": 2635 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029647565425233263, + "loss": 1.9923, + "step": 2636 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029647299026546294, + "loss": 2.0172, + "step": 2637 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002964703252841224, + "loss": 1.9175, + "step": 2638 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029646765930832925, + "loss": 1.9414, + "step": 2639 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002964649923381015, + "loss": 1.9646, + "step": 2640 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002964623243734573, + "loss": 2.0132, + "step": 2641 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002964596554144147, + "loss": 2.0194, + "step": 2642 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002964569854609918, + "loss": 2.0072, + "step": 2643 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029645431451320685, + "loss": 1.942, + "step": 2644 + }, + { + "epoch": 0.21, + "learning_rate": 0.000296451642571078, + "loss": 2.0061, + "step": 2645 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029644896963462324, + "loss": 1.9367, + "step": 2646 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002964462957038608, + "loss": 1.9102, + "step": 2647 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002964436207788088, + "loss": 1.99, + "step": 2648 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002964409448594855, + "loss": 1.9505, + "step": 2649 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029643826794590895, + "loss": 1.9581, + "step": 2650 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002964355900380974, + "loss": 1.9588, + "step": 2651 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029643291113606895, + "loss": 1.9704, + "step": 2652 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002964302312398419, + "loss": 1.9731, + "step": 2653 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029642755034943436, + "loss": 1.9352, + "step": 2654 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002964248684648646, + "loss": 1.935, + "step": 2655 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002964221855861507, + "loss": 2.0527, + "step": 2656 + }, + { + "epoch": 0.21, + "learning_rate": 0.000296419501713311, + "loss": 1.9329, + "step": 2657 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029641681684636375, + "loss": 1.9278, + "step": 2658 + }, + { + "epoch": 0.21, + "learning_rate": 0.000296414130985327, + "loss": 1.9898, + "step": 2659 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029641144413021915, + "loss": 1.9389, + "step": 2660 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029640875628105846, + "loss": 1.9554, + "step": 2661 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029640606743786305, + "loss": 2.0226, + "step": 2662 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002964033776006512, + "loss": 2.0315, + "step": 2663 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002964006867694413, + "loss": 1.9145, + "step": 2664 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002963979949442514, + "loss": 1.9504, + "step": 2665 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029639530212510003, + "loss": 2.0197, + "step": 2666 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029639260831200524, + "loss": 1.949, + "step": 2667 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002963899135049855, + "loss": 1.9843, + "step": 2668 + }, + { + "epoch": 0.21, + "learning_rate": 0.000296387217704059, + "loss": 1.9527, + "step": 2669 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002963845209092441, + "loss": 1.9631, + "step": 2670 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029638182312055904, + "loss": 1.9532, + "step": 2671 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029637912433802224, + "loss": 1.9832, + "step": 2672 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002963764245616519, + "loss": 1.9801, + "step": 2673 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029637372379146643, + "loss": 1.9372, + "step": 2674 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002963710220274842, + "loss": 1.9731, + "step": 2675 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002963683192697235, + "loss": 1.968, + "step": 2676 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029636561551820264, + "loss": 1.9807, + "step": 2677 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029636291077294, + "loss": 1.9166, + "step": 2678 + }, + { + "epoch": 0.21, + "learning_rate": 0.000296360205033954, + "loss": 1.9566, + "step": 2679 + }, + { + "epoch": 0.21, + "learning_rate": 0.000296357498301263, + "loss": 1.9442, + "step": 2680 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029635479057488537, + "loss": 1.9712, + "step": 2681 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002963520818548394, + "loss": 1.9838, + "step": 2682 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002963493721411436, + "loss": 1.9764, + "step": 2683 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002963466614338163, + "loss": 1.9933, + "step": 2684 + }, + { + "epoch": 0.21, + "learning_rate": 0.000296343949732876, + "loss": 1.9906, + "step": 2685 + }, + { + "epoch": 0.21, + "learning_rate": 0.000296341237038341, + "loss": 1.9669, + "step": 2686 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029633852335022974, + "loss": 1.9623, + "step": 2687 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029633580866856066, + "loss": 2.0132, + "step": 2688 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002963330929933522, + "loss": 1.9704, + "step": 2689 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029633037632462286, + "loss": 1.9751, + "step": 2690 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029632765866239094, + "loss": 1.971, + "step": 2691 + }, + { + "epoch": 0.21, + "learning_rate": 0.000296324940006675, + "loss": 1.9517, + "step": 2692 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029632222035749344, + "loss": 1.9593, + "step": 2693 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002963194997148648, + "loss": 2.0173, + "step": 2694 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002963167780788074, + "loss": 1.9219, + "step": 2695 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029631405544933994, + "loss": 1.9363, + "step": 2696 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002963113318264807, + "loss": 1.9497, + "step": 2697 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002963086072102483, + "loss": 1.9955, + "step": 2698 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002963058816006612, + "loss": 2.0124, + "step": 2699 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002963031549977379, + "loss": 1.94, + "step": 2700 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002963004274014969, + "loss": 1.9805, + "step": 2701 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002962976988119567, + "loss": 1.9751, + "step": 2702 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029629496922913587, + "loss": 1.9809, + "step": 2703 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029629223865305297, + "loss": 1.9919, + "step": 2704 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002962895070837265, + "loss": 1.9917, + "step": 2705 + }, + { + "epoch": 0.21, + "learning_rate": 0.000296286774521175, + "loss": 1.9391, + "step": 2706 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029628404096541705, + "loss": 1.9787, + "step": 2707 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029628130641647115, + "loss": 1.9462, + "step": 2708 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002962785708743559, + "loss": 1.9614, + "step": 2709 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029627583433908993, + "loss": 1.9167, + "step": 2710 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002962730968106917, + "loss": 1.9551, + "step": 2711 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002962703582891799, + "loss": 1.8963, + "step": 2712 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002962676187745731, + "loss": 1.9746, + "step": 2713 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029626487826688985, + "loss": 2.0041, + "step": 2714 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002962621367661488, + "loss": 1.9681, + "step": 2715 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029625939427236855, + "loss": 1.9925, + "step": 2716 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029625665078556775, + "loss": 1.9294, + "step": 2717 + }, + { + "epoch": 0.21, + "learning_rate": 0.000296253906305765, + "loss": 1.9873, + "step": 2718 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002962511608329789, + "loss": 2.0144, + "step": 2719 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002962484143672282, + "loss": 1.9049, + "step": 2720 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002962456669085314, + "loss": 1.9677, + "step": 2721 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002962429184569072, + "loss": 1.9734, + "step": 2722 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002962401690123744, + "loss": 1.9243, + "step": 2723 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002962374185749515, + "loss": 2.0186, + "step": 2724 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002962346671446572, + "loss": 1.9463, + "step": 2725 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002962319147215102, + "loss": 1.9705, + "step": 2726 + }, + { + "epoch": 0.21, + "learning_rate": 0.0002962291613055293, + "loss": 1.9483, + "step": 2727 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029622640689673296, + "loss": 2.0342, + "step": 2728 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029622365149514004, + "loss": 1.9203, + "step": 2729 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029622089510076925, + "loss": 1.9681, + "step": 2730 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029621813771363927, + "loss": 1.9432, + "step": 2731 + }, + { + "epoch": 0.21, + "learning_rate": 0.00029621537933376883, + "loss": 1.9112, + "step": 2732 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029621261996117665, + "loss": 1.9484, + "step": 2733 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002962098595958815, + "loss": 1.9799, + "step": 2734 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029620709823790207, + "loss": 1.973, + "step": 2735 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002962043358872571, + "loss": 1.9898, + "step": 2736 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029620157254396537, + "loss": 1.9215, + "step": 2737 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002961988082080457, + "loss": 1.9124, + "step": 2738 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002961960428795167, + "loss": 1.9627, + "step": 2739 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002961932765583973, + "loss": 1.9286, + "step": 2740 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029619050924470624, + "loss": 1.9117, + "step": 2741 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002961877409384623, + "loss": 1.8861, + "step": 2742 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029618497163968425, + "loss": 1.9358, + "step": 2743 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002961822013483909, + "loss": 1.9603, + "step": 2744 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002961794300646011, + "loss": 1.968, + "step": 2745 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002961766577883336, + "loss": 1.9344, + "step": 2746 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029617388451960735, + "loss": 1.943, + "step": 2747 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029617111025844107, + "loss": 1.9665, + "step": 2748 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002961683350048536, + "loss": 1.9504, + "step": 2749 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029616555875886376, + "loss": 1.9273, + "step": 2750 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029616278152049045, + "loss": 1.9235, + "step": 2751 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002961600032897525, + "loss": 1.9095, + "step": 2752 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002961572240666688, + "loss": 2.0046, + "step": 2753 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002961544438512582, + "loss": 1.9449, + "step": 2754 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029615166264353957, + "loss": 1.9432, + "step": 2755 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029614888044353187, + "loss": 1.9617, + "step": 2756 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002961460972512539, + "loss": 1.9593, + "step": 2757 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002961433130667245, + "loss": 1.8817, + "step": 2758 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002961405278899627, + "loss": 1.9769, + "step": 2759 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002961377417209874, + "loss": 1.9047, + "step": 2760 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029613495455981746, + "loss": 1.96, + "step": 2761 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029613216640647183, + "loss": 1.9076, + "step": 2762 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002961293772609694, + "loss": 1.9779, + "step": 2763 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029612658712332914, + "loss": 1.9608, + "step": 2764 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029612379599357, + "loss": 1.9472, + "step": 2765 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029612100387171094, + "loss": 1.9202, + "step": 2766 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002961182107577709, + "loss": 1.9697, + "step": 2767 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029611541665176887, + "loss": 1.958, + "step": 2768 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002961126215537237, + "loss": 1.9135, + "step": 2769 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029610982546365454, + "loss": 1.9459, + "step": 2770 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002961070283815803, + "loss": 1.9444, + "step": 2771 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002961042303075199, + "loss": 1.9797, + "step": 2772 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029610143124149244, + "loss": 2.0228, + "step": 2773 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002960986311835169, + "loss": 1.9803, + "step": 2774 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002960958301336123, + "loss": 1.9815, + "step": 2775 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002960930280917976, + "loss": 1.9171, + "step": 2776 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029609022505809184, + "loss": 1.947, + "step": 2777 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002960874210325141, + "loss": 1.9437, + "step": 2778 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029608461601508335, + "loss": 2.0045, + "step": 2779 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002960818100058188, + "loss": 1.8615, + "step": 2780 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029607900300473923, + "loss": 1.9953, + "step": 2781 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002960761950118639, + "loss": 1.9401, + "step": 2782 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002960733860272118, + "loss": 1.8921, + "step": 2783 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029607057605080206, + "loss": 1.9349, + "step": 2784 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002960677650826537, + "loss": 1.9544, + "step": 2785 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002960649531227858, + "loss": 2.0052, + "step": 2786 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002960621401712175, + "loss": 1.9634, + "step": 2787 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029605932622796786, + "loss": 1.9421, + "step": 2788 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029605651129305596, + "loss": 1.9888, + "step": 2789 + }, + { + "epoch": 0.22, + "learning_rate": 0.000296053695366501, + "loss": 1.9276, + "step": 2790 + }, + { + "epoch": 0.22, + "learning_rate": 0.000296050878448322, + "loss": 1.9866, + "step": 2791 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002960480605385382, + "loss": 1.982, + "step": 2792 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002960452416371686, + "loss": 1.9358, + "step": 2793 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029604242174423247, + "loss": 1.9882, + "step": 2794 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029603960085974884, + "loss": 1.9659, + "step": 2795 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002960367789837369, + "loss": 1.886, + "step": 2796 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029603395611621584, + "loss": 1.8837, + "step": 2797 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029603113225720485, + "loss": 1.9824, + "step": 2798 + }, + { + "epoch": 0.22, + "learning_rate": 0.000296028307406723, + "loss": 1.9849, + "step": 2799 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029602548156478956, + "loss": 1.9455, + "step": 2800 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029602265473142365, + "loss": 1.8753, + "step": 2801 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002960198269066445, + "loss": 1.959, + "step": 2802 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029601699809047135, + "loss": 1.9752, + "step": 2803 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029601416828292334, + "loss": 1.9652, + "step": 2804 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002960113374840197, + "loss": 1.9862, + "step": 2805 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029600850569377966, + "loss": 1.9705, + "step": 2806 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002960056729122224, + "loss": 1.9454, + "step": 2807 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002960028391393672, + "loss": 1.8944, + "step": 2808 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029600000437523334, + "loss": 1.9891, + "step": 2809 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029599716861984003, + "loss": 1.9916, + "step": 2810 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002959943318732065, + "loss": 1.99, + "step": 2811 + }, + { + "epoch": 0.22, + "learning_rate": 0.000295991494135352, + "loss": 1.9606, + "step": 2812 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002959886554062958, + "loss": 1.9074, + "step": 2813 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029598581568605724, + "loss": 2.0124, + "step": 2814 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002959829749746555, + "loss": 1.9879, + "step": 2815 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029598013327211, + "loss": 1.9039, + "step": 2816 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002959772905784399, + "loss": 1.9466, + "step": 2817 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002959744468936645, + "loss": 1.9618, + "step": 2818 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029597160221780326, + "loss": 1.9725, + "step": 2819 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029596875655087536, + "loss": 1.9678, + "step": 2820 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029596590989290015, + "loss": 1.9794, + "step": 2821 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029596306224389694, + "loss": 1.9197, + "step": 2822 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029596021360388513, + "loss": 1.9384, + "step": 2823 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029595736397288396, + "loss": 1.9644, + "step": 2824 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002959545133509129, + "loss": 1.9516, + "step": 2825 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002959516617379912, + "loss": 1.9611, + "step": 2826 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029594880913413825, + "loss": 1.9323, + "step": 2827 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029594595553937347, + "loss": 1.8608, + "step": 2828 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029594310095371615, + "loss": 1.9878, + "step": 2829 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002959402453771857, + "loss": 1.9338, + "step": 2830 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002959373888098016, + "loss": 1.9217, + "step": 2831 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002959345312515831, + "loss": 1.9671, + "step": 2832 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002959316727025497, + "loss": 1.9832, + "step": 2833 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029592881316272074, + "loss": 1.9989, + "step": 2834 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002959259526321157, + "loss": 1.9054, + "step": 2835 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029592309111075394, + "loss": 2.0174, + "step": 2836 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029592022859865495, + "loss": 1.9607, + "step": 2837 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002959173650958381, + "loss": 1.9148, + "step": 2838 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002959145006023229, + "loss": 1.9194, + "step": 2839 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002959116351181287, + "loss": 1.9897, + "step": 2840 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002959087686432751, + "loss": 1.94, + "step": 2841 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029590590117778144, + "loss": 1.9287, + "step": 2842 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002959030327216672, + "loss": 1.9862, + "step": 2843 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002959001632749519, + "loss": 1.944, + "step": 2844 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029589729283765505, + "loss": 1.9163, + "step": 2845 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029589442140979605, + "loss": 1.9758, + "step": 2846 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002958915489913945, + "loss": 1.9402, + "step": 2847 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002958886755824698, + "loss": 1.9588, + "step": 2848 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002958858011830415, + "loss": 1.9638, + "step": 2849 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002958829257931291, + "loss": 1.9488, + "step": 2850 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002958800494127521, + "loss": 1.8947, + "step": 2851 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002958771720419302, + "loss": 1.8807, + "step": 2852 + }, + { + "epoch": 0.22, + "learning_rate": 0.0002958742936806827, + "loss": 1.9654, + "step": 2853 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029587141432902927, + "loss": 1.9761, + "step": 2854 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029586853398698947, + "loss": 1.9502, + "step": 2855 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029586565265458275, + "loss": 1.9149, + "step": 2856 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029586277033182874, + "loss": 1.9327, + "step": 2857 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029585988701874707, + "loss": 1.9157, + "step": 2858 + }, + { + "epoch": 0.22, + "learning_rate": 0.00029585700271535725, + "loss": 2.0089, + "step": 2859 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002958541174216789, + "loss": 1.9701, + "step": 2860 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029585123113773154, + "loss": 1.9006, + "step": 2861 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002958483438635348, + "loss": 1.8724, + "step": 2862 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002958454555991083, + "loss": 1.9195, + "step": 2863 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029584256634447164, + "loss": 1.9212, + "step": 2864 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002958396760996444, + "loss": 1.9867, + "step": 2865 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029583678486464637, + "loss": 1.95, + "step": 2866 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002958338926394969, + "loss": 1.9435, + "step": 2867 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002958309994242159, + "loss": 1.9624, + "step": 2868 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002958281052188228, + "loss": 1.9409, + "step": 2869 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029582521002333737, + "loss": 1.8945, + "step": 2870 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002958223138377792, + "loss": 1.8976, + "step": 2871 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029581941666216805, + "loss": 1.9708, + "step": 2872 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002958165184965235, + "loss": 1.9649, + "step": 2873 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002958136193408653, + "loss": 1.9935, + "step": 2874 + }, + { + "epoch": 0.23, + "learning_rate": 0.000295810719195213, + "loss": 1.965, + "step": 2875 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029580781805958647, + "loss": 1.9769, + "step": 2876 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002958049159340053, + "loss": 1.9395, + "step": 2877 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002958020128184892, + "loss": 1.9522, + "step": 2878 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002957991087130579, + "loss": 1.9256, + "step": 2879 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002957962036177311, + "loss": 1.9144, + "step": 2880 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029579329753252854, + "loss": 1.8503, + "step": 2881 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029579039045746994, + "loss": 1.8861, + "step": 2882 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029578748239257504, + "loss": 1.9715, + "step": 2883 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029578457333786357, + "loss": 1.9416, + "step": 2884 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029578166329335536, + "loss": 1.9692, + "step": 2885 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029577875225907004, + "loss": 1.9936, + "step": 2886 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002957758402350275, + "loss": 1.9477, + "step": 2887 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029577292722124735, + "loss": 1.949, + "step": 2888 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002957700132177496, + "loss": 1.9662, + "step": 2889 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002957670982245538, + "loss": 1.9964, + "step": 2890 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029576418224167987, + "loss": 1.9044, + "step": 2891 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029576126526914765, + "loss": 1.9292, + "step": 2892 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002957583473069768, + "loss": 1.9478, + "step": 2893 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002957554283551872, + "loss": 1.9905, + "step": 2894 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029575250841379873, + "loss": 1.9148, + "step": 2895 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029574958748283114, + "loss": 1.9386, + "step": 2896 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029574666556230427, + "loss": 1.9857, + "step": 2897 + }, + { + "epoch": 0.23, + "learning_rate": 0.000295743742652238, + "loss": 1.9475, + "step": 2898 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002957408187526521, + "loss": 1.9442, + "step": 2899 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029573789386356646, + "loss": 1.9901, + "step": 2900 + }, + { + "epoch": 0.23, + "learning_rate": 0.000295734967985001, + "loss": 1.9528, + "step": 2901 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002957320411169755, + "loss": 1.9867, + "step": 2902 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002957291132595099, + "loss": 1.9629, + "step": 2903 + }, + { + "epoch": 0.23, + "learning_rate": 0.000295726184412624, + "loss": 1.9558, + "step": 2904 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002957232545763377, + "loss": 1.9334, + "step": 2905 + }, + { + "epoch": 0.23, + "learning_rate": 0.000295720323750671, + "loss": 1.9457, + "step": 2906 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029571739193564364, + "loss": 1.9164, + "step": 2907 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002957144591312756, + "loss": 1.9589, + "step": 2908 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029571152533758684, + "loss": 1.9847, + "step": 2909 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029570859055459724, + "loss": 1.9456, + "step": 2910 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002957056547823267, + "loss": 1.9631, + "step": 2911 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002957027180207952, + "loss": 1.9366, + "step": 2912 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029569978027002255, + "loss": 1.9959, + "step": 2913 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002956968415300289, + "loss": 1.9089, + "step": 2914 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029569390180083407, + "loss": 1.9168, + "step": 2915 + }, + { + "epoch": 0.23, + "learning_rate": 0.000295690961082458, + "loss": 1.9529, + "step": 2916 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002956880193749208, + "loss": 1.9486, + "step": 2917 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002956850766782423, + "loss": 1.9338, + "step": 2918 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029568213299244244, + "loss": 1.9291, + "step": 2919 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002956791883175414, + "loss": 1.9028, + "step": 2920 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029567624265355906, + "loss": 1.9651, + "step": 2921 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029567329600051537, + "loss": 1.9442, + "step": 2922 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002956703483584304, + "loss": 1.9134, + "step": 2923 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029566739972732416, + "loss": 1.8906, + "step": 2924 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002956644501072167, + "loss": 1.9333, + "step": 2925 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029566149949812793, + "loss": 1.9416, + "step": 2926 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029565854790007803, + "loss": 1.9291, + "step": 2927 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029565559531308694, + "loss": 1.9494, + "step": 2928 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002956526417371747, + "loss": 1.9343, + "step": 2929 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002956496871723615, + "loss": 1.9191, + "step": 2930 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029564673161866723, + "loss": 1.9258, + "step": 2931 + }, + { + "epoch": 0.23, + "learning_rate": 0.000295643775076112, + "loss": 1.9419, + "step": 2932 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029564081754471596, + "loss": 1.9564, + "step": 2933 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029563785902449917, + "loss": 1.9338, + "step": 2934 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029563489951548165, + "loss": 1.8527, + "step": 2935 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002956319390176835, + "loss": 1.9541, + "step": 2936 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002956289775311249, + "loss": 1.9187, + "step": 2937 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002956260150558259, + "loss": 1.885, + "step": 2938 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002956230515918066, + "loss": 1.8933, + "step": 2939 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029562008713908714, + "loss": 1.9181, + "step": 2940 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029561712169768765, + "loss": 1.9164, + "step": 2941 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029561415526762827, + "loss": 1.9301, + "step": 2942 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029561118784892916, + "loss": 1.9397, + "step": 2943 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002956082194416104, + "loss": 1.9171, + "step": 2944 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029560525004569216, + "loss": 1.9119, + "step": 2945 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029560227966119465, + "loss": 1.9443, + "step": 2946 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002955993082881381, + "loss": 1.9676, + "step": 2947 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029559633592654246, + "loss": 1.9644, + "step": 2948 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002955933625764281, + "loss": 1.9491, + "step": 2949 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029559038823781514, + "loss": 1.9598, + "step": 2950 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002955874129107238, + "loss": 1.8858, + "step": 2951 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002955844365951743, + "loss": 1.9092, + "step": 2952 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029558145929118674, + "loss": 2.0315, + "step": 2953 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029557848099878145, + "loss": 1.9144, + "step": 2954 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029557550171797865, + "loss": 1.9649, + "step": 2955 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002955725214487985, + "loss": 1.9522, + "step": 2956 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002955695401912612, + "loss": 1.9428, + "step": 2957 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029556655794538714, + "loss": 1.9235, + "step": 2958 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029556357471119643, + "loss": 1.9562, + "step": 2959 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002955605904887094, + "loss": 1.8647, + "step": 2960 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002955576052779463, + "loss": 1.8978, + "step": 2961 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029555461907892735, + "loss": 1.9983, + "step": 2962 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002955516318916729, + "loss": 1.9125, + "step": 2963 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002955486437162032, + "loss": 1.9381, + "step": 2964 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029554565455253845, + "loss": 1.9002, + "step": 2965 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002955426644006991, + "loss": 1.9093, + "step": 2966 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029553967326070537, + "loss": 1.9211, + "step": 2967 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029553668113257753, + "loss": 2.0067, + "step": 2968 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029553368801633597, + "loss": 1.9362, + "step": 2969 + }, + { + "epoch": 0.23, + "learning_rate": 0.000295530693912001, + "loss": 1.9031, + "step": 2970 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029552769881959287, + "loss": 1.8829, + "step": 2971 + }, + { + "epoch": 0.23, + "learning_rate": 0.000295524702739132, + "loss": 1.9544, + "step": 2972 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002955217056706387, + "loss": 1.8732, + "step": 2973 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029551870761413334, + "loss": 1.9583, + "step": 2974 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002955157085696363, + "loss": 1.9336, + "step": 2975 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002955127085371678, + "loss": 1.9872, + "step": 2976 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002955097075167484, + "loss": 1.9413, + "step": 2977 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029550670550839835, + "loss": 1.8951, + "step": 2978 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002955037025121381, + "loss": 1.9037, + "step": 2979 + }, + { + "epoch": 0.23, + "learning_rate": 0.000295500698527988, + "loss": 1.904, + "step": 2980 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002954976935559684, + "loss": 1.9517, + "step": 2981 + }, + { + "epoch": 0.23, + "learning_rate": 0.0002954946875960998, + "loss": 1.9412, + "step": 2982 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029549168064840254, + "loss": 1.9772, + "step": 2983 + }, + { + "epoch": 0.23, + "learning_rate": 0.000295488672712897, + "loss": 1.9484, + "step": 2984 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029548566378960375, + "loss": 1.9457, + "step": 2985 + }, + { + "epoch": 0.23, + "learning_rate": 0.00029548265387854307, + "loss": 1.9658, + "step": 2986 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002954796429797355, + "loss": 1.9219, + "step": 2987 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029547663109320143, + "loss": 1.9363, + "step": 2988 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029547361821896125, + "loss": 1.9417, + "step": 2989 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029547060435703554, + "loss": 1.935, + "step": 2990 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002954675895074447, + "loss": 1.9089, + "step": 2991 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002954645736702092, + "loss": 1.9596, + "step": 2992 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002954615568453495, + "loss": 1.9096, + "step": 2993 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002954585390328861, + "loss": 1.8888, + "step": 2994 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002954555202328395, + "loss": 1.9725, + "step": 2995 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029545250044523026, + "loss": 1.8987, + "step": 2996 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002954494796700787, + "loss": 1.9273, + "step": 2997 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002954464579074055, + "loss": 1.9277, + "step": 2998 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029544343515723116, + "loss": 1.9546, + "step": 2999 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002954404114195761, + "loss": 1.9802, + "step": 3000 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029543738669446086, + "loss": 1.9789, + "step": 3001 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029543436098190606, + "loss": 1.9029, + "step": 3002 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029543133428193224, + "loss": 1.9344, + "step": 3003 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002954283065945599, + "loss": 1.911, + "step": 3004 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002954252779198096, + "loss": 1.9353, + "step": 3005 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002954222482577019, + "loss": 1.9148, + "step": 3006 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029541921760825737, + "loss": 1.9345, + "step": 3007 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029541618597149667, + "loss": 1.908, + "step": 3008 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029541315334744023, + "loss": 1.9111, + "step": 3009 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002954101197361088, + "loss": 1.881, + "step": 3010 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029540708513752287, + "loss": 1.9059, + "step": 3011 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002954040495517031, + "loss": 1.9593, + "step": 3012 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029540101297867005, + "loss": 1.9005, + "step": 3013 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029539797541844434, + "loss": 1.868, + "step": 3014 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029539493687104665, + "loss": 1.8858, + "step": 3015 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002953918973364976, + "loss": 1.9514, + "step": 3016 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002953888568148177, + "loss": 1.9132, + "step": 3017 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002953858153060278, + "loss": 1.9216, + "step": 3018 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029538277281014835, + "loss": 1.8929, + "step": 3019 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029537972932720016, + "loss": 1.9299, + "step": 3020 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029537668485720385, + "loss": 1.9799, + "step": 3021 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029537363940018, + "loss": 1.9453, + "step": 3022 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029537059295614944, + "loss": 1.9296, + "step": 3023 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002953675455251328, + "loss": 1.9567, + "step": 3024 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002953644971071507, + "loss": 1.9136, + "step": 3025 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002953614477022239, + "loss": 1.8654, + "step": 3026 + }, + { + "epoch": 0.24, + "learning_rate": 0.000295358397310373, + "loss": 1.8893, + "step": 3027 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002953553459316189, + "loss": 1.9104, + "step": 3028 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029535229356598215, + "loss": 1.9047, + "step": 3029 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002953492402134836, + "loss": 1.949, + "step": 3030 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029534618587414386, + "loss": 1.8882, + "step": 3031 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029534313054798377, + "loss": 1.9409, + "step": 3032 + }, + { + "epoch": 0.24, + "learning_rate": 0.000295340074235024, + "loss": 1.9173, + "step": 3033 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002953370169352854, + "loss": 1.9195, + "step": 3034 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029533395864878855, + "loss": 1.9158, + "step": 3035 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002953308993755544, + "loss": 1.9091, + "step": 3036 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002953278391156036, + "loss": 1.9596, + "step": 3037 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029532477786895704, + "loss": 1.9425, + "step": 3038 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029532171563563536, + "loss": 1.9926, + "step": 3039 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029531865241565945, + "loss": 1.9387, + "step": 3040 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002953155882090501, + "loss": 1.9674, + "step": 3041 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029531252301582807, + "loss": 1.9419, + "step": 3042 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002953094568360142, + "loss": 1.9422, + "step": 3043 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002953063896696293, + "loss": 1.9456, + "step": 3044 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029530332151669425, + "loss": 1.9313, + "step": 3045 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002953002523772298, + "loss": 1.9425, + "step": 3046 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002952971822512568, + "loss": 1.9205, + "step": 3047 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002952941111387962, + "loss": 1.9096, + "step": 3048 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029529103903986866, + "loss": 1.897, + "step": 3049 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002952879659544952, + "loss": 1.9927, + "step": 3050 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029528489188269664, + "loss": 1.9141, + "step": 3051 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002952818168244938, + "loss": 1.9193, + "step": 3052 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002952787407799076, + "loss": 1.8981, + "step": 3053 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002952756637489589, + "loss": 1.847, + "step": 3054 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002952725857316687, + "loss": 1.909, + "step": 3055 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002952695067280577, + "loss": 1.9687, + "step": 3056 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029526642673814696, + "loss": 1.988, + "step": 3057 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002952633457619574, + "loss": 1.9348, + "step": 3058 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002952602637995098, + "loss": 1.8429, + "step": 3059 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029525718085082525, + "loss": 1.954, + "step": 3060 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029525409691592456, + "loss": 1.8587, + "step": 3061 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002952510119948287, + "loss": 1.8805, + "step": 3062 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029524792608755864, + "loss": 1.9018, + "step": 3063 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002952448391941353, + "loss": 1.915, + "step": 3064 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029524175131457963, + "loss": 1.9796, + "step": 3065 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002952386624489127, + "loss": 1.9062, + "step": 3066 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002952355725971554, + "loss": 1.9412, + "step": 3067 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002952324817593286, + "loss": 1.8909, + "step": 3068 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002952293899354535, + "loss": 1.8896, + "step": 3069 + }, + { + "epoch": 0.24, + "learning_rate": 0.000295226297125551, + "loss": 1.88, + "step": 3070 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029522320332964197, + "loss": 1.9219, + "step": 3071 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002952201085477476, + "loss": 1.9041, + "step": 3072 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002952170127798888, + "loss": 1.9414, + "step": 3073 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002952139160260867, + "loss": 1.8893, + "step": 3074 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002952108182863622, + "loss": 1.9013, + "step": 3075 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002952077195607363, + "loss": 1.8746, + "step": 3076 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029520461984923024, + "loss": 1.9317, + "step": 3077 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029520151915186487, + "loss": 1.9695, + "step": 3078 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029519841746866135, + "loss": 1.9118, + "step": 3079 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029519531479964067, + "loss": 1.9195, + "step": 3080 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029519221114482396, + "loss": 1.9328, + "step": 3081 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029518910650423225, + "loss": 1.9297, + "step": 3082 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029518600087788665, + "loss": 1.8584, + "step": 3083 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029518289426580817, + "loss": 1.8918, + "step": 3084 + }, + { + "epoch": 0.24, + "learning_rate": 0.000295179786668018, + "loss": 1.8839, + "step": 3085 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029517667808453716, + "loss": 1.9493, + "step": 3086 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002951735685153868, + "loss": 1.9459, + "step": 3087 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029517045796058805, + "loss": 1.9873, + "step": 3088 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029516734642016197, + "loss": 1.9028, + "step": 3089 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029516423389412975, + "loss": 1.9675, + "step": 3090 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029516112038251245, + "loss": 1.9186, + "step": 3091 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002951580058853313, + "loss": 1.9536, + "step": 3092 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002951548904026074, + "loss": 1.8689, + "step": 3093 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029515177393436186, + "loss": 1.8927, + "step": 3094 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002951486564806158, + "loss": 1.9158, + "step": 3095 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002951455380413906, + "loss": 1.9138, + "step": 3096 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029514241861670724, + "loss": 1.9913, + "step": 3097 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002951392982065869, + "loss": 1.9204, + "step": 3098 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002951361768110509, + "loss": 1.9286, + "step": 3099 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029513305443012034, + "loss": 1.8494, + "step": 3100 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002951299310638164, + "loss": 1.9179, + "step": 3101 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029512680671216034, + "loss": 1.9152, + "step": 3102 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029512368137517335, + "loss": 1.8952, + "step": 3103 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029512055505287666, + "loss": 1.9642, + "step": 3104 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029511742774529146, + "loss": 1.9724, + "step": 3105 + }, + { + "epoch": 0.24, + "learning_rate": 0.000295114299452439, + "loss": 1.9691, + "step": 3106 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002951111701743405, + "loss": 1.9031, + "step": 3107 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029510803991101734, + "loss": 1.8781, + "step": 3108 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002951049086624906, + "loss": 1.847, + "step": 3109 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002951017764287816, + "loss": 1.9193, + "step": 3110 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029509864320991164, + "loss": 1.9394, + "step": 3111 + }, + { + "epoch": 0.24, + "learning_rate": 0.00029509550900590193, + "loss": 1.8647, + "step": 3112 + }, + { + "epoch": 0.24, + "learning_rate": 0.0002950923738167738, + "loss": 1.9041, + "step": 3113 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002950892376425485, + "loss": 1.9499, + "step": 3114 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029508610048324733, + "loss": 1.908, + "step": 3115 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002950829623388917, + "loss": 1.944, + "step": 3116 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029507982320950275, + "loss": 1.9607, + "step": 3117 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002950766830951018, + "loss": 1.952, + "step": 3118 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029507354199571033, + "loss": 1.8981, + "step": 3119 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029507039991134957, + "loss": 1.9014, + "step": 3120 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002950672568420408, + "loss": 1.8965, + "step": 3121 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029506411278780545, + "loss": 1.9028, + "step": 3122 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029506096774866477, + "loss": 1.9238, + "step": 3123 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029505782172464025, + "loss": 1.8958, + "step": 3124 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002950546747157531, + "loss": 1.9214, + "step": 3125 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002950515267220248, + "loss": 1.9544, + "step": 3126 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029504837774347665, + "loss": 1.9088, + "step": 3127 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029504522778013006, + "loss": 1.8887, + "step": 3128 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029504207683200644, + "loss": 1.8931, + "step": 3129 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029503892489912714, + "loss": 1.9432, + "step": 3130 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029503577198151357, + "loss": 1.8974, + "step": 3131 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029503261807918715, + "loss": 1.8648, + "step": 3132 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002950294631921693, + "loss": 1.8926, + "step": 3133 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029502630732048144, + "loss": 1.8848, + "step": 3134 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029502315046414494, + "loss": 1.8976, + "step": 3135 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002950199926231814, + "loss": 1.9414, + "step": 3136 + }, + { + "epoch": 0.25, + "learning_rate": 0.000295016833797612, + "loss": 1.9216, + "step": 3137 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002950136739874584, + "loss": 1.921, + "step": 3138 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029501051319274195, + "loss": 1.9192, + "step": 3139 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002950073514134841, + "loss": 1.8751, + "step": 3140 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002950041886497064, + "loss": 1.908, + "step": 3141 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029500102490143034, + "loss": 1.8686, + "step": 3142 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029499786016867725, + "loss": 1.9418, + "step": 3143 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002949946944514687, + "loss": 1.9682, + "step": 3144 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029499152774982624, + "loss": 1.8931, + "step": 3145 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002949883600637713, + "loss": 1.9508, + "step": 3146 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002949851913933254, + "loss": 1.9572, + "step": 3147 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002949820217385101, + "loss": 1.9157, + "step": 3148 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029497885109934686, + "loss": 1.9099, + "step": 3149 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002949756794758572, + "loss": 1.855, + "step": 3150 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002949725068680627, + "loss": 1.9448, + "step": 3151 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029496933327598484, + "loss": 1.9213, + "step": 3152 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029496615869964524, + "loss": 1.927, + "step": 3153 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029496298313906545, + "loss": 1.8928, + "step": 3154 + }, + { + "epoch": 0.25, + "learning_rate": 0.000294959806594267, + "loss": 1.888, + "step": 3155 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002949566290652714, + "loss": 1.9317, + "step": 3156 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029495345055210033, + "loss": 1.8719, + "step": 3157 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029495027105477535, + "loss": 1.904, + "step": 3158 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029494709057331794, + "loss": 1.8777, + "step": 3159 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029494390910774984, + "loss": 1.8914, + "step": 3160 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002949407266580926, + "loss": 1.9697, + "step": 3161 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002949375432243677, + "loss": 1.8965, + "step": 3162 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029493435880659696, + "loss": 1.9026, + "step": 3163 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029493117340480187, + "loss": 1.8232, + "step": 3164 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029492798701900413, + "loss": 1.9288, + "step": 3165 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029492479964922526, + "loss": 1.9273, + "step": 3166 + }, + { + "epoch": 0.25, + "learning_rate": 0.000294921611295487, + "loss": 1.9318, + "step": 3167 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029491842195781106, + "loss": 1.9087, + "step": 3168 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002949152316362189, + "loss": 1.8782, + "step": 3169 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002949120403307324, + "loss": 1.9071, + "step": 3170 + }, + { + "epoch": 0.25, + "learning_rate": 0.000294908848041373, + "loss": 1.8867, + "step": 3171 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002949056547681625, + "loss": 1.9326, + "step": 3172 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029490246051112266, + "loss": 1.9377, + "step": 3173 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029489926527027504, + "loss": 1.9129, + "step": 3174 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029489606904564133, + "loss": 1.9018, + "step": 3175 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002948928718372433, + "loss": 1.9011, + "step": 3176 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029488967364510265, + "loss": 1.9105, + "step": 3177 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029488647446924103, + "loss": 1.9082, + "step": 3178 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002948832743096802, + "loss": 1.9626, + "step": 3179 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002948800731664419, + "loss": 1.9482, + "step": 3180 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002948768710395479, + "loss": 1.9301, + "step": 3181 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029487366792901984, + "loss": 1.9821, + "step": 3182 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002948704638348796, + "loss": 1.9031, + "step": 3183 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029486725875714877, + "loss": 1.8373, + "step": 3184 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002948640526958492, + "loss": 1.8805, + "step": 3185 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002948608456510027, + "loss": 1.8826, + "step": 3186 + }, + { + "epoch": 0.25, + "learning_rate": 0.000294857637622631, + "loss": 1.9156, + "step": 3187 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002948544286107559, + "loss": 1.9861, + "step": 3188 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029485121861539906, + "loss": 1.8897, + "step": 3189 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002948480076365825, + "loss": 1.934, + "step": 3190 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002948447956743278, + "loss": 1.9889, + "step": 3191 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029484158272865695, + "loss": 1.8649, + "step": 3192 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002948383687995917, + "loss": 1.8908, + "step": 3193 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029483515388715374, + "loss": 1.9103, + "step": 3194 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002948319379913651, + "loss": 1.9455, + "step": 3195 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002948287211122475, + "loss": 1.9045, + "step": 3196 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002948255032498228, + "loss": 1.9232, + "step": 3197 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029482228440411287, + "loss": 1.9125, + "step": 3198 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002948190645751396, + "loss": 1.9784, + "step": 3199 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002948158437629247, + "loss": 1.8743, + "step": 3200 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002948126219674902, + "loss": 1.8962, + "step": 3201 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002948093991888579, + "loss": 1.902, + "step": 3202 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002948061754270497, + "loss": 1.944, + "step": 3203 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002948029506820874, + "loss": 1.9382, + "step": 3204 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002947997249539931, + "loss": 1.9346, + "step": 3205 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002947964982427885, + "loss": 1.9171, + "step": 3206 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029479327054849556, + "loss": 1.9261, + "step": 3207 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002947900418711363, + "loss": 1.9266, + "step": 3208 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029478681221073243, + "loss": 1.9622, + "step": 3209 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029478358156730615, + "loss": 1.9768, + "step": 3210 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029478034994087914, + "loss": 1.8953, + "step": 3211 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029477711733147356, + "loss": 1.9088, + "step": 3212 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029477388373911115, + "loss": 1.9035, + "step": 3213 + }, + { + "epoch": 0.25, + "learning_rate": 0.000294770649163814, + "loss": 1.9174, + "step": 3214 + }, + { + "epoch": 0.25, + "learning_rate": 0.000294767413605604, + "loss": 1.8209, + "step": 3215 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002947641770645032, + "loss": 1.9644, + "step": 3216 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002947609395405335, + "loss": 1.8753, + "step": 3217 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002947577010337169, + "loss": 1.8886, + "step": 3218 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002947544615440754, + "loss": 1.8764, + "step": 3219 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029475122107163105, + "loss": 1.9021, + "step": 3220 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029474797961640567, + "loss": 1.9067, + "step": 3221 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002947447371784215, + "loss": 1.9475, + "step": 3222 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029474149375770036, + "loss": 1.9191, + "step": 3223 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029473824935426435, + "loss": 1.9519, + "step": 3224 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002947350039681355, + "loss": 1.9099, + "step": 3225 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002947317575993359, + "loss": 1.8684, + "step": 3226 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002947285102478876, + "loss": 1.9149, + "step": 3227 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029472526191381244, + "loss": 1.9164, + "step": 3228 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002947220125971327, + "loss": 1.8882, + "step": 3229 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002947187622978703, + "loss": 1.8581, + "step": 3230 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002947155110160474, + "loss": 1.9002, + "step": 3231 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029471225875168607, + "loss": 1.9286, + "step": 3232 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002947090055048083, + "loss": 1.8482, + "step": 3233 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029470575127543626, + "loss": 1.8948, + "step": 3234 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029470249606359204, + "loss": 1.8938, + "step": 3235 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002946992398692977, + "loss": 1.912, + "step": 3236 + }, + { + "epoch": 0.25, + "learning_rate": 0.00029469598269257546, + "loss": 1.9163, + "step": 3237 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002946927245334472, + "loss": 1.9518, + "step": 3238 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002946894653919353, + "loss": 1.9013, + "step": 3239 + }, + { + "epoch": 0.25, + "learning_rate": 0.0002946862052680617, + "loss": 1.9324, + "step": 3240 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002946829441618487, + "loss": 1.8947, + "step": 3241 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002946796820733183, + "loss": 1.9273, + "step": 3242 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002946764190024927, + "loss": 1.9069, + "step": 3243 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002946731549493941, + "loss": 1.9343, + "step": 3244 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029466988991404453, + "loss": 1.9035, + "step": 3245 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002946666238964663, + "loss": 1.9506, + "step": 3246 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002946633568966815, + "loss": 1.8922, + "step": 3247 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029466008891471237, + "loss": 1.8763, + "step": 3248 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002946568199505811, + "loss": 1.8464, + "step": 3249 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029465355000430975, + "loss": 1.8973, + "step": 3250 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029465027907592066, + "loss": 1.8987, + "step": 3251 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029464700716543604, + "loss": 1.8277, + "step": 3252 + }, + { + "epoch": 0.26, + "learning_rate": 0.000294643734272878, + "loss": 1.8928, + "step": 3253 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002946404603982689, + "loss": 1.926, + "step": 3254 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002946371855416309, + "loss": 1.9245, + "step": 3255 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002946339097029861, + "loss": 1.9048, + "step": 3256 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029463063288235697, + "loss": 1.8699, + "step": 3257 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029462735507976566, + "loss": 1.9063, + "step": 3258 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002946240762952344, + "loss": 1.9673, + "step": 3259 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029462079652878547, + "loss": 1.9287, + "step": 3260 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029461751578044115, + "loss": 1.9137, + "step": 3261 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029461423405022366, + "loss": 1.8875, + "step": 3262 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002946109513381554, + "loss": 1.8623, + "step": 3263 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002946076676442585, + "loss": 1.8767, + "step": 3264 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002946043829685554, + "loss": 1.9078, + "step": 3265 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002946010973110683, + "loss": 1.8734, + "step": 3266 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002945978106718196, + "loss": 1.9253, + "step": 3267 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002945945230508315, + "loss": 1.8997, + "step": 3268 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002945912344481264, + "loss": 1.8574, + "step": 3269 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029458794486372666, + "loss": 1.8936, + "step": 3270 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029458465429765455, + "loss": 1.9375, + "step": 3271 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002945813627499324, + "loss": 1.8769, + "step": 3272 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002945780702205826, + "loss": 1.8702, + "step": 3273 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029457477670962747, + "loss": 1.9111, + "step": 3274 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002945714822170894, + "loss": 1.8927, + "step": 3275 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002945681867429907, + "loss": 1.8607, + "step": 3276 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029456489028735386, + "loss": 1.8996, + "step": 3277 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029456159285020116, + "loss": 1.8994, + "step": 3278 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029455829443155503, + "loss": 1.9765, + "step": 3279 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029455499503143787, + "loss": 1.831, + "step": 3280 + }, + { + "epoch": 0.26, + "learning_rate": 0.000294551694649872, + "loss": 1.959, + "step": 3281 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029454839328687995, + "loss": 1.8721, + "step": 3282 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029454509094248407, + "loss": 1.9269, + "step": 3283 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029454178761670677, + "loss": 1.9417, + "step": 3284 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029453848330957054, + "loss": 1.917, + "step": 3285 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002945351780210977, + "loss": 1.9386, + "step": 3286 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029453187175131084, + "loss": 1.9294, + "step": 3287 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029452856450023227, + "loss": 1.9278, + "step": 3288 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029452525626788453, + "loss": 1.9549, + "step": 3289 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029452194705429003, + "loss": 1.9348, + "step": 3290 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002945186368594713, + "loss": 1.8755, + "step": 3291 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029451532568345077, + "loss": 1.9236, + "step": 3292 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029451201352625095, + "loss": 1.9201, + "step": 3293 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029450870038789424, + "loss": 1.898, + "step": 3294 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029450538626840325, + "loss": 1.8375, + "step": 3295 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002945020711678004, + "loss": 1.8723, + "step": 3296 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002944987550861083, + "loss": 1.8253, + "step": 3297 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029449543802334934, + "loss": 1.9144, + "step": 3298 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002944921199795461, + "loss": 1.8857, + "step": 3299 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002944888009547211, + "loss": 1.9143, + "step": 3300 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002944854809488969, + "loss": 1.9129, + "step": 3301 + }, + { + "epoch": 0.26, + "learning_rate": 0.000294482159962096, + "loss": 1.9294, + "step": 3302 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029447883799434095, + "loss": 1.9072, + "step": 3303 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029447551504565433, + "loss": 1.9835, + "step": 3304 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002944721911160587, + "loss": 1.8865, + "step": 3305 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029446886620557665, + "loss": 1.9332, + "step": 3306 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002944655403142307, + "loss": 1.9307, + "step": 3307 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029446221344204345, + "loss": 1.9389, + "step": 3308 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002944588855890375, + "loss": 1.8921, + "step": 3309 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002944555567552354, + "loss": 1.9529, + "step": 3310 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002944522269406598, + "loss": 1.896, + "step": 3311 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002944488961453333, + "loss": 1.8985, + "step": 3312 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002944455643692785, + "loss": 1.9344, + "step": 3313 + }, + { + "epoch": 0.26, + "learning_rate": 0.000294442231612518, + "loss": 1.9506, + "step": 3314 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029443889787507453, + "loss": 1.8878, + "step": 3315 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002944355631569706, + "loss": 1.8725, + "step": 3316 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002944322274582289, + "loss": 1.9367, + "step": 3317 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002944288907788721, + "loss": 1.9069, + "step": 3318 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002944255531189229, + "loss": 1.9106, + "step": 3319 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002944222144784038, + "loss": 1.9446, + "step": 3320 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029441887485733763, + "loss": 1.9151, + "step": 3321 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002944155342557469, + "loss": 1.9293, + "step": 3322 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029441219267365446, + "loss": 1.9163, + "step": 3323 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002944088501110829, + "loss": 1.8758, + "step": 3324 + }, + { + "epoch": 0.26, + "learning_rate": 0.000294405506568055, + "loss": 1.9934, + "step": 3325 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002944021620445933, + "loss": 1.9279, + "step": 3326 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002943988165407207, + "loss": 1.909, + "step": 3327 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029439547005645977, + "loss": 1.8924, + "step": 3328 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002943921225918333, + "loss": 1.9478, + "step": 3329 + }, + { + "epoch": 0.26, + "learning_rate": 0.000294388774146864, + "loss": 1.8765, + "step": 3330 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029438542472157457, + "loss": 1.8346, + "step": 3331 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002943820743159878, + "loss": 1.9355, + "step": 3332 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029437872293012644, + "loss": 1.9302, + "step": 3333 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002943753705640132, + "loss": 1.9188, + "step": 3334 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002943720172176709, + "loss": 1.9095, + "step": 3335 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029436866289112224, + "loss": 1.9501, + "step": 3336 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002943653075843901, + "loss": 1.8645, + "step": 3337 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029436195129749714, + "loss": 1.9047, + "step": 3338 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029435859403046614, + "loss": 1.9049, + "step": 3339 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029435523578332006, + "loss": 1.8794, + "step": 3340 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002943518765560815, + "loss": 1.8991, + "step": 3341 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002943485163487734, + "loss": 1.8827, + "step": 3342 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002943451551614185, + "loss": 1.915, + "step": 3343 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029434179299403973, + "loss": 1.8549, + "step": 3344 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029433842984665973, + "loss": 1.8188, + "step": 3345 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002943350657193015, + "loss": 1.8822, + "step": 3346 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029433170061198786, + "loss": 1.8649, + "step": 3347 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029432833452474157, + "loss": 1.8819, + "step": 3348 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029432496745758556, + "loss": 1.8715, + "step": 3349 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029432159941054263, + "loss": 1.9307, + "step": 3350 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029431823038363574, + "loss": 1.9379, + "step": 3351 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002943148603768877, + "loss": 1.8985, + "step": 3352 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029431148939032135, + "loss": 1.8922, + "step": 3353 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002943081174239596, + "loss": 1.8819, + "step": 3354 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002943047444778254, + "loss": 1.9372, + "step": 3355 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002943013705519417, + "loss": 1.8865, + "step": 3356 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029429799564633123, + "loss": 1.8866, + "step": 3357 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002942946197610171, + "loss": 1.8663, + "step": 3358 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029429124289602205, + "loss": 1.9257, + "step": 3359 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029428786505136903, + "loss": 1.8568, + "step": 3360 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002942844862270812, + "loss": 1.8761, + "step": 3361 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029428110642318116, + "loss": 1.8608, + "step": 3362 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002942777256396921, + "loss": 1.8626, + "step": 3363 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029427434387663693, + "loss": 1.8968, + "step": 3364 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002942709611340386, + "loss": 1.8696, + "step": 3365 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029426757741191995, + "loss": 1.8726, + "step": 3366 + }, + { + "epoch": 0.26, + "learning_rate": 0.0002942641927103041, + "loss": 1.8866, + "step": 3367 + }, + { + "epoch": 0.26, + "learning_rate": 0.00029426080702921404, + "loss": 1.8828, + "step": 3368 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029425742036867273, + "loss": 1.8992, + "step": 3369 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002942540327287031, + "loss": 1.8505, + "step": 3370 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002942506441093282, + "loss": 1.8081, + "step": 3371 + }, + { + "epoch": 0.27, + "learning_rate": 0.000294247254510571, + "loss": 1.9217, + "step": 3372 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002942438639324546, + "loss": 1.8956, + "step": 3373 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029424047237500194, + "loss": 1.9423, + "step": 3374 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029423707983823605, + "loss": 1.9502, + "step": 3375 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029423368632218, + "loss": 1.96, + "step": 3376 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002942302918268568, + "loss": 1.8417, + "step": 3377 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029422689635228956, + "loss": 1.9154, + "step": 3378 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002942234998985012, + "loss": 1.8254, + "step": 3379 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029422010246551495, + "loss": 1.9248, + "step": 3380 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002942167040533538, + "loss": 1.8601, + "step": 3381 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029421330466204075, + "loss": 1.8962, + "step": 3382 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029420990429159893, + "loss": 1.947, + "step": 3383 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029420650294205154, + "loss": 1.9282, + "step": 3384 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002942031006134215, + "loss": 1.9087, + "step": 3385 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029419969730573196, + "loss": 1.8461, + "step": 3386 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002941962930190061, + "loss": 1.8558, + "step": 3387 + }, + { + "epoch": 0.27, + "learning_rate": 0.000294192887753267, + "loss": 1.8868, + "step": 3388 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002941894815085377, + "loss": 1.9549, + "step": 3389 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029418607428484145, + "loss": 1.8848, + "step": 3390 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002941826660822013, + "loss": 1.8639, + "step": 3391 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029417925690064045, + "loss": 1.8139, + "step": 3392 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029417584674018197, + "loss": 1.886, + "step": 3393 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029417243560084905, + "loss": 1.8715, + "step": 3394 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029416902348266486, + "loss": 1.908, + "step": 3395 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002941656103856526, + "loss": 1.9148, + "step": 3396 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029416219630983535, + "loss": 1.859, + "step": 3397 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002941587812552364, + "loss": 1.8007, + "step": 3398 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002941553652218788, + "loss": 1.9247, + "step": 3399 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029415194820978585, + "loss": 1.9071, + "step": 3400 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029414853021898074, + "loss": 1.9396, + "step": 3401 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002941451112494866, + "loss": 1.8785, + "step": 3402 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002941416913013268, + "loss": 1.8548, + "step": 3403 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002941382703745244, + "loss": 1.9128, + "step": 3404 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002941348484691027, + "loss": 1.9228, + "step": 3405 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002941314255850849, + "loss": 1.8807, + "step": 3406 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029412800172249427, + "loss": 1.918, + "step": 3407 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002941245768813541, + "loss": 1.8916, + "step": 3408 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002941211510616875, + "loss": 1.9117, + "step": 3409 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029411772426351786, + "loss": 1.9661, + "step": 3410 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029411429648686836, + "loss": 1.8503, + "step": 3411 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002941108677317624, + "loss": 1.8941, + "step": 3412 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002941074379982231, + "loss": 1.886, + "step": 3413 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029410400728627385, + "loss": 1.8502, + "step": 3414 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029410057559593793, + "loss": 1.8735, + "step": 3415 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029409714292723857, + "loss": 1.8865, + "step": 3416 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002940937092801992, + "loss": 1.9119, + "step": 3417 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029409027465484303, + "loss": 1.8924, + "step": 3418 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029408683905119337, + "loss": 1.886, + "step": 3419 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002940834024692736, + "loss": 1.8929, + "step": 3420 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002940799649091071, + "loss": 1.9259, + "step": 3421 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029407652637071714, + "loss": 1.8967, + "step": 3422 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029407308685412703, + "loss": 1.8536, + "step": 3423 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002940696463593602, + "loss": 1.8668, + "step": 3424 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002940662048864399, + "loss": 1.9217, + "step": 3425 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029406276243538966, + "loss": 1.9107, + "step": 3426 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002940593190062327, + "loss": 1.9356, + "step": 3427 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002940558745989925, + "loss": 1.8852, + "step": 3428 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002940524292136924, + "loss": 1.9408, + "step": 3429 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002940489828503558, + "loss": 1.8319, + "step": 3430 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002940455355090061, + "loss": 1.8672, + "step": 3431 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029404208718966673, + "loss": 1.9145, + "step": 3432 + }, + { + "epoch": 0.27, + "learning_rate": 0.000294038637892361, + "loss": 1.8757, + "step": 3433 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002940351876171125, + "loss": 1.8588, + "step": 3434 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029403173636394453, + "loss": 1.8544, + "step": 3435 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002940282841328805, + "loss": 1.9026, + "step": 3436 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029402483092394395, + "loss": 1.828, + "step": 3437 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002940213767371583, + "loss": 1.9297, + "step": 3438 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029401792157254694, + "loss": 1.7984, + "step": 3439 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029401446543013334, + "loss": 1.8732, + "step": 3440 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029401100830994106, + "loss": 1.9118, + "step": 3441 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029400755021199347, + "loss": 1.865, + "step": 3442 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002940040911363141, + "loss": 1.8978, + "step": 3443 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002940006310829264, + "loss": 1.9485, + "step": 3444 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002939971700518539, + "loss": 1.8739, + "step": 3445 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002939937080431201, + "loss": 1.8548, + "step": 3446 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002939902450567485, + "loss": 1.8391, + "step": 3447 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002939867810927625, + "loss": 1.8905, + "step": 3448 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029398331615118574, + "loss": 1.8502, + "step": 3449 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029397985023204177, + "loss": 1.9434, + "step": 3450 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029397638333535407, + "loss": 1.8861, + "step": 3451 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029397291546114616, + "loss": 1.8416, + "step": 3452 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002939694466094416, + "loss": 1.9213, + "step": 3453 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029396597678026397, + "loss": 1.8575, + "step": 3454 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029396250597363673, + "loss": 1.9116, + "step": 3455 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002939590341895836, + "loss": 1.8401, + "step": 3456 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029395556142812804, + "loss": 1.8916, + "step": 3457 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002939520876892937, + "loss": 1.914, + "step": 3458 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029394861297310406, + "loss": 1.9689, + "step": 3459 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029394513727958277, + "loss": 1.8979, + "step": 3460 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002939416606087535, + "loss": 1.8956, + "step": 3461 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029393818296063974, + "loss": 1.9295, + "step": 3462 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029393470433526517, + "loss": 1.8495, + "step": 3463 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029393122473265343, + "loss": 1.8916, + "step": 3464 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029392774415282804, + "loss": 1.8679, + "step": 3465 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002939242625958127, + "loss": 1.816, + "step": 3466 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029392078006163104, + "loss": 1.8988, + "step": 3467 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002939172965503067, + "loss": 1.9046, + "step": 3468 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029391381206186337, + "loss": 1.891, + "step": 3469 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002939103265963246, + "loss": 1.9038, + "step": 3470 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002939068401537142, + "loss": 1.8665, + "step": 3471 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029390335273405576, + "loss": 1.8903, + "step": 3472 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029389986433737297, + "loss": 1.8913, + "step": 3473 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002938963749636895, + "loss": 1.8979, + "step": 3474 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029389288461302907, + "loss": 1.9142, + "step": 3475 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029388939328541533, + "loss": 1.8765, + "step": 3476 + }, + { + "epoch": 0.27, + "learning_rate": 0.000293885900980872, + "loss": 1.8712, + "step": 3477 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029388240769942286, + "loss": 1.8507, + "step": 3478 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029387891344109156, + "loss": 1.8951, + "step": 3479 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029387541820590185, + "loss": 1.8792, + "step": 3480 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029387192199387737, + "loss": 1.8914, + "step": 3481 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029386842480504197, + "loss": 1.8681, + "step": 3482 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002938649266394194, + "loss": 1.8727, + "step": 3483 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029386142749703335, + "loss": 1.9193, + "step": 3484 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002938579273779076, + "loss": 1.9174, + "step": 3485 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002938544262820659, + "loss": 1.8653, + "step": 3486 + }, + { + "epoch": 0.27, + "learning_rate": 0.000293850924209532, + "loss": 1.9053, + "step": 3487 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002938474211603298, + "loss": 1.9031, + "step": 3488 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002938439171344829, + "loss": 1.9413, + "step": 3489 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002938404121320152, + "loss": 1.8723, + "step": 3490 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002938369061529505, + "loss": 1.925, + "step": 3491 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002938333991973126, + "loss": 1.912, + "step": 3492 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029382989126512524, + "loss": 1.9055, + "step": 3493 + }, + { + "epoch": 0.27, + "learning_rate": 0.00029382638235641234, + "loss": 1.8252, + "step": 3494 + }, + { + "epoch": 0.27, + "learning_rate": 0.0002938228724711976, + "loss": 1.8963, + "step": 3495 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029381936160950505, + "loss": 1.8776, + "step": 3496 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002938158497713583, + "loss": 1.9174, + "step": 3497 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029381233695678134, + "loss": 1.8829, + "step": 3498 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029380882316579795, + "loss": 1.8521, + "step": 3499 + }, + { + "epoch": 0.28, + "learning_rate": 0.000293805308398432, + "loss": 1.9833, + "step": 3500 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002938017926547074, + "loss": 1.8689, + "step": 3501 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029379827593464797, + "loss": 1.9059, + "step": 3502 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029379475823827756, + "loss": 1.8841, + "step": 3503 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002937912395656201, + "loss": 1.8644, + "step": 3504 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029378771991669955, + "loss": 1.8723, + "step": 3505 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002937841992915397, + "loss": 1.8964, + "step": 3506 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029378067769016445, + "loss": 1.8524, + "step": 3507 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002937771551125978, + "loss": 1.851, + "step": 3508 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002937736315588636, + "loss": 1.8929, + "step": 3509 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002937701070289857, + "loss": 1.8456, + "step": 3510 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002937665815229882, + "loss": 1.906, + "step": 3511 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029376305504089486, + "loss": 1.8846, + "step": 3512 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029375952758272977, + "loss": 1.8543, + "step": 3513 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029375599914851683, + "loss": 1.8576, + "step": 3514 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029375246973828, + "loss": 1.8287, + "step": 3515 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002937489393520432, + "loss": 1.9086, + "step": 3516 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029374540798983044, + "loss": 1.9039, + "step": 3517 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029374187565166563, + "loss": 1.8332, + "step": 3518 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002937383423375729, + "loss": 1.8905, + "step": 3519 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002937348080475761, + "loss": 1.9213, + "step": 3520 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029373127278169923, + "loss": 1.8716, + "step": 3521 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002937277365399664, + "loss": 1.8542, + "step": 3522 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029372419932240156, + "loss": 1.9162, + "step": 3523 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029372066112902867, + "loss": 1.8808, + "step": 3524 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029371712195987187, + "loss": 1.8773, + "step": 3525 + }, + { + "epoch": 0.28, + "learning_rate": 0.000293713581814955, + "loss": 1.8895, + "step": 3526 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029371004069430234, + "loss": 1.8561, + "step": 3527 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029370649859793775, + "loss": 1.9307, + "step": 3528 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029370295552588537, + "loss": 1.8744, + "step": 3529 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002936994114781692, + "loss": 1.9115, + "step": 3530 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029369586645481335, + "loss": 1.85, + "step": 3531 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002936923204558418, + "loss": 1.876, + "step": 3532 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029368877348127877, + "loss": 1.8764, + "step": 3533 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029368522553114825, + "loss": 1.949, + "step": 3534 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029368167660547435, + "loss": 1.8902, + "step": 3535 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029367812670428104, + "loss": 1.8911, + "step": 3536 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029367457582759265, + "loss": 1.8589, + "step": 3537 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002936710239754332, + "loss": 1.93, + "step": 3538 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002936674711478267, + "loss": 1.9006, + "step": 3539 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002936639173447974, + "loss": 1.8288, + "step": 3540 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029366036256636935, + "loss": 1.8171, + "step": 3541 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029365680681256673, + "loss": 1.882, + "step": 3542 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029365325008341367, + "loss": 1.8096, + "step": 3543 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029364969237893434, + "loss": 1.859, + "step": 3544 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002936461336991529, + "loss": 1.8554, + "step": 3545 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029364257404409334, + "loss": 1.8722, + "step": 3546 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029363901341378007, + "loss": 1.8734, + "step": 3547 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002936354518082372, + "loss": 1.8706, + "step": 3548 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002936318892274888, + "loss": 1.8487, + "step": 3549 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002936283256715592, + "loss": 1.867, + "step": 3550 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029362476114047246, + "loss": 1.8713, + "step": 3551 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002936211956342529, + "loss": 1.8761, + "step": 3552 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029361762915292467, + "loss": 1.8966, + "step": 3553 + }, + { + "epoch": 0.28, + "learning_rate": 0.000293614061696512, + "loss": 1.8707, + "step": 3554 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002936104932650391, + "loss": 1.886, + "step": 3555 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029360692385853017, + "loss": 1.856, + "step": 3556 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002936033534770095, + "loss": 1.8474, + "step": 3557 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029359978212050136, + "loss": 1.8249, + "step": 3558 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029359620978902987, + "loss": 1.8907, + "step": 3559 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002935926364826194, + "loss": 1.943, + "step": 3560 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002935890622012941, + "loss": 1.9245, + "step": 3561 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002935854869450784, + "loss": 1.7807, + "step": 3562 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029358191071399646, + "loss": 1.855, + "step": 3563 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029357833350807257, + "loss": 1.881, + "step": 3564 + }, + { + "epoch": 0.28, + "learning_rate": 0.000293574755327331, + "loss": 1.9171, + "step": 3565 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002935711761717961, + "loss": 1.8709, + "step": 3566 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002935675960414921, + "loss": 1.8531, + "step": 3567 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029356401493644337, + "loss": 1.9297, + "step": 3568 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002935604328566743, + "loss": 1.8881, + "step": 3569 + }, + { + "epoch": 0.28, + "learning_rate": 0.000293556849802209, + "loss": 1.8073, + "step": 3570 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002935532657730719, + "loss": 1.8636, + "step": 3571 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002935496807692874, + "loss": 1.8742, + "step": 3572 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002935460947908798, + "loss": 1.9165, + "step": 3573 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029354250783787336, + "loss": 1.8862, + "step": 3574 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029353891991029256, + "loss": 1.8849, + "step": 3575 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002935353310081617, + "loss": 1.9108, + "step": 3576 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002935317411315051, + "loss": 1.8664, + "step": 3577 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002935281502803473, + "loss": 1.8549, + "step": 3578 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029352455845471246, + "loss": 1.954, + "step": 3579 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029352096565462513, + "loss": 1.8654, + "step": 3580 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029351737188010963, + "loss": 1.8706, + "step": 3581 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029351377713119037, + "loss": 1.8968, + "step": 3582 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002935101814078917, + "loss": 1.8826, + "step": 3583 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002935065847102382, + "loss": 1.8131, + "step": 3584 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029350298703825415, + "loss": 1.8454, + "step": 3585 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029349938839196395, + "loss": 1.8342, + "step": 3586 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002934957887713922, + "loss": 1.8015, + "step": 3587 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002934921881765631, + "loss": 1.8381, + "step": 3588 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002934885866075013, + "loss": 1.8396, + "step": 3589 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002934849840642312, + "loss": 1.8862, + "step": 3590 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002934813805467772, + "loss": 1.9199, + "step": 3591 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002934777760551638, + "loss": 1.914, + "step": 3592 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029347417058941553, + "loss": 1.8664, + "step": 3593 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002934705641495568, + "loss": 1.9168, + "step": 3594 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029346695673561205, + "loss": 1.9159, + "step": 3595 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029346334834760596, + "loss": 1.8855, + "step": 3596 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002934597389855628, + "loss": 1.8723, + "step": 3597 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029345612864950716, + "loss": 1.8678, + "step": 3598 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002934525173394637, + "loss": 1.8975, + "step": 3599 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002934489050554567, + "loss": 1.8561, + "step": 3600 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029344529179751083, + "loss": 1.9043, + "step": 3601 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002934416775656506, + "loss": 1.8986, + "step": 3602 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029343806235990053, + "loss": 1.8334, + "step": 3603 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002934344461802851, + "loss": 1.8342, + "step": 3604 + }, + { + "epoch": 0.28, + "learning_rate": 0.000293430829026829, + "loss": 1.8611, + "step": 3605 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029342721089955674, + "loss": 1.9098, + "step": 3606 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002934235917984929, + "loss": 1.8532, + "step": 3607 + }, + { + "epoch": 0.28, + "learning_rate": 0.000293419971723662, + "loss": 1.8854, + "step": 3608 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002934163506750886, + "loss": 1.8979, + "step": 3609 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002934127286527973, + "loss": 1.8554, + "step": 3610 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029340910565681274, + "loss": 1.8685, + "step": 3611 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002934054816871595, + "loss": 1.8516, + "step": 3612 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029340185674386215, + "loss": 1.8039, + "step": 3613 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002933982308269454, + "loss": 1.8595, + "step": 3614 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029339460393643373, + "loss": 1.8485, + "step": 3615 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029339097607235183, + "loss": 1.8735, + "step": 3616 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029338734723472436, + "loss": 1.8313, + "step": 3617 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029338371742357593, + "loss": 1.8642, + "step": 3618 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029338008663893115, + "loss": 1.8645, + "step": 3619 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029337645488081474, + "loss": 1.8799, + "step": 3620 + }, + { + "epoch": 0.28, + "learning_rate": 0.0002933728221492513, + "loss": 1.9521, + "step": 3621 + }, + { + "epoch": 0.28, + "learning_rate": 0.00029336918844426554, + "loss": 1.8684, + "step": 3622 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029336555376588213, + "loss": 1.8584, + "step": 3623 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002933619181141257, + "loss": 1.8763, + "step": 3624 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002933582814890209, + "loss": 1.8755, + "step": 3625 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002933546438905926, + "loss": 1.8664, + "step": 3626 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002933510053188653, + "loss": 1.9342, + "step": 3627 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002933473657738638, + "loss": 1.8484, + "step": 3628 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002933437252556128, + "loss": 1.8537, + "step": 3629 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029334008376413696, + "loss": 1.9305, + "step": 3630 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002933364412994611, + "loss": 1.9227, + "step": 3631 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002933327978616099, + "loss": 1.8584, + "step": 3632 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029332915345060807, + "loss": 1.913, + "step": 3633 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002933255080664804, + "loss": 1.8732, + "step": 3634 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002933218617092517, + "loss": 1.8914, + "step": 3635 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029331821437894655, + "loss": 1.8562, + "step": 3636 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002933145660755898, + "loss": 1.843, + "step": 3637 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002933109167992063, + "loss": 1.8681, + "step": 3638 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029330726654982076, + "loss": 1.8742, + "step": 3639 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002933036153274579, + "loss": 1.8609, + "step": 3640 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029329996313214263, + "loss": 1.8629, + "step": 3641 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002932963099638997, + "loss": 1.8523, + "step": 3642 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029329265582275386, + "loss": 1.8933, + "step": 3643 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029328900070872997, + "loss": 1.9499, + "step": 3644 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002932853446218529, + "loss": 1.8951, + "step": 3645 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029328168756214735, + "loss": 1.8678, + "step": 3646 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002932780295296382, + "loss": 1.9005, + "step": 3647 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002932743705243503, + "loss": 1.8513, + "step": 3648 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002932707105463085, + "loss": 1.871, + "step": 3649 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029326704959553763, + "loss": 1.8629, + "step": 3650 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029326338767206257, + "loss": 1.807, + "step": 3651 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002932597247759082, + "loss": 1.8229, + "step": 3652 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029325606090709934, + "loss": 1.8936, + "step": 3653 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002932523960656609, + "loss": 1.9024, + "step": 3654 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029324873025161766, + "loss": 1.8447, + "step": 3655 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029324506346499463, + "loss": 1.9601, + "step": 3656 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002932413957058167, + "loss": 1.8687, + "step": 3657 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002932377269741087, + "loss": 1.9304, + "step": 3658 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002932340572698956, + "loss": 1.9485, + "step": 3659 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002932303865932023, + "loss": 1.8999, + "step": 3660 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002932267149440537, + "loss": 1.8835, + "step": 3661 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029322304232247474, + "loss": 1.8453, + "step": 3662 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002932193687284904, + "loss": 1.9024, + "step": 3663 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029321569416212556, + "loss": 1.9196, + "step": 3664 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029321201862340517, + "loss": 1.8549, + "step": 3665 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002932083421123542, + "loss": 1.846, + "step": 3666 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029320466462899765, + "loss": 1.8995, + "step": 3667 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029320098617336045, + "loss": 1.8672, + "step": 3668 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002931973067454676, + "loss": 1.8632, + "step": 3669 + }, + { + "epoch": 0.29, + "learning_rate": 0.000293193626345344, + "loss": 1.8765, + "step": 3670 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029318994497301473, + "loss": 1.8119, + "step": 3671 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029318626262850474, + "loss": 1.9098, + "step": 3672 + }, + { + "epoch": 0.29, + "learning_rate": 0.000293182579311839, + "loss": 1.8964, + "step": 3673 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029317889502304266, + "loss": 1.8739, + "step": 3674 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002931752097621406, + "loss": 1.8737, + "step": 3675 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002931715235291579, + "loss": 1.9244, + "step": 3676 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002931678363241195, + "loss": 1.8508, + "step": 3677 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002931641481470505, + "loss": 1.8727, + "step": 3678 + }, + { + "epoch": 0.29, + "learning_rate": 0.000293160458997976, + "loss": 1.8213, + "step": 3679 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029315676887692094, + "loss": 1.8888, + "step": 3680 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029315307778391043, + "loss": 1.868, + "step": 3681 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002931493857189695, + "loss": 1.8432, + "step": 3682 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002931456926821233, + "loss": 1.8404, + "step": 3683 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029314199867339676, + "loss": 1.8627, + "step": 3684 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029313830369281506, + "loss": 1.8389, + "step": 3685 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002931346077404033, + "loss": 1.8675, + "step": 3686 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029313091081618653, + "loss": 1.9284, + "step": 3687 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002931272129201899, + "loss": 1.8324, + "step": 3688 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002931235140524384, + "loss": 1.8801, + "step": 3689 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002931198142129573, + "loss": 1.849, + "step": 3690 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002931161134017716, + "loss": 1.8711, + "step": 3691 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002931124116189065, + "loss": 1.8488, + "step": 3692 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029310870886438704, + "loss": 1.8538, + "step": 3693 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029310500513823846, + "loss": 1.8574, + "step": 3694 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029310130044048584, + "loss": 1.8426, + "step": 3695 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002930975947711544, + "loss": 1.8836, + "step": 3696 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002930938881302692, + "loss": 1.8923, + "step": 3697 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002930901805178555, + "loss": 1.7752, + "step": 3698 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002930864719339385, + "loss": 1.8493, + "step": 3699 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002930827623785432, + "loss": 1.9699, + "step": 3700 + }, + { + "epoch": 0.29, + "learning_rate": 0.000293079051851695, + "loss": 1.9114, + "step": 3701 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029307534035341896, + "loss": 1.817, + "step": 3702 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029307162788374033, + "loss": 1.8532, + "step": 3703 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029306791444268427, + "loss": 1.8903, + "step": 3704 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029306420003027603, + "loss": 1.8512, + "step": 3705 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002930604846465408, + "loss": 1.8428, + "step": 3706 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002930567682915039, + "loss": 1.8498, + "step": 3707 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029305305096519044, + "loss": 1.8865, + "step": 3708 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029304933266762574, + "loss": 1.8317, + "step": 3709 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029304561339883495, + "loss": 1.9021, + "step": 3710 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029304189315884345, + "loss": 1.8995, + "step": 3711 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029303817194767633, + "loss": 1.8306, + "step": 3712 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002930344497653591, + "loss": 1.8712, + "step": 3713 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002930307266119168, + "loss": 1.829, + "step": 3714 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029302700248737474, + "loss": 1.8647, + "step": 3715 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002930232773917584, + "loss": 1.904, + "step": 3716 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029301955132509283, + "loss": 1.9531, + "step": 3717 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029301582428740346, + "loss": 1.8748, + "step": 3718 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029301209627871557, + "loss": 1.8884, + "step": 3719 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002930083672990545, + "loss": 1.856, + "step": 3720 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002930046373484455, + "loss": 1.8899, + "step": 3721 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029300090642691396, + "loss": 1.8595, + "step": 3722 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029299717453448514, + "loss": 1.8795, + "step": 3723 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002929934416711844, + "loss": 1.8924, + "step": 3724 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029298970783703715, + "loss": 1.8829, + "step": 3725 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029298597303206866, + "loss": 1.92, + "step": 3726 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029298223725630435, + "loss": 1.869, + "step": 3727 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029297850050976953, + "loss": 1.8094, + "step": 3728 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002929747627924896, + "loss": 1.8565, + "step": 3729 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029297102410448994, + "loss": 1.9086, + "step": 3730 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002929672844457959, + "loss": 1.8268, + "step": 3731 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029296354381643295, + "loss": 1.8803, + "step": 3732 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029295980221642634, + "loss": 1.844, + "step": 3733 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002929560596458016, + "loss": 1.8213, + "step": 3734 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029295231610458416, + "loss": 1.8576, + "step": 3735 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029294857159279937, + "loss": 1.8814, + "step": 3736 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002929448261104726, + "loss": 1.8101, + "step": 3737 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002929410796576294, + "loss": 1.874, + "step": 3738 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029293733223429515, + "loss": 1.874, + "step": 3739 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029293358384049526, + "loss": 1.862, + "step": 3740 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002929298344762552, + "loss": 1.888, + "step": 3741 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002929260841416005, + "loss": 1.8313, + "step": 3742 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029292233283655653, + "loss": 1.8884, + "step": 3743 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002929185805611488, + "loss": 1.7404, + "step": 3744 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029291482731540273, + "loss": 1.8953, + "step": 3745 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002929110730993439, + "loss": 1.8435, + "step": 3746 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002929073179129977, + "loss": 1.8881, + "step": 3747 + }, + { + "epoch": 0.29, + "learning_rate": 0.00029290356175638973, + "loss": 1.8059, + "step": 3748 + }, + { + "epoch": 0.29, + "learning_rate": 0.0002928998046295454, + "loss": 1.8443, + "step": 3749 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029289604653249027, + "loss": 1.8498, + "step": 3750 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029289228746524985, + "loss": 1.8566, + "step": 3751 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029288852742784965, + "loss": 1.8801, + "step": 3752 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002928847664203152, + "loss": 1.8613, + "step": 3753 + }, + { + "epoch": 0.3, + "learning_rate": 0.000292881004442672, + "loss": 1.8941, + "step": 3754 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002928772414949457, + "loss": 1.8492, + "step": 3755 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002928734775771617, + "loss": 1.9005, + "step": 3756 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002928697126893457, + "loss": 1.7973, + "step": 3757 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002928659468315232, + "loss": 1.8703, + "step": 3758 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002928621800037197, + "loss": 1.8873, + "step": 3759 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029285841220596083, + "loss": 1.859, + "step": 3760 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029285464343827217, + "loss": 1.8958, + "step": 3761 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002928508737006794, + "loss": 1.8631, + "step": 3762 + }, + { + "epoch": 0.3, + "learning_rate": 0.000292847102993208, + "loss": 1.8544, + "step": 3763 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029284333131588357, + "loss": 1.818, + "step": 3764 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029283955866873175, + "loss": 1.8751, + "step": 3765 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002928357850517781, + "loss": 1.8155, + "step": 3766 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002928320104650484, + "loss": 1.8479, + "step": 3767 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002928282349085681, + "loss": 1.8124, + "step": 3768 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029282445838236295, + "loss": 1.8426, + "step": 3769 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002928206808864585, + "loss": 1.8849, + "step": 3770 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002928169024208805, + "loss": 1.9025, + "step": 3771 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029281312298565443, + "loss": 1.862, + "step": 3772 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029280934258080617, + "loss": 1.8482, + "step": 3773 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029280556120636126, + "loss": 1.8786, + "step": 3774 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002928017788623454, + "loss": 1.8973, + "step": 3775 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002927979955487843, + "loss": 1.8699, + "step": 3776 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029279421126570353, + "loss": 1.9402, + "step": 3777 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002927904260131289, + "loss": 1.8483, + "step": 3778 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029278663979108606, + "loss": 1.8662, + "step": 3779 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002927828525996008, + "loss": 1.8614, + "step": 3780 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002927790644386987, + "loss": 1.8215, + "step": 3781 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002927752753084055, + "loss": 1.8448, + "step": 3782 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002927714852087471, + "loss": 1.8519, + "step": 3783 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029276769413974903, + "loss": 1.872, + "step": 3784 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002927639021014371, + "loss": 1.8297, + "step": 3785 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002927601090938371, + "loss": 1.8768, + "step": 3786 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029275631511697464, + "loss": 1.7995, + "step": 3787 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002927525201708757, + "loss": 1.8407, + "step": 3788 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029274872425556585, + "loss": 1.8582, + "step": 3789 + }, + { + "epoch": 0.3, + "learning_rate": 0.000292744927371071, + "loss": 1.8628, + "step": 3790 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029274112951741676, + "loss": 1.9647, + "step": 3791 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002927373306946291, + "loss": 1.868, + "step": 3792 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002927335309027337, + "loss": 1.8726, + "step": 3793 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029272973014175644, + "loss": 1.9098, + "step": 3794 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029272592841172307, + "loss": 1.8364, + "step": 3795 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002927221257126594, + "loss": 1.8256, + "step": 3796 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002927183220445912, + "loss": 1.8944, + "step": 3797 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002927145174075444, + "loss": 1.8338, + "step": 3798 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002927107118015448, + "loss": 1.8852, + "step": 3799 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002927069052266182, + "loss": 1.8298, + "step": 3800 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029270309768279046, + "loss": 1.9146, + "step": 3801 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029269928917008745, + "loss": 1.8635, + "step": 3802 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029269547968853503, + "loss": 1.8426, + "step": 3803 + }, + { + "epoch": 0.3, + "learning_rate": 0.000292691669238159, + "loss": 1.8323, + "step": 3804 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029268785781898536, + "loss": 1.8685, + "step": 3805 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002926840454310398, + "loss": 1.891, + "step": 3806 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029268023207434837, + "loss": 1.8702, + "step": 3807 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002926764177489369, + "loss": 1.8591, + "step": 3808 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002926726024548313, + "loss": 1.8911, + "step": 3809 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029266878619205747, + "loss": 1.8056, + "step": 3810 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029266496896064126, + "loss": 1.8174, + "step": 3811 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029266115076060874, + "loss": 1.8177, + "step": 3812 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002926573315919856, + "loss": 1.8485, + "step": 3813 + }, + { + "epoch": 0.3, + "learning_rate": 0.000292653511454798, + "loss": 1.8721, + "step": 3814 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029264969034907177, + "loss": 1.8445, + "step": 3815 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002926458682748328, + "loss": 1.8361, + "step": 3816 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029264204523210714, + "loss": 1.8296, + "step": 3817 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029263822122092077, + "loss": 1.855, + "step": 3818 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029263439624129954, + "loss": 1.8652, + "step": 3819 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002926305702932694, + "loss": 1.8488, + "step": 3820 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002926267433768565, + "loss": 1.8527, + "step": 3821 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002926229154920867, + "loss": 1.8861, + "step": 3822 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029261908663898595, + "loss": 1.8709, + "step": 3823 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002926152568175804, + "loss": 1.8831, + "step": 3824 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029261142602789587, + "loss": 1.8761, + "step": 3825 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029260759426995856, + "loss": 1.8517, + "step": 3826 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002926037615437943, + "loss": 1.9022, + "step": 3827 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029259992784942923, + "loss": 1.806, + "step": 3828 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002925960931868893, + "loss": 1.8691, + "step": 3829 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002925922575562006, + "loss": 1.8473, + "step": 3830 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002925884209573892, + "loss": 1.8514, + "step": 3831 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002925845833904811, + "loss": 1.8955, + "step": 3832 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002925807448555023, + "loss": 1.8709, + "step": 3833 + }, + { + "epoch": 0.3, + "learning_rate": 0.000292576905352479, + "loss": 1.8448, + "step": 3834 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029257306488143716, + "loss": 1.8075, + "step": 3835 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002925692234424029, + "loss": 1.8762, + "step": 3836 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029256538103540223, + "loss": 1.8292, + "step": 3837 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029256153766046134, + "loss": 1.9507, + "step": 3838 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002925576933176063, + "loss": 1.8035, + "step": 3839 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002925538480068632, + "loss": 1.8466, + "step": 3840 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029255000172825814, + "loss": 1.8564, + "step": 3841 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029254615448181723, + "loss": 1.9127, + "step": 3842 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029254230626756656, + "loss": 1.9008, + "step": 3843 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002925384570855323, + "loss": 1.891, + "step": 3844 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002925346069357406, + "loss": 1.8517, + "step": 3845 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002925307558182175, + "loss": 1.8328, + "step": 3846 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029252690373298936, + "loss": 1.8778, + "step": 3847 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002925230506800821, + "loss": 1.849, + "step": 3848 + }, + { + "epoch": 0.3, + "learning_rate": 0.000292519196659522, + "loss": 1.7949, + "step": 3849 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002925153416713352, + "loss": 1.8621, + "step": 3850 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002925114857155479, + "loss": 1.8169, + "step": 3851 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029250762879218624, + "loss": 1.8617, + "step": 3852 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002925037709012764, + "loss": 1.8635, + "step": 3853 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002924999120428446, + "loss": 1.7654, + "step": 3854 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029249605221691704, + "loss": 1.9275, + "step": 3855 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029249219142351993, + "loss": 1.827, + "step": 3856 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029248832966267946, + "loss": 1.8968, + "step": 3857 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002924844669344219, + "loss": 1.8314, + "step": 3858 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002924806032387734, + "loss": 1.8248, + "step": 3859 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029247673857576024, + "loss": 1.8873, + "step": 3860 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002924728729454087, + "loss": 1.9098, + "step": 3861 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029246900634774493, + "loss": 1.8833, + "step": 3862 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002924651387827952, + "loss": 1.7776, + "step": 3863 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029246127025058584, + "loss": 1.8054, + "step": 3864 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002924574007511431, + "loss": 1.8603, + "step": 3865 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029245353028449316, + "loss": 1.8335, + "step": 3866 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029244965885066236, + "loss": 1.8673, + "step": 3867 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029244578644967704, + "loss": 1.8386, + "step": 3868 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002924419130815634, + "loss": 1.8698, + "step": 3869 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029243803874634777, + "loss": 1.8466, + "step": 3870 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029243416344405647, + "loss": 1.8565, + "step": 3871 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002924302871747158, + "loss": 1.8851, + "step": 3872 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002924264099383521, + "loss": 1.867, + "step": 3873 + }, + { + "epoch": 0.3, + "learning_rate": 0.0002924225317349917, + "loss": 1.8581, + "step": 3874 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029241865256466085, + "loss": 1.7993, + "step": 3875 + }, + { + "epoch": 0.3, + "learning_rate": 0.00029241477242738595, + "loss": 1.8271, + "step": 3876 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002924108913231933, + "loss": 1.8794, + "step": 3877 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002924070092521094, + "loss": 1.825, + "step": 3878 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029240312621416043, + "loss": 1.8561, + "step": 3879 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002923992422093728, + "loss": 1.8898, + "step": 3880 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002923953572377729, + "loss": 1.8193, + "step": 3881 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002923914712993871, + "loss": 1.8735, + "step": 3882 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002923875843942418, + "loss": 1.8743, + "step": 3883 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002923836965223634, + "loss": 1.8592, + "step": 3884 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029237980768377826, + "loss": 1.836, + "step": 3885 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029237591787851277, + "loss": 1.8578, + "step": 3886 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002923720271065934, + "loss": 1.9073, + "step": 3887 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002923681353680465, + "loss": 1.8586, + "step": 3888 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029236424266289855, + "loss": 1.8829, + "step": 3889 + }, + { + "epoch": 0.31, + "learning_rate": 0.000292360348991176, + "loss": 1.8403, + "step": 3890 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029235645435290514, + "loss": 1.8738, + "step": 3891 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002923525587481126, + "loss": 1.8652, + "step": 3892 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002923486621768247, + "loss": 1.8696, + "step": 3893 + }, + { + "epoch": 0.31, + "learning_rate": 0.000292344764639068, + "loss": 1.8699, + "step": 3894 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029234086613486883, + "loss": 1.8729, + "step": 3895 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002923369666642537, + "loss": 1.8534, + "step": 3896 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002923330662272492, + "loss": 1.8687, + "step": 3897 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002923291648238817, + "loss": 1.8479, + "step": 3898 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002923252624541777, + "loss": 1.8802, + "step": 3899 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002923213591181637, + "loss": 1.9133, + "step": 3900 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029231745481586623, + "loss": 1.8672, + "step": 3901 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002923135495473118, + "loss": 1.8673, + "step": 3902 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002923096433125269, + "loss": 1.836, + "step": 3903 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029230573611153796, + "loss": 1.8305, + "step": 3904 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002923018279443717, + "loss": 1.8459, + "step": 3905 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029229791881105454, + "loss": 1.8325, + "step": 3906 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029229400871161305, + "loss": 1.8472, + "step": 3907 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029229009764607374, + "loss": 1.902, + "step": 3908 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002922861856144632, + "loss": 1.8051, + "step": 3909 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029228227261680797, + "loss": 1.8509, + "step": 3910 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002922783586531346, + "loss": 1.813, + "step": 3911 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002922744437234698, + "loss": 1.8315, + "step": 3912 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029227052782783994, + "loss": 1.8752, + "step": 3913 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002922666109662717, + "loss": 1.8564, + "step": 3914 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029226269313879175, + "loss": 1.8519, + "step": 3915 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029225877434542653, + "loss": 1.8184, + "step": 3916 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002922548545862028, + "loss": 1.8716, + "step": 3917 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029225093386114713, + "loss": 1.8202, + "step": 3918 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029224701217028603, + "loss": 1.8966, + "step": 3919 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002922430895136463, + "loss": 1.8506, + "step": 3920 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002922391658912545, + "loss": 1.8691, + "step": 3921 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002922352413031372, + "loss": 1.8436, + "step": 3922 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002922313157493211, + "loss": 1.792, + "step": 3923 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029222738922983293, + "loss": 1.7931, + "step": 3924 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002922234617446992, + "loss": 1.754, + "step": 3925 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002922195332939467, + "loss": 1.8874, + "step": 3926 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029221560387760197, + "loss": 1.8813, + "step": 3927 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029221167349569185, + "loss": 1.9105, + "step": 3928 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029220774214824293, + "loss": 1.856, + "step": 3929 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002922038098352819, + "loss": 1.844, + "step": 3930 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029219987655683546, + "loss": 1.7764, + "step": 3931 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002921959423129304, + "loss": 1.8349, + "step": 3932 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002921920071035933, + "loss": 1.8148, + "step": 3933 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029218807092885093, + "loss": 1.8308, + "step": 3934 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002921841337887301, + "loss": 1.8505, + "step": 3935 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002921801956832574, + "loss": 1.8759, + "step": 3936 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029217625661245964, + "loss": 1.8894, + "step": 3937 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002921723165763636, + "loss": 1.8152, + "step": 3938 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029216837557499595, + "loss": 1.8482, + "step": 3939 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029216443360838344, + "loss": 1.8373, + "step": 3940 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029216049067655296, + "loss": 1.8775, + "step": 3941 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002921565467795312, + "loss": 1.8865, + "step": 3942 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002921526019173449, + "loss": 1.8498, + "step": 3943 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029214865609002085, + "loss": 1.8118, + "step": 3944 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029214470929758593, + "loss": 1.7787, + "step": 3945 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002921407615400668, + "loss": 1.7834, + "step": 3946 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002921368128174904, + "loss": 1.8167, + "step": 3947 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002921328631298835, + "loss": 1.8576, + "step": 3948 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029212891247727284, + "loss": 1.9214, + "step": 3949 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002921249608596853, + "loss": 1.7998, + "step": 3950 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029212100827714774, + "loss": 1.8263, + "step": 3951 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002921170547296869, + "loss": 1.8745, + "step": 3952 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002921131002173298, + "loss": 1.8482, + "step": 3953 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029210914474010307, + "loss": 1.812, + "step": 3954 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002921051882980337, + "loss": 1.866, + "step": 3955 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002921012308911486, + "loss": 1.8698, + "step": 3956 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029209727251947444, + "loss": 1.788, + "step": 3957 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029209331318303826, + "loss": 1.893, + "step": 3958 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002920893528818669, + "loss": 1.8802, + "step": 3959 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029208539161598723, + "loss": 1.8526, + "step": 3960 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002920814293854262, + "loss": 1.8823, + "step": 3961 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029207746619021064, + "loss": 1.7869, + "step": 3962 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029207350203036753, + "loss": 1.8271, + "step": 3963 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002920695369059237, + "loss": 1.8507, + "step": 3964 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002920655708169061, + "loss": 1.8458, + "step": 3965 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002920616037633417, + "loss": 1.8248, + "step": 3966 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002920576357452574, + "loss": 1.8375, + "step": 3967 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002920536667626802, + "loss": 1.8705, + "step": 3968 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002920496968156369, + "loss": 1.8758, + "step": 3969 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002920457259041546, + "loss": 1.9331, + "step": 3970 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029204175402826023, + "loss": 1.88, + "step": 3971 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029203778118798066, + "loss": 1.8081, + "step": 3972 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029203380738334304, + "loss": 1.8194, + "step": 3973 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029202983261437417, + "loss": 1.766, + "step": 3974 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002920258568811012, + "loss": 1.8967, + "step": 3975 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002920218801835509, + "loss": 1.841, + "step": 3976 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002920179025217505, + "loss": 1.8461, + "step": 3977 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002920139238957269, + "loss": 1.8234, + "step": 3978 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002920099443055071, + "loss": 1.836, + "step": 3979 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002920059637511182, + "loss": 1.8956, + "step": 3980 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002920019822325871, + "loss": 1.8424, + "step": 3981 + }, + { + "epoch": 0.31, + "learning_rate": 0.000291997999749941, + "loss": 1.9107, + "step": 3982 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002919940163032068, + "loss": 1.8974, + "step": 3983 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029199003189241156, + "loss": 1.8247, + "step": 3984 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029198604651758237, + "loss": 1.8514, + "step": 3985 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002919820601787463, + "loss": 1.8121, + "step": 3986 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029197807287593036, + "loss": 1.8386, + "step": 3987 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002919740846091617, + "loss": 1.8565, + "step": 3988 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029197009537846734, + "loss": 1.8284, + "step": 3989 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029196610518387436, + "loss": 1.8269, + "step": 3990 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002919621140254099, + "loss": 1.8224, + "step": 3991 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029195812190310093, + "loss": 1.9385, + "step": 3992 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029195412881697475, + "loss": 1.8048, + "step": 3993 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002919501347670583, + "loss": 1.8459, + "step": 3994 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029194613975337886, + "loss": 1.8197, + "step": 3995 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002919421437759634, + "loss": 1.8354, + "step": 3996 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029193814683483915, + "loss": 1.9004, + "step": 3997 + }, + { + "epoch": 0.31, + "learning_rate": 0.00029193414893003317, + "loss": 1.7746, + "step": 3998 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002919301500615727, + "loss": 1.8108, + "step": 3999 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002919261502294848, + "loss": 1.8784, + "step": 4000 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002919221494337967, + "loss": 1.8941, + "step": 4001 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002919181476745355, + "loss": 1.8358, + "step": 4002 + }, + { + "epoch": 0.31, + "learning_rate": 0.0002919141449517283, + "loss": 1.8212, + "step": 4003 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002919101412654025, + "loss": 1.8864, + "step": 4004 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002919061366155851, + "loss": 1.7775, + "step": 4005 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002919021310023034, + "loss": 1.8573, + "step": 4006 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029189812442558444, + "loss": 1.8247, + "step": 4007 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029189411688545553, + "loss": 1.8642, + "step": 4008 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029189010838194393, + "loss": 1.841, + "step": 4009 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029188609891507675, + "loss": 1.831, + "step": 4010 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002918820884848813, + "loss": 1.8106, + "step": 4011 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002918780770913848, + "loss": 1.8883, + "step": 4012 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002918740647346144, + "loss": 1.8233, + "step": 4013 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029187005141459736, + "loss": 1.883, + "step": 4014 + }, + { + "epoch": 0.32, + "learning_rate": 0.000291866037131361, + "loss": 1.8002, + "step": 4015 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002918620218849325, + "loss": 1.8493, + "step": 4016 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002918580056753392, + "loss": 1.9019, + "step": 4017 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029185398850260834, + "loss": 1.7938, + "step": 4018 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029184997036676714, + "loss": 1.8758, + "step": 4019 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002918459512678429, + "loss": 1.8069, + "step": 4020 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029184193120586295, + "loss": 1.8404, + "step": 4021 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002918379101808546, + "loss": 1.8332, + "step": 4022 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002918338881928451, + "loss": 1.8537, + "step": 4023 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029182986524186173, + "loss": 1.8362, + "step": 4024 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002918258413279319, + "loss": 1.8644, + "step": 4025 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029182181645108284, + "loss": 1.8967, + "step": 4026 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002918177906113419, + "loss": 1.8725, + "step": 4027 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002918137638087364, + "loss": 1.8226, + "step": 4028 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002918097360432938, + "loss": 1.8286, + "step": 4029 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029180570731504124, + "loss": 1.8321, + "step": 4030 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002918016776240063, + "loss": 1.8105, + "step": 4031 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002917976469702161, + "loss": 1.8254, + "step": 4032 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029179361535369816, + "loss": 1.8631, + "step": 4033 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029178958277447986, + "loss": 1.8273, + "step": 4034 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002917855492325885, + "loss": 1.9059, + "step": 4035 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029178151472805154, + "loss": 1.8697, + "step": 4036 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002917774792608963, + "loss": 1.8206, + "step": 4037 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002917734428311503, + "loss": 1.9014, + "step": 4038 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002917694054388407, + "loss": 1.8889, + "step": 4039 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002917653670839952, + "loss": 1.9107, + "step": 4040 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029176132776664106, + "loss": 1.8929, + "step": 4041 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002917572874868057, + "loss": 1.869, + "step": 4042 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002917532462445166, + "loss": 1.7673, + "step": 4043 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002917492040398012, + "loss": 1.8571, + "step": 4044 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029174516087268696, + "loss": 1.8239, + "step": 4045 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029174111674320124, + "loss": 1.8069, + "step": 4046 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029173707165137166, + "loss": 1.8707, + "step": 4047 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002917330255972254, + "loss": 1.7801, + "step": 4048 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002917289785807903, + "loss": 1.8641, + "step": 4049 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029172493060209353, + "loss": 1.8494, + "step": 4050 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029172088166116273, + "loss": 1.869, + "step": 4051 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002917168317580253, + "loss": 1.8661, + "step": 4052 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029171278089270886, + "loss": 1.8223, + "step": 4053 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029170872906524086, + "loss": 1.8009, + "step": 4054 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002917046762756487, + "loss": 1.8605, + "step": 4055 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029170062252396005, + "loss": 1.801, + "step": 4056 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002916965678102024, + "loss": 1.7711, + "step": 4057 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029169251213440316, + "loss": 1.8264, + "step": 4058 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029168845549659, + "loss": 1.8734, + "step": 4059 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029168439789679045, + "loss": 1.8102, + "step": 4060 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029168033933503197, + "loss": 1.8516, + "step": 4061 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029167627981134216, + "loss": 1.8598, + "step": 4062 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002916722193257487, + "loss": 1.8482, + "step": 4063 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029166815787827895, + "loss": 1.8691, + "step": 4064 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002916640954689606, + "loss": 1.831, + "step": 4065 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002916600320978212, + "loss": 1.8533, + "step": 4066 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002916559677648884, + "loss": 1.8217, + "step": 4067 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029165190247018975, + "loss": 1.8062, + "step": 4068 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029164783621375283, + "loss": 1.8218, + "step": 4069 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002916437689956053, + "loss": 1.8081, + "step": 4070 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002916397008157747, + "loss": 1.8535, + "step": 4071 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002916356316742887, + "loss": 1.8399, + "step": 4072 + }, + { + "epoch": 0.32, + "learning_rate": 0.000291631561571175, + "loss": 1.8312, + "step": 4073 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002916274905064611, + "loss": 1.8797, + "step": 4074 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002916234184801747, + "loss": 1.829, + "step": 4075 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002916193454923434, + "loss": 1.8422, + "step": 4076 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029161527154299496, + "loss": 1.829, + "step": 4077 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029161119663215695, + "loss": 1.8705, + "step": 4078 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029160712075985707, + "loss": 1.8188, + "step": 4079 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029160304392612297, + "loss": 1.8445, + "step": 4080 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029159896613098235, + "loss": 1.8625, + "step": 4081 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002915948873744629, + "loss": 1.861, + "step": 4082 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002915908076565923, + "loss": 1.7897, + "step": 4083 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029158672697739824, + "loss": 1.8442, + "step": 4084 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029158264533690845, + "loss": 1.8126, + "step": 4085 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029157856273515065, + "loss": 1.831, + "step": 4086 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002915744791721525, + "loss": 1.825, + "step": 4087 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029157039464794177, + "loss": 1.7813, + "step": 4088 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002915663091625462, + "loss": 1.8904, + "step": 4089 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029156222271599347, + "loss": 1.8006, + "step": 4090 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029155813530831146, + "loss": 1.854, + "step": 4091 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002915540469395278, + "loss": 1.8102, + "step": 4092 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002915499576096702, + "loss": 1.8208, + "step": 4093 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002915458673187666, + "loss": 1.8729, + "step": 4094 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002915417760668446, + "loss": 1.8474, + "step": 4095 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002915376838539321, + "loss": 1.8308, + "step": 4096 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002915335906800568, + "loss": 1.8787, + "step": 4097 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029152949654524655, + "loss": 1.8052, + "step": 4098 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002915254014495291, + "loss": 1.8795, + "step": 4099 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029152130539293223, + "loss": 1.843, + "step": 4100 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002915172083754839, + "loss": 1.7879, + "step": 4101 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029151311039721174, + "loss": 1.8492, + "step": 4102 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002915090114581437, + "loss": 1.7961, + "step": 4103 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002915049115583075, + "loss": 1.7987, + "step": 4104 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002915008106977311, + "loss": 1.8618, + "step": 4105 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002914967088764423, + "loss": 1.7986, + "step": 4106 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029149260609446885, + "loss": 1.8141, + "step": 4107 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029148850235183874, + "loss": 1.8139, + "step": 4108 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029148439764857976, + "loss": 1.8282, + "step": 4109 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029148029198471987, + "loss": 1.8518, + "step": 4110 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002914761853602868, + "loss": 1.8444, + "step": 4111 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029147207777530847, + "loss": 1.8058, + "step": 4112 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029146796922981284, + "loss": 1.8284, + "step": 4113 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029146385972382777, + "loss": 1.8588, + "step": 4114 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029145974925738117, + "loss": 1.8134, + "step": 4115 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029145563783050096, + "loss": 1.8373, + "step": 4116 + }, + { + "epoch": 0.32, + "learning_rate": 0.000291451525443215, + "loss": 1.8968, + "step": 4117 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002914474120955512, + "loss": 1.799, + "step": 4118 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002914432977875376, + "loss": 1.7743, + "step": 4119 + }, + { + "epoch": 0.32, + "learning_rate": 0.000291439182519202, + "loss": 1.8609, + "step": 4120 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029143506629057247, + "loss": 1.8867, + "step": 4121 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002914309491016769, + "loss": 1.8184, + "step": 4122 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002914268309525431, + "loss": 1.8403, + "step": 4123 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002914227118431993, + "loss": 1.8511, + "step": 4124 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002914185917736733, + "loss": 1.8529, + "step": 4125 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002914144707439931, + "loss": 1.7788, + "step": 4126 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029141034875418664, + "loss": 1.8259, + "step": 4127 + }, + { + "epoch": 0.32, + "learning_rate": 0.000291406225804282, + "loss": 1.8663, + "step": 4128 + }, + { + "epoch": 0.32, + "learning_rate": 0.0002914021018943071, + "loss": 1.8524, + "step": 4129 + }, + { + "epoch": 0.32, + "learning_rate": 0.00029139797702428997, + "loss": 1.8832, + "step": 4130 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002913938511942586, + "loss": 1.8616, + "step": 4131 + }, + { + "epoch": 0.33, + "learning_rate": 0.000291389724404241, + "loss": 1.796, + "step": 4132 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002913855966542652, + "loss": 1.8471, + "step": 4133 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002913814679443592, + "loss": 1.8312, + "step": 4134 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029137733827455106, + "loss": 1.8372, + "step": 4135 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029137320764486885, + "loss": 1.8746, + "step": 4136 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029136907605534055, + "loss": 1.8767, + "step": 4137 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029136494350599426, + "loss": 1.848, + "step": 4138 + }, + { + "epoch": 0.33, + "learning_rate": 0.000291360809996858, + "loss": 1.8281, + "step": 4139 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029135667552795984, + "loss": 1.8494, + "step": 4140 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002913525400993279, + "loss": 1.8843, + "step": 4141 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002913484037109902, + "loss": 1.818, + "step": 4142 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002913442663629748, + "loss": 1.8777, + "step": 4143 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002913401280553098, + "loss": 1.8435, + "step": 4144 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002913359887880234, + "loss": 1.8298, + "step": 4145 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029133184856114364, + "loss": 1.874, + "step": 4146 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002913277073746986, + "loss": 1.8049, + "step": 4147 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029132356522871644, + "loss": 1.8207, + "step": 4148 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002913194221232252, + "loss": 1.7602, + "step": 4149 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002913152780582531, + "loss": 1.8272, + "step": 4150 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002913111330338283, + "loss": 1.8178, + "step": 4151 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029130698704997877, + "loss": 1.8068, + "step": 4152 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002913028401067329, + "loss": 1.858, + "step": 4153 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002912986922041187, + "loss": 1.8408, + "step": 4154 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002912945433421643, + "loss": 1.8582, + "step": 4155 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002912903935208979, + "loss": 1.8121, + "step": 4156 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002912862427403478, + "loss": 1.8696, + "step": 4157 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029128209100054203, + "loss": 1.8336, + "step": 4158 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002912779383015088, + "loss": 1.8118, + "step": 4159 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002912737846432764, + "loss": 1.7618, + "step": 4160 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002912696300258729, + "loss": 1.8081, + "step": 4161 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002912654744493266, + "loss": 1.8034, + "step": 4162 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002912613179136657, + "loss": 1.8218, + "step": 4163 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002912571604189184, + "loss": 1.8221, + "step": 4164 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002912530019651129, + "loss": 1.8499, + "step": 4165 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002912488425522775, + "loss": 1.8563, + "step": 4166 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029124468218044036, + "loss": 1.7936, + "step": 4167 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002912405208496298, + "loss": 1.805, + "step": 4168 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029123635855987407, + "loss": 1.7759, + "step": 4169 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002912321953112014, + "loss": 1.8069, + "step": 4170 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029122803110364005, + "loss": 1.8892, + "step": 4171 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029122386593721827, + "loss": 1.8237, + "step": 4172 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029121969981196446, + "loss": 1.7786, + "step": 4173 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029121553272790676, + "loss": 1.8107, + "step": 4174 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002912113646850735, + "loss": 1.8354, + "step": 4175 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029120719568349304, + "loss": 1.86, + "step": 4176 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029120302572319367, + "loss": 1.8529, + "step": 4177 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002911988548042036, + "loss": 1.7874, + "step": 4178 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002911946829265513, + "loss": 1.836, + "step": 4179 + }, + { + "epoch": 0.33, + "learning_rate": 0.000291190510090265, + "loss": 1.8618, + "step": 4180 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029118633629537303, + "loss": 1.8012, + "step": 4181 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029118216154190373, + "loss": 1.8393, + "step": 4182 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002911779858298855, + "loss": 1.8042, + "step": 4183 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002911738091593467, + "loss": 1.8809, + "step": 4184 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002911696315303156, + "loss": 1.8068, + "step": 4185 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002911654529428206, + "loss": 1.8328, + "step": 4186 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002911612733968901, + "loss": 1.8476, + "step": 4187 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002911570928925524, + "loss": 1.8387, + "step": 4188 + }, + { + "epoch": 0.33, + "learning_rate": 0.000291152911429836, + "loss": 1.8801, + "step": 4189 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002911487290087692, + "loss": 1.8209, + "step": 4190 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029114454562938034, + "loss": 1.7969, + "step": 4191 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029114036129169796, + "loss": 1.8709, + "step": 4192 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029113617599575047, + "loss": 1.8111, + "step": 4193 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002911319897415662, + "loss": 1.8563, + "step": 4194 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029112780252917356, + "loss": 1.8322, + "step": 4195 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002911236143586011, + "loss": 1.8328, + "step": 4196 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029111942522987714, + "loss": 1.7964, + "step": 4197 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029111523514303015, + "loss": 1.8114, + "step": 4198 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029111104409808856, + "loss": 1.7836, + "step": 4199 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029110685209508087, + "loss": 1.8988, + "step": 4200 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002911026591340356, + "loss": 1.857, + "step": 4201 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029109846521498106, + "loss": 1.8582, + "step": 4202 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002910942703379458, + "loss": 1.8068, + "step": 4203 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029109007450295836, + "loss": 1.855, + "step": 4204 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002910858777100471, + "loss": 1.8123, + "step": 4205 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029108167995924066, + "loss": 1.7877, + "step": 4206 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029107748125056744, + "loss": 1.8181, + "step": 4207 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029107328158405597, + "loss": 1.7782, + "step": 4208 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029106908095973477, + "loss": 1.8343, + "step": 4209 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029106487937763235, + "loss": 1.8644, + "step": 4210 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002910606768377772, + "loss": 1.8457, + "step": 4211 + }, + { + "epoch": 0.33, + "learning_rate": 0.000291056473340198, + "loss": 1.8691, + "step": 4212 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029105226888492315, + "loss": 1.807, + "step": 4213 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002910480634719813, + "loss": 1.7869, + "step": 4214 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002910438571014008, + "loss": 1.8054, + "step": 4215 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029103964977321043, + "loss": 1.8824, + "step": 4216 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029103544148743866, + "loss": 1.8224, + "step": 4217 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029103123224411405, + "loss": 1.7749, + "step": 4218 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029102702204326523, + "loss": 1.8223, + "step": 4219 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002910228108849207, + "loss": 1.8212, + "step": 4220 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029101859876910915, + "loss": 1.8501, + "step": 4221 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002910143856958591, + "loss": 1.8461, + "step": 4222 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002910101716651992, + "loss": 1.8615, + "step": 4223 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002910059566771581, + "loss": 1.8132, + "step": 4224 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002910017407317644, + "loss": 1.7694, + "step": 4225 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002909975238290466, + "loss": 1.7711, + "step": 4226 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029099330596903345, + "loss": 1.7787, + "step": 4227 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002909890871517535, + "loss": 1.7833, + "step": 4228 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002909848673772355, + "loss": 1.8842, + "step": 4229 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002909806466455081, + "loss": 1.8106, + "step": 4230 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029097642495659983, + "loss": 1.7507, + "step": 4231 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002909722023105395, + "loss": 1.844, + "step": 4232 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002909679787073557, + "loss": 1.7649, + "step": 4233 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029096375414707713, + "loss": 1.8291, + "step": 4234 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002909595286297324, + "loss": 1.8187, + "step": 4235 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002909553021553503, + "loss": 1.8326, + "step": 4236 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029095107472395946, + "loss": 1.8635, + "step": 4237 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002909468463355886, + "loss": 1.7067, + "step": 4238 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002909426169902665, + "loss": 1.8186, + "step": 4239 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029093838668802174, + "loss": 1.7843, + "step": 4240 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002909341554288831, + "loss": 1.8909, + "step": 4241 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002909299232128794, + "loss": 1.8162, + "step": 4242 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029092569004003925, + "loss": 1.7874, + "step": 4243 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029092145591039145, + "loss": 1.8336, + "step": 4244 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029091722082396466, + "loss": 1.8947, + "step": 4245 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002909129847807878, + "loss": 1.858, + "step": 4246 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029090874778088944, + "loss": 1.842, + "step": 4247 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029090450982429853, + "loss": 1.8506, + "step": 4248 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029090027091104373, + "loss": 1.8735, + "step": 4249 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002908960310411538, + "loss": 1.8324, + "step": 4250 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029089179021465764, + "loss": 1.8641, + "step": 4251 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029088754843158393, + "loss": 1.8438, + "step": 4252 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002908833056919615, + "loss": 1.8297, + "step": 4253 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002908790619958192, + "loss": 1.7755, + "step": 4254 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002908748173431858, + "loss": 1.8098, + "step": 4255 + }, + { + "epoch": 0.33, + "learning_rate": 0.0002908705717340902, + "loss": 1.7578, + "step": 4256 + }, + { + "epoch": 0.33, + "learning_rate": 0.00029086632516856105, + "loss": 1.8138, + "step": 4257 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002908620776466273, + "loss": 1.7897, + "step": 4258 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002908578291683178, + "loss": 1.8412, + "step": 4259 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002908535797336614, + "loss": 1.8229, + "step": 4260 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029084932934268694, + "loss": 1.7633, + "step": 4261 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002908450779954232, + "loss": 1.8273, + "step": 4262 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002908408256918992, + "loss": 1.7431, + "step": 4263 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029083657243214356, + "loss": 1.7959, + "step": 4264 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002908323182161855, + "loss": 1.8496, + "step": 4265 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029082806304405357, + "loss": 1.846, + "step": 4266 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002908238069157769, + "loss": 1.8265, + "step": 4267 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002908195498313842, + "loss": 1.8703, + "step": 4268 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002908152917909045, + "loss": 1.8498, + "step": 4269 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002908110327943667, + "loss": 1.9118, + "step": 4270 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029080677284179973, + "loss": 1.8045, + "step": 4271 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002908025119332324, + "loss": 1.8028, + "step": 4272 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029079825006869377, + "loss": 1.8086, + "step": 4273 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029079398724821267, + "loss": 1.8655, + "step": 4274 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029078972347181816, + "loss": 1.7985, + "step": 4275 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029078545873953903, + "loss": 1.7913, + "step": 4276 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029078119305140445, + "loss": 1.8178, + "step": 4277 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029077692640744313, + "loss": 1.8005, + "step": 4278 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029077265880768426, + "loss": 1.7737, + "step": 4279 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002907683902521567, + "loss": 1.8526, + "step": 4280 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029076412074088945, + "loss": 1.8613, + "step": 4281 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029075985027391147, + "loss": 1.8026, + "step": 4282 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029075557885125183, + "loss": 1.8271, + "step": 4283 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029075130647293943, + "loss": 1.9011, + "step": 4284 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029074703313900337, + "loss": 1.8414, + "step": 4285 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002907427588494726, + "loss": 1.8564, + "step": 4286 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002907384836043762, + "loss": 1.799, + "step": 4287 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002907342074037431, + "loss": 1.8486, + "step": 4288 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029072993024760246, + "loss": 1.7983, + "step": 4289 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029072565213598327, + "loss": 1.8479, + "step": 4290 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029072137306891454, + "loss": 1.7729, + "step": 4291 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029071709304642534, + "loss": 1.8505, + "step": 4292 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029071281206854467, + "loss": 1.8609, + "step": 4293 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029070853013530174, + "loss": 1.8116, + "step": 4294 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002907042472467255, + "loss": 1.788, + "step": 4295 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002906999634028451, + "loss": 1.8235, + "step": 4296 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029069567860368957, + "loss": 1.8611, + "step": 4297 + }, + { + "epoch": 0.34, + "learning_rate": 0.000290691392849288, + "loss": 1.8175, + "step": 4298 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029068710613966957, + "loss": 1.8355, + "step": 4299 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002906828184748633, + "loss": 1.8283, + "step": 4300 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002906785298548983, + "loss": 1.8826, + "step": 4301 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029067424027980375, + "loss": 1.8129, + "step": 4302 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029066994974960873, + "loss": 1.8166, + "step": 4303 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029066565826434235, + "loss": 1.8549, + "step": 4304 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002906613658240338, + "loss": 1.8174, + "step": 4305 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002906570724287122, + "loss": 1.8106, + "step": 4306 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029065277807840674, + "loss": 1.8004, + "step": 4307 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002906484827731465, + "loss": 1.8082, + "step": 4308 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002906441865129607, + "loss": 1.886, + "step": 4309 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002906398892978784, + "loss": 1.8306, + "step": 4310 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029063559112792897, + "loss": 1.8504, + "step": 4311 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002906312920031414, + "loss": 1.8163, + "step": 4312 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029062699192354503, + "loss": 1.8453, + "step": 4313 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029062269088916894, + "loss": 1.8644, + "step": 4314 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002906183889000424, + "loss": 1.8102, + "step": 4315 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029061408595619466, + "loss": 1.833, + "step": 4316 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002906097820576548, + "loss": 1.8353, + "step": 4317 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029060547720445216, + "loss": 1.8224, + "step": 4318 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029060117139661584, + "loss": 1.8289, + "step": 4319 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029059686463417525, + "loss": 1.8421, + "step": 4320 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029059255691715947, + "loss": 1.828, + "step": 4321 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002905882482455979, + "loss": 1.8768, + "step": 4322 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002905839386195196, + "loss": 1.801, + "step": 4323 + }, + { + "epoch": 0.34, + "learning_rate": 0.000290579628038954, + "loss": 1.875, + "step": 4324 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002905753165039303, + "loss": 1.7887, + "step": 4325 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029057100401447776, + "loss": 1.8601, + "step": 4326 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029056669057062566, + "loss": 1.8253, + "step": 4327 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029056237617240335, + "loss": 1.8401, + "step": 4328 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029055806081984006, + "loss": 1.8147, + "step": 4329 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002905537445129651, + "loss": 1.7512, + "step": 4330 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029054942725180774, + "loss": 1.8362, + "step": 4331 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002905451090363974, + "loss": 1.7945, + "step": 4332 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002905407898667633, + "loss": 1.8427, + "step": 4333 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002905364697429348, + "loss": 1.876, + "step": 4334 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002905321486649412, + "loss": 1.7892, + "step": 4335 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029052782663281185, + "loss": 1.8326, + "step": 4336 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029052350364657616, + "loss": 1.8425, + "step": 4337 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029051917970626337, + "loss": 1.8235, + "step": 4338 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002905148548119029, + "loss": 1.8193, + "step": 4339 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002905105289635242, + "loss": 1.8139, + "step": 4340 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029050620216115647, + "loss": 1.8453, + "step": 4341 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002905018744048291, + "loss": 1.8247, + "step": 4342 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002904975456945717, + "loss": 1.8265, + "step": 4343 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029049321603041335, + "loss": 1.8214, + "step": 4344 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002904888854123837, + "loss": 1.8205, + "step": 4345 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029048455384051195, + "loss": 1.8065, + "step": 4346 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002904802213148277, + "loss": 1.8372, + "step": 4347 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029047588783536024, + "loss": 1.8195, + "step": 4348 + }, + { + "epoch": 0.34, + "learning_rate": 0.000290471553402139, + "loss": 1.7637, + "step": 4349 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029046721801519345, + "loss": 1.7428, + "step": 4350 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029046288167455293, + "loss": 1.8191, + "step": 4351 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029045854438024705, + "loss": 1.8405, + "step": 4352 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002904542061323051, + "loss": 1.7779, + "step": 4353 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029044986693075664, + "loss": 1.7796, + "step": 4354 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002904455267756311, + "loss": 1.8294, + "step": 4355 + }, + { + "epoch": 0.34, + "learning_rate": 0.000290441185666958, + "loss": 1.8504, + "step": 4356 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029043684360476665, + "loss": 1.7972, + "step": 4357 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029043250058908665, + "loss": 1.8274, + "step": 4358 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029042815661994744, + "loss": 1.836, + "step": 4359 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029042381169737863, + "loss": 1.844, + "step": 4360 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029041946582140953, + "loss": 1.7835, + "step": 4361 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002904151189920698, + "loss": 1.8213, + "step": 4362 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002904107712093889, + "loss": 1.801, + "step": 4363 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002904064224733963, + "loss": 1.7486, + "step": 4364 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029040207278412165, + "loss": 1.7416, + "step": 4365 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002903977221415944, + "loss": 1.8044, + "step": 4366 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029039337054584407, + "loss": 1.877, + "step": 4367 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029038901799690025, + "loss": 1.7891, + "step": 4368 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002903846644947924, + "loss": 1.7928, + "step": 4369 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002903803100395502, + "loss": 1.8563, + "step": 4370 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029037595463120313, + "loss": 1.822, + "step": 4371 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029037159826978087, + "loss": 1.8729, + "step": 4372 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029036724095531287, + "loss": 1.8112, + "step": 4373 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029036288268782876, + "loss": 1.8138, + "step": 4374 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029035852346735817, + "loss": 1.8231, + "step": 4375 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002903541632939306, + "loss": 1.855, + "step": 4376 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002903498021675758, + "loss": 1.7896, + "step": 4377 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002903454400883232, + "loss": 1.8336, + "step": 4378 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002903410770562026, + "loss": 1.8509, + "step": 4379 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029033671307124347, + "loss": 1.8893, + "step": 4380 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002903323481334755, + "loss": 1.8421, + "step": 4381 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002903279822429284, + "loss": 1.7667, + "step": 4382 + }, + { + "epoch": 0.34, + "learning_rate": 0.0002903236153996317, + "loss": 1.8449, + "step": 4383 + }, + { + "epoch": 0.34, + "learning_rate": 0.00029031924760361506, + "loss": 1.8521, + "step": 4384 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002903148788549082, + "loss": 1.8097, + "step": 4385 + }, + { + "epoch": 0.35, + "learning_rate": 0.00029031050915354073, + "loss": 1.8334, + "step": 4386 + }, + { + "epoch": 0.35, + "learning_rate": 0.00029030613849954234, + "loss": 1.7868, + "step": 4387 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002903017668929427, + "loss": 1.7973, + "step": 4388 + }, + { + "epoch": 0.35, + "learning_rate": 0.00029029739433377144, + "loss": 1.7876, + "step": 4389 + }, + { + "epoch": 0.35, + "learning_rate": 0.00029029302082205833, + "loss": 1.8485, + "step": 4390 + }, + { + "epoch": 0.35, + "learning_rate": 0.000290288646357833, + "loss": 1.7981, + "step": 4391 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002902842709411252, + "loss": 1.8453, + "step": 4392 + }, + { + "epoch": 0.35, + "learning_rate": 0.00029027989457196463, + "loss": 1.7526, + "step": 4393 + }, + { + "epoch": 0.35, + "learning_rate": 0.00029027551725038103, + "loss": 1.8156, + "step": 4394 + }, + { + "epoch": 0.35, + "learning_rate": 0.000290271138976404, + "loss": 1.8532, + "step": 4395 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002902667597500634, + "loss": 1.8518, + "step": 4396 + }, + { + "epoch": 0.35, + "learning_rate": 0.00029026237957138887, + "loss": 1.8095, + "step": 4397 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002902579984404102, + "loss": 1.8127, + "step": 4398 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002902536163571571, + "loss": 1.9227, + "step": 4399 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002902492333216594, + "loss": 1.8515, + "step": 4400 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002902448493339467, + "loss": 1.8317, + "step": 4401 + }, + { + "epoch": 0.35, + "learning_rate": 0.00029024046439404897, + "loss": 1.8082, + "step": 4402 + }, + { + "epoch": 0.35, + "learning_rate": 0.00029023607850199584, + "loss": 1.8391, + "step": 4403 + }, + { + "epoch": 0.35, + "learning_rate": 0.00029023169165781713, + "loss": 1.7857, + "step": 4404 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002902273038615426, + "loss": 1.8148, + "step": 4405 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002902229151132021, + "loss": 1.8373, + "step": 4406 + }, + { + "epoch": 0.35, + "learning_rate": 0.00029021852541282535, + "loss": 1.7664, + "step": 4407 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002902141347604422, + "loss": 1.8428, + "step": 4408 + }, + { + "epoch": 0.35, + "learning_rate": 0.00029020974315608245, + "loss": 1.8387, + "step": 4409 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002902053505997759, + "loss": 1.798, + "step": 4410 + }, + { + "epoch": 0.35, + "learning_rate": 0.00029020095709155245, + "loss": 1.8626, + "step": 4411 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002901965626314418, + "loss": 1.8342, + "step": 4412 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002901921672194739, + "loss": 1.8125, + "step": 4413 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002901877708556785, + "loss": 1.8311, + "step": 4414 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002901833735400856, + "loss": 1.8272, + "step": 4415 + }, + { + "epoch": 0.35, + "learning_rate": 0.00029017897527272487, + "loss": 1.794, + "step": 4416 + }, + { + "epoch": 0.35, + "learning_rate": 0.00029017457605362627, + "loss": 1.8291, + "step": 4417 + }, + { + "epoch": 0.35, + "learning_rate": 0.00029017017588281967, + "loss": 1.7967, + "step": 4418 + }, + { + "epoch": 0.35, + "learning_rate": 0.00029016577476033493, + "loss": 1.802, + "step": 4419 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002901613726862019, + "loss": 1.7649, + "step": 4420 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002901569696604505, + "loss": 1.8514, + "step": 4421 + }, + { + "epoch": 0.35, + "learning_rate": 0.00029015256568311066, + "loss": 1.8003, + "step": 4422 + }, + { + "epoch": 0.35, + "learning_rate": 0.00029014816075421224, + "loss": 1.8737, + "step": 4423 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002901437548737851, + "loss": 1.8313, + "step": 4424 + }, + { + "epoch": 0.35, + "learning_rate": 0.00029013934804185924, + "loss": 1.8425, + "step": 4425 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002901349402584645, + "loss": 1.8685, + "step": 4426 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002901305315236309, + "loss": 1.7932, + "step": 4427 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002901261218373883, + "loss": 1.827, + "step": 4428 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002901217111997666, + "loss": 1.798, + "step": 4429 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002901172996107959, + "loss": 1.8167, + "step": 4430 + }, + { + "epoch": 0.35, + "learning_rate": 0.00029011288707050606, + "loss": 1.7968, + "step": 4431 + }, + { + "epoch": 0.35, + "learning_rate": 0.000290108473578927, + "loss": 1.8145, + "step": 4432 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002901040591360887, + "loss": 1.8101, + "step": 4433 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002900996437420212, + "loss": 1.816, + "step": 4434 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002900952273967544, + "loss": 1.8646, + "step": 4435 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002900908101003184, + "loss": 1.8392, + "step": 4436 + }, + { + "epoch": 0.35, + "learning_rate": 0.00029008639185274296, + "loss": 1.8601, + "step": 4437 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002900819726540583, + "loss": 1.8513, + "step": 4438 + }, + { + "epoch": 0.35, + "learning_rate": 0.00029007755250429434, + "loss": 1.8661, + "step": 4439 + }, + { + "epoch": 0.35, + "learning_rate": 0.00029007313140348115, + "loss": 1.7945, + "step": 4440 + }, + { + "epoch": 0.35, + "learning_rate": 0.00029006870935164864, + "loss": 1.8012, + "step": 4441 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002900642863488269, + "loss": 1.7002, + "step": 4442 + }, + { + "epoch": 0.35, + "learning_rate": 0.00029005986239504596, + "loss": 1.82, + "step": 4443 + }, + { + "epoch": 0.35, + "learning_rate": 0.00029005543749033584, + "loss": 1.8443, + "step": 4444 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002900510116347266, + "loss": 1.788, + "step": 4445 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002900465848282483, + "loss": 1.776, + "step": 4446 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002900421570709309, + "loss": 1.8162, + "step": 4447 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002900377283628046, + "loss": 1.8688, + "step": 4448 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002900332987038994, + "loss": 1.8331, + "step": 4449 + }, + { + "epoch": 0.35, + "learning_rate": 0.00029002886809424537, + "loss": 1.8305, + "step": 4450 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002900244365338725, + "loss": 1.8656, + "step": 4451 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002900200040228111, + "loss": 1.8262, + "step": 4452 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002900155705610911, + "loss": 1.8736, + "step": 4453 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002900111361487427, + "loss": 1.7943, + "step": 4454 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002900067007857959, + "loss": 1.8375, + "step": 4455 + }, + { + "epoch": 0.35, + "learning_rate": 0.00029000226447228086, + "loss": 1.8563, + "step": 4456 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002899978272082277, + "loss": 1.8595, + "step": 4457 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002899933889936666, + "loss": 1.8222, + "step": 4458 + }, + { + "epoch": 0.35, + "learning_rate": 0.00028998894982862756, + "loss": 1.8462, + "step": 4459 + }, + { + "epoch": 0.35, + "learning_rate": 0.00028998450971314086, + "loss": 1.7499, + "step": 4460 + }, + { + "epoch": 0.35, + "learning_rate": 0.00028998006864723656, + "loss": 1.8201, + "step": 4461 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002899756266309449, + "loss": 1.8202, + "step": 4462 + }, + { + "epoch": 0.35, + "learning_rate": 0.00028997118366429594, + "loss": 1.8549, + "step": 4463 + }, + { + "epoch": 0.35, + "learning_rate": 0.00028996673974731983, + "loss": 1.8552, + "step": 4464 + }, + { + "epoch": 0.35, + "learning_rate": 0.00028996229488004687, + "loss": 1.8207, + "step": 4465 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002899578490625072, + "loss": 1.8095, + "step": 4466 + }, + { + "epoch": 0.35, + "learning_rate": 0.00028995340229473086, + "loss": 1.7914, + "step": 4467 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002899489545767482, + "loss": 1.8257, + "step": 4468 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002899445059085894, + "loss": 1.8829, + "step": 4469 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002899400562902846, + "loss": 1.8567, + "step": 4470 + }, + { + "epoch": 0.35, + "learning_rate": 0.00028993560572186406, + "loss": 1.8018, + "step": 4471 + }, + { + "epoch": 0.35, + "learning_rate": 0.000289931154203358, + "loss": 1.8089, + "step": 4472 + }, + { + "epoch": 0.35, + "learning_rate": 0.00028992670173479655, + "loss": 1.7933, + "step": 4473 + }, + { + "epoch": 0.35, + "learning_rate": 0.00028992224831621006, + "loss": 1.8504, + "step": 4474 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002899177939476287, + "loss": 1.8004, + "step": 4475 + }, + { + "epoch": 0.35, + "learning_rate": 0.00028991333862908277, + "loss": 1.9034, + "step": 4476 + }, + { + "epoch": 0.35, + "learning_rate": 0.00028990888236060246, + "loss": 1.7895, + "step": 4477 + }, + { + "epoch": 0.35, + "learning_rate": 0.00028990442514221804, + "loss": 1.8233, + "step": 4478 + }, + { + "epoch": 0.35, + "learning_rate": 0.00028989996697395976, + "loss": 1.827, + "step": 4479 + }, + { + "epoch": 0.35, + "learning_rate": 0.000289895507855858, + "loss": 1.8022, + "step": 4480 + }, + { + "epoch": 0.35, + "learning_rate": 0.00028989104778794284, + "loss": 1.7986, + "step": 4481 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002898865867702447, + "loss": 1.8654, + "step": 4482 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002898821248027938, + "loss": 1.8231, + "step": 4483 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002898776618856205, + "loss": 1.8362, + "step": 4484 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002898731980187551, + "loss": 1.7776, + "step": 4485 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002898687332022278, + "loss": 1.823, + "step": 4486 + }, + { + "epoch": 0.35, + "learning_rate": 0.00028986426743606903, + "loss": 1.7367, + "step": 4487 + }, + { + "epoch": 0.35, + "learning_rate": 0.00028985980072030907, + "loss": 1.8646, + "step": 4488 + }, + { + "epoch": 0.35, + "learning_rate": 0.00028985533305497823, + "loss": 1.7639, + "step": 4489 + }, + { + "epoch": 0.35, + "learning_rate": 0.00028985086444010687, + "loss": 1.7981, + "step": 4490 + }, + { + "epoch": 0.35, + "learning_rate": 0.00028984639487572534, + "loss": 1.8374, + "step": 4491 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002898419243618639, + "loss": 1.7646, + "step": 4492 + }, + { + "epoch": 0.35, + "learning_rate": 0.000289837452898553, + "loss": 1.8428, + "step": 4493 + }, + { + "epoch": 0.35, + "learning_rate": 0.00028983298048582297, + "loss": 1.8567, + "step": 4494 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002898285071237042, + "loss": 1.8472, + "step": 4495 + }, + { + "epoch": 0.35, + "learning_rate": 0.00028982403281222694, + "loss": 1.7847, + "step": 4496 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002898195575514217, + "loss": 1.816, + "step": 4497 + }, + { + "epoch": 0.35, + "learning_rate": 0.00028981508134131884, + "loss": 1.8446, + "step": 4498 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002898106041819487, + "loss": 1.8945, + "step": 4499 + }, + { + "epoch": 0.35, + "learning_rate": 0.00028980612607334174, + "loss": 1.7909, + "step": 4500 + }, + { + "epoch": 0.35, + "learning_rate": 0.00028980164701552835, + "loss": 1.8029, + "step": 4501 + }, + { + "epoch": 0.35, + "learning_rate": 0.00028979716700853895, + "loss": 1.8006, + "step": 4502 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002897926860524039, + "loss": 1.8389, + "step": 4503 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002897882041471536, + "loss": 1.7869, + "step": 4504 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002897837212928186, + "loss": 1.7976, + "step": 4505 + }, + { + "epoch": 0.35, + "learning_rate": 0.00028977923748942926, + "loss": 1.8237, + "step": 4506 + }, + { + "epoch": 0.35, + "learning_rate": 0.000289774752737016, + "loss": 1.8069, + "step": 4507 + }, + { + "epoch": 0.35, + "learning_rate": 0.00028977026703560935, + "loss": 1.8889, + "step": 4508 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002897657803852397, + "loss": 1.818, + "step": 4509 + }, + { + "epoch": 0.35, + "learning_rate": 0.00028976129278593756, + "loss": 1.8583, + "step": 4510 + }, + { + "epoch": 0.35, + "learning_rate": 0.0002897568042377333, + "loss": 1.8407, + "step": 4511 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028975231474065753, + "loss": 1.8175, + "step": 4512 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002897478242947406, + "loss": 1.836, + "step": 4513 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002897433329000131, + "loss": 1.8299, + "step": 4514 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028973884055650547, + "loss": 1.8483, + "step": 4515 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028973434726424827, + "loss": 1.7954, + "step": 4516 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028972985302327194, + "loss": 1.8378, + "step": 4517 + }, + { + "epoch": 0.36, + "learning_rate": 0.000289725357833607, + "loss": 1.864, + "step": 4518 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028972086169528396, + "loss": 1.7594, + "step": 4519 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028971636460833346, + "loss": 1.8135, + "step": 4520 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002897118665727859, + "loss": 1.8032, + "step": 4521 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028970736758867185, + "loss": 1.8036, + "step": 4522 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028970286765602187, + "loss": 1.8387, + "step": 4523 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002896983667748665, + "loss": 1.8349, + "step": 4524 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028969386494523636, + "loss": 1.8156, + "step": 4525 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028968936216716197, + "loss": 1.82, + "step": 4526 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028968485844067386, + "loss": 1.7895, + "step": 4527 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002896803537658027, + "loss": 1.829, + "step": 4528 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028967584814257894, + "loss": 1.8054, + "step": 4529 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002896713415710333, + "loss": 1.8469, + "step": 4530 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028966683405119633, + "loss": 1.8108, + "step": 4531 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002896623255830986, + "loss": 1.861, + "step": 4532 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002896578161667708, + "loss": 1.7818, + "step": 4533 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028965330580224346, + "loss": 1.8417, + "step": 4534 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002896487944895473, + "loss": 1.8002, + "step": 4535 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028964428222871277, + "loss": 1.772, + "step": 4536 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002896397690197707, + "loss": 1.8559, + "step": 4537 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028963525486275167, + "loss": 1.8131, + "step": 4538 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002896307397576863, + "loss": 1.8402, + "step": 4539 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028962622370460526, + "loss": 1.8268, + "step": 4540 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002896217067035392, + "loss": 1.7969, + "step": 4541 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028961718875451884, + "loss": 1.7924, + "step": 4542 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028961266985757475, + "loss": 1.806, + "step": 4543 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028960815001273776, + "loss": 1.7866, + "step": 4544 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002896036292200384, + "loss": 1.7923, + "step": 4545 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002895991074795075, + "loss": 1.8208, + "step": 4546 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002895945847911756, + "loss": 1.815, + "step": 4547 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028959006115507357, + "loss": 1.8196, + "step": 4548 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002895855365712321, + "loss": 1.7712, + "step": 4549 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028958101103968183, + "loss": 1.7899, + "step": 4550 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028957648456045355, + "loss": 1.7979, + "step": 4551 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002895719571335779, + "loss": 1.7899, + "step": 4552 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028956742875908565, + "loss": 1.8153, + "step": 4553 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028956289943700766, + "loss": 1.8208, + "step": 4554 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002895583691673746, + "loss": 1.814, + "step": 4555 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002895538379502172, + "loss": 1.8142, + "step": 4556 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028954930578556625, + "loss": 1.8736, + "step": 4557 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002895447726734526, + "loss": 1.8615, + "step": 4558 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002895402386139068, + "loss": 1.7768, + "step": 4559 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002895357036069599, + "loss": 1.7577, + "step": 4560 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028953116765264257, + "loss": 1.7988, + "step": 4561 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002895266307509856, + "loss": 1.8349, + "step": 4562 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028952209290201975, + "loss": 1.8125, + "step": 4563 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028951755410577595, + "loss": 1.8001, + "step": 4564 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028951301436228494, + "loss": 1.794, + "step": 4565 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002895084736715775, + "loss": 1.8407, + "step": 4566 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002895039320336846, + "loss": 1.9048, + "step": 4567 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002894993894486369, + "loss": 1.8221, + "step": 4568 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028949484591646535, + "loss": 1.8239, + "step": 4569 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002894903014372008, + "loss": 1.8562, + "step": 4570 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028948575601087405, + "loss": 1.8169, + "step": 4571 + }, + { + "epoch": 0.36, + "learning_rate": 0.000289481209637516, + "loss": 1.7939, + "step": 4572 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028947666231715754, + "loss": 1.8155, + "step": 4573 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028947211404982946, + "loss": 1.8777, + "step": 4574 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002894675648355628, + "loss": 1.8058, + "step": 4575 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028946301467438817, + "loss": 1.8301, + "step": 4576 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028945846356633677, + "loss": 1.7487, + "step": 4577 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002894539115114393, + "loss": 1.7915, + "step": 4578 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002894493585097268, + "loss": 1.8113, + "step": 4579 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028944480456123, + "loss": 1.7863, + "step": 4580 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028944024966598, + "loss": 1.8151, + "step": 4581 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028943569382400763, + "loss": 1.8631, + "step": 4582 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028943113703534383, + "loss": 1.8099, + "step": 4583 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002894265793000196, + "loss": 1.7975, + "step": 4584 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002894220206180658, + "loss": 1.8831, + "step": 4585 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002894174609895135, + "loss": 1.8068, + "step": 4586 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028941290041439345, + "loss": 1.8035, + "step": 4587 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002894083388927368, + "loss": 1.8669, + "step": 4588 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028940377642457446, + "loss": 1.6967, + "step": 4589 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002893992130099374, + "loss": 1.8192, + "step": 4590 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002893946486488567, + "loss": 1.8273, + "step": 4591 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028939008334136315, + "loss": 1.7473, + "step": 4592 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028938551708748787, + "loss": 1.7773, + "step": 4593 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028938094988726184, + "loss": 1.7582, + "step": 4594 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002893763817407161, + "loss": 1.8074, + "step": 4595 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002893718126478817, + "loss": 1.815, + "step": 4596 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002893672426087895, + "loss": 1.8514, + "step": 4597 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002893626716234707, + "loss": 1.7866, + "step": 4598 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002893580996919562, + "loss": 1.8213, + "step": 4599 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002893535268142772, + "loss": 1.8195, + "step": 4600 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002893489529904646, + "loss": 1.7792, + "step": 4601 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002893443782205495, + "loss": 1.7986, + "step": 4602 + }, + { + "epoch": 0.36, + "learning_rate": 0.000289339802504563, + "loss": 1.7646, + "step": 4603 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002893352258425361, + "loss": 1.8399, + "step": 4604 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028933064823449996, + "loss": 1.7845, + "step": 4605 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028932606968048557, + "loss": 1.7479, + "step": 4606 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028932149018052404, + "loss": 1.8055, + "step": 4607 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002893169097346465, + "loss": 1.8764, + "step": 4608 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028931232834288403, + "loss": 1.7993, + "step": 4609 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028930774600526775, + "loss": 1.8492, + "step": 4610 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002893031627218287, + "loss": 1.8131, + "step": 4611 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028929857849259807, + "loss": 1.8208, + "step": 4612 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002892939933176069, + "loss": 1.7508, + "step": 4613 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002892894071968865, + "loss": 1.8266, + "step": 4614 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028928482013046783, + "loss": 1.7404, + "step": 4615 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028928023211838213, + "loss": 1.8314, + "step": 4616 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002892756431606605, + "loss": 1.8392, + "step": 4617 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028927105325733405, + "loss": 1.7772, + "step": 4618 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028926646240843407, + "loss": 1.8255, + "step": 4619 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002892618706139917, + "loss": 1.8164, + "step": 4620 + }, + { + "epoch": 0.36, + "learning_rate": 0.000289257277874038, + "loss": 1.7905, + "step": 4621 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028925268418860425, + "loss": 1.8816, + "step": 4622 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002892480895577216, + "loss": 1.8072, + "step": 4623 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002892434939814213, + "loss": 1.833, + "step": 4624 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028923889745973455, + "loss": 1.8335, + "step": 4625 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002892342999926925, + "loss": 1.8101, + "step": 4626 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028922970158032634, + "loss": 1.7816, + "step": 4627 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002892251022226674, + "loss": 1.8268, + "step": 4628 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002892205019197468, + "loss": 1.8517, + "step": 4629 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028921590067159585, + "loss": 1.7647, + "step": 4630 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028921129847824575, + "loss": 1.7684, + "step": 4631 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002892066953397277, + "loss": 1.8452, + "step": 4632 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028920209125607313, + "loss": 1.7859, + "step": 4633 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028919748622731307, + "loss": 1.8552, + "step": 4634 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028919288025347896, + "loss": 1.8553, + "step": 4635 + }, + { + "epoch": 0.36, + "learning_rate": 0.000289188273334602, + "loss": 1.7795, + "step": 4636 + }, + { + "epoch": 0.36, + "learning_rate": 0.00028918366547071346, + "loss": 1.8134, + "step": 4637 + }, + { + "epoch": 0.36, + "learning_rate": 0.0002891790566618446, + "loss": 1.7561, + "step": 4638 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028917444690802687, + "loss": 1.8189, + "step": 4639 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028916983620929135, + "loss": 1.7918, + "step": 4640 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028916522456566947, + "loss": 1.826, + "step": 4641 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002891606119771925, + "loss": 1.8461, + "step": 4642 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002891559984438918, + "loss": 1.8024, + "step": 4643 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002891513839657986, + "loss": 1.8398, + "step": 4644 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002891467685429443, + "loss": 1.8423, + "step": 4645 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002891421521753603, + "loss": 1.8324, + "step": 4646 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028913753486307784, + "loss": 1.7454, + "step": 4647 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028913291660612823, + "loss": 1.7958, + "step": 4648 + }, + { + "epoch": 0.37, + "learning_rate": 0.000289128297404543, + "loss": 1.7177, + "step": 4649 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028912367725835337, + "loss": 1.841, + "step": 4650 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028911905616759077, + "loss": 1.8075, + "step": 4651 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028911443413228647, + "loss": 1.829, + "step": 4652 + }, + { + "epoch": 0.37, + "learning_rate": 0.000289109811152472, + "loss": 1.8292, + "step": 4653 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028910518722817866, + "loss": 1.7714, + "step": 4654 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028910056235943786, + "loss": 1.8173, + "step": 4655 + }, + { + "epoch": 0.37, + "learning_rate": 0.000289095936546281, + "loss": 1.7921, + "step": 4656 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028909130978873953, + "loss": 1.8369, + "step": 4657 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028908668208684477, + "loss": 1.8286, + "step": 4658 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028908205344062825, + "loss": 1.8703, + "step": 4659 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002890774238501213, + "loss": 1.7483, + "step": 4660 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002890727933153554, + "loss": 1.772, + "step": 4661 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028906816183636193, + "loss": 1.7914, + "step": 4662 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002890635294131725, + "loss": 1.8308, + "step": 4663 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028905889604581835, + "loss": 1.8577, + "step": 4664 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002890542617343311, + "loss": 1.7471, + "step": 4665 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002890496264787421, + "loss": 1.8125, + "step": 4666 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002890449902790829, + "loss": 1.812, + "step": 4667 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028904035313538493, + "loss": 1.826, + "step": 4668 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028903571504767964, + "loss": 1.7648, + "step": 4669 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002890310760159986, + "loss": 1.8471, + "step": 4670 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028902643604037336, + "loss": 1.7101, + "step": 4671 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028902179512083526, + "loss": 1.7512, + "step": 4672 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002890171532574159, + "loss": 1.7263, + "step": 4673 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028901251045014684, + "loss": 1.7857, + "step": 4674 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002890078666990595, + "loss": 1.7938, + "step": 4675 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028900322200418546, + "loss": 1.7827, + "step": 4676 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028899857636555625, + "loss": 1.7885, + "step": 4677 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002889939297832034, + "loss": 1.7916, + "step": 4678 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002889892822571585, + "loss": 1.8203, + "step": 4679 + }, + { + "epoch": 0.37, + "learning_rate": 0.000288984633787453, + "loss": 1.7507, + "step": 4680 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028897998437411865, + "loss": 1.8344, + "step": 4681 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002889753340171868, + "loss": 1.822, + "step": 4682 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028897068271668916, + "loss": 1.7815, + "step": 4683 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002889660304726573, + "loss": 1.7893, + "step": 4684 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002889613772851228, + "loss": 1.7628, + "step": 4685 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002889567231541172, + "loss": 1.8182, + "step": 4686 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002889520680796721, + "loss": 1.8701, + "step": 4687 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002889474120618192, + "loss": 1.8303, + "step": 4688 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028894275510059, + "loss": 1.8543, + "step": 4689 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002889380971960162, + "loss": 1.8163, + "step": 4690 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028893343834812934, + "loss": 1.7743, + "step": 4691 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002889287785569611, + "loss": 1.712, + "step": 4692 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002889241178225432, + "loss": 1.8191, + "step": 4693 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002889194561449072, + "loss": 1.7361, + "step": 4694 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028891479352408474, + "loss": 1.8117, + "step": 4695 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002889101299601075, + "loss": 1.8042, + "step": 4696 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028890546545300703, + "loss": 1.7966, + "step": 4697 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002889008000028152, + "loss": 1.818, + "step": 4698 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002888961336095636, + "loss": 1.7468, + "step": 4699 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028889146627328387, + "loss": 1.7971, + "step": 4700 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002888867979940077, + "loss": 1.7627, + "step": 4701 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028888212877176687, + "loss": 1.842, + "step": 4702 + }, + { + "epoch": 0.37, + "learning_rate": 0.000288877458606593, + "loss": 1.8189, + "step": 4703 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028887278749851786, + "loss": 1.7951, + "step": 4704 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028886811544757306, + "loss": 1.8356, + "step": 4705 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028886344245379045, + "loss": 1.8014, + "step": 4706 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028885876851720166, + "loss": 1.7681, + "step": 4707 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002888540936378385, + "loss": 1.7059, + "step": 4708 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002888494178157327, + "loss": 1.7773, + "step": 4709 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028884474105091585, + "loss": 1.8534, + "step": 4710 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002888400633434199, + "loss": 1.8177, + "step": 4711 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028883538469327656, + "loss": 1.8232, + "step": 4712 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002888307051005176, + "loss": 1.7937, + "step": 4713 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028882602456517466, + "loss": 1.7905, + "step": 4714 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028882134308727976, + "loss": 1.7682, + "step": 4715 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028881666066686443, + "loss": 1.8225, + "step": 4716 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002888119773039606, + "loss": 1.7569, + "step": 4717 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028880729299860013, + "loss": 1.8131, + "step": 4718 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028880260775081463, + "loss": 1.8011, + "step": 4719 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002887979215606361, + "loss": 1.7736, + "step": 4720 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002887932344280962, + "loss": 1.8222, + "step": 4721 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028878854635322693, + "loss": 1.7705, + "step": 4722 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028878385733606, + "loss": 1.8099, + "step": 4723 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002887791673766272, + "loss": 1.7923, + "step": 4724 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028877447647496045, + "loss": 1.7516, + "step": 4725 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002887697846310916, + "loss": 1.7975, + "step": 4726 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002887650918450525, + "loss": 1.8161, + "step": 4727 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028876039811687507, + "loss": 1.7986, + "step": 4728 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028875570344659104, + "loss": 1.8068, + "step": 4729 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028875100783423235, + "loss": 1.8103, + "step": 4730 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002887463112798309, + "loss": 1.7722, + "step": 4731 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002887416137834186, + "loss": 1.7677, + "step": 4732 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028873691534502725, + "loss": 1.8155, + "step": 4733 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028873221596468877, + "loss": 1.7977, + "step": 4734 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002887275156424352, + "loss": 1.792, + "step": 4735 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002887228143782983, + "loss": 1.7955, + "step": 4736 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028871811217231005, + "loss": 1.7112, + "step": 4737 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002887134090245024, + "loss": 1.8203, + "step": 4738 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002887087049349072, + "loss": 1.806, + "step": 4739 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028870399990355646, + "loss": 1.8295, + "step": 4740 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002886992939304821, + "loss": 1.7846, + "step": 4741 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002886945870157161, + "loss": 1.8022, + "step": 4742 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028868987915929036, + "loss": 1.8358, + "step": 4743 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002886851703612369, + "loss": 1.7986, + "step": 4744 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002886804606215877, + "loss": 1.7864, + "step": 4745 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002886757499403747, + "loss": 1.7876, + "step": 4746 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002886710383176298, + "loss": 1.8322, + "step": 4747 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028866632575338507, + "loss": 1.7673, + "step": 4748 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002886616122476726, + "loss": 1.8106, + "step": 4749 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002886568978005243, + "loss": 1.8079, + "step": 4750 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002886521824119721, + "loss": 1.7671, + "step": 4751 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002886474660820482, + "loss": 1.8391, + "step": 4752 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002886427488107844, + "loss": 1.8542, + "step": 4753 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002886380305982129, + "loss": 1.804, + "step": 4754 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002886333114443657, + "loss": 1.7814, + "step": 4755 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002886285913492748, + "loss": 1.7655, + "step": 4756 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028862387031297225, + "loss": 1.7695, + "step": 4757 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028861914833549015, + "loss": 1.8054, + "step": 4758 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002886144254168605, + "loss": 1.7923, + "step": 4759 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002886097015571154, + "loss": 1.7651, + "step": 4760 + }, + { + "epoch": 0.37, + "learning_rate": 0.000288604976756287, + "loss": 1.8352, + "step": 4761 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002886002510144072, + "loss": 1.8203, + "step": 4762 + }, + { + "epoch": 0.37, + "learning_rate": 0.0002885955243315082, + "loss": 1.8422, + "step": 4763 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028859079670762205, + "loss": 1.8041, + "step": 4764 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028858606814278093, + "loss": 1.7881, + "step": 4765 + }, + { + "epoch": 0.37, + "learning_rate": 0.00028858133863701686, + "loss": 1.7745, + "step": 4766 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002885766081903619, + "loss": 1.7966, + "step": 4767 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028857187680284837, + "loss": 1.8001, + "step": 4768 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028856714447450825, + "loss": 1.7806, + "step": 4769 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028856241120537365, + "loss": 1.8594, + "step": 4770 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002885576769954767, + "loss": 1.761, + "step": 4771 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028855294184484964, + "loss": 1.77, + "step": 4772 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002885482057535246, + "loss": 1.7815, + "step": 4773 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028854346872153364, + "loss": 1.7617, + "step": 4774 + }, + { + "epoch": 0.38, + "learning_rate": 0.000288538730748909, + "loss": 1.8032, + "step": 4775 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002885339918356828, + "loss": 1.801, + "step": 4776 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002885292519818873, + "loss": 1.8203, + "step": 4777 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028852451118755454, + "loss": 1.7875, + "step": 4778 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002885197694527169, + "loss": 1.8158, + "step": 4779 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002885150267774064, + "loss": 1.8066, + "step": 4780 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002885102831616553, + "loss": 1.8133, + "step": 4781 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028850553860549586, + "loss": 1.7745, + "step": 4782 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002885007931089602, + "loss": 1.7416, + "step": 4783 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002884960466720806, + "loss": 1.8859, + "step": 4784 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002884912992948893, + "loss": 1.861, + "step": 4785 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002884865509774185, + "loss": 1.7552, + "step": 4786 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028848180171970044, + "loss": 1.7779, + "step": 4787 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028847705152176736, + "loss": 1.778, + "step": 4788 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002884723003836515, + "loss": 1.7081, + "step": 4789 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028846754830538513, + "loss": 1.7803, + "step": 4790 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002884627952870006, + "loss": 1.8038, + "step": 4791 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028845804132853, + "loss": 1.7678, + "step": 4792 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028845328643000573, + "loss": 1.7839, + "step": 4793 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028844853059146005, + "loss": 1.8119, + "step": 4794 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002884437738129253, + "loss": 1.8146, + "step": 4795 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002884390160944337, + "loss": 1.7748, + "step": 4796 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028843425743601755, + "loss": 1.755, + "step": 4797 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002884294978377092, + "loss": 1.7539, + "step": 4798 + }, + { + "epoch": 0.38, + "learning_rate": 0.000288424737299541, + "loss": 1.7808, + "step": 4799 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028841997582154514, + "loss": 1.7585, + "step": 4800 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028841521340375407, + "loss": 1.8091, + "step": 4801 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002884104500462001, + "loss": 1.8117, + "step": 4802 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002884056857489155, + "loss": 1.777, + "step": 4803 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028840092051193275, + "loss": 1.8239, + "step": 4804 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028839615433528404, + "loss": 1.8121, + "step": 4805 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028839138721900186, + "loss": 1.816, + "step": 4806 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002883866191631185, + "loss": 1.7842, + "step": 4807 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028838185016766645, + "loss": 1.769, + "step": 4808 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028837708023267796, + "loss": 1.7576, + "step": 4809 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028837230935818545, + "loss": 1.7769, + "step": 4810 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002883675375442213, + "loss": 1.7792, + "step": 4811 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028836276479081793, + "loss": 1.8199, + "step": 4812 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028835799109800774, + "loss": 1.7742, + "step": 4813 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002883532164658232, + "loss": 1.7833, + "step": 4814 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028834844089429667, + "loss": 1.7666, + "step": 4815 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002883436643834605, + "loss": 1.7969, + "step": 4816 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002883388869333472, + "loss": 1.8637, + "step": 4817 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028833410854398923, + "loss": 1.7467, + "step": 4818 + }, + { + "epoch": 0.38, + "learning_rate": 0.000288329329215419, + "loss": 1.8169, + "step": 4819 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028832454894766896, + "loss": 1.7436, + "step": 4820 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028831976774077155, + "loss": 1.7133, + "step": 4821 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002883149855947593, + "loss": 1.7767, + "step": 4822 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002883102025096646, + "loss": 1.7656, + "step": 4823 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028830541848551993, + "loss": 1.7672, + "step": 4824 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002883006335223578, + "loss": 1.7811, + "step": 4825 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028829584762021066, + "loss": 1.7971, + "step": 4826 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002882910607791111, + "loss": 1.7755, + "step": 4827 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002882862729990915, + "loss": 1.7661, + "step": 4828 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002882814842801844, + "loss": 1.8277, + "step": 4829 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002882766946224224, + "loss": 1.775, + "step": 4830 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002882719040258379, + "loss": 1.8319, + "step": 4831 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028826711249046354, + "loss": 1.8119, + "step": 4832 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002882623200163317, + "loss": 1.8511, + "step": 4833 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028825752660347506, + "loss": 1.7976, + "step": 4834 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002882527322519261, + "loss": 1.8648, + "step": 4835 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002882479369617174, + "loss": 1.7874, + "step": 4836 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002882431407328815, + "loss": 1.8605, + "step": 4837 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028823834356545095, + "loss": 1.7908, + "step": 4838 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002882335454594583, + "loss": 1.7928, + "step": 4839 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028822874641493617, + "loss": 1.8122, + "step": 4840 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002882239464319172, + "loss": 1.7979, + "step": 4841 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002882191455104338, + "loss": 1.7467, + "step": 4842 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002882143436505188, + "loss": 1.7766, + "step": 4843 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028820954085220465, + "loss": 1.7871, + "step": 4844 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002882047371155239, + "loss": 1.8, + "step": 4845 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028819993244050935, + "loss": 1.8039, + "step": 4846 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002881951268271935, + "loss": 1.75, + "step": 4847 + }, + { + "epoch": 0.38, + "learning_rate": 0.000288190320275609, + "loss": 1.7957, + "step": 4848 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028818551278578843, + "loss": 1.7825, + "step": 4849 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002881807043577645, + "loss": 1.8029, + "step": 4850 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002881758949915699, + "loss": 1.8182, + "step": 4851 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002881710846872372, + "loss": 1.8009, + "step": 4852 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028816627344479905, + "loss": 1.8021, + "step": 4853 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002881614612642882, + "loss": 1.8097, + "step": 4854 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028815664814573725, + "loss": 1.7896, + "step": 4855 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028815183408917886, + "loss": 1.8043, + "step": 4856 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028814701909464583, + "loss": 1.7569, + "step": 4857 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028814220316217076, + "loss": 1.7645, + "step": 4858 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002881373862917863, + "loss": 1.8029, + "step": 4859 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002881325684835253, + "loss": 1.7755, + "step": 4860 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028812774973742037, + "loss": 1.7902, + "step": 4861 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002881229300535042, + "loss": 1.8395, + "step": 4862 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028811810943180956, + "loss": 1.7544, + "step": 4863 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002881132878723692, + "loss": 1.7848, + "step": 4864 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002881084653752158, + "loss": 1.8153, + "step": 4865 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002881036419403822, + "loss": 1.8466, + "step": 4866 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028809881756790105, + "loss": 1.8011, + "step": 4867 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028809399225780517, + "loss": 1.7682, + "step": 4868 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028808916601012725, + "loss": 1.7618, + "step": 4869 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002880843388249001, + "loss": 1.8203, + "step": 4870 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028807951070215646, + "loss": 1.7621, + "step": 4871 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028807468164192924, + "loss": 1.8405, + "step": 4872 + }, + { + "epoch": 0.38, + "learning_rate": 0.000288069851644251, + "loss": 1.7901, + "step": 4873 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002880650207091547, + "loss": 1.7941, + "step": 4874 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028806018883667316, + "loss": 1.8079, + "step": 4875 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002880553560268391, + "loss": 1.8097, + "step": 4876 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002880505222796853, + "loss": 1.8092, + "step": 4877 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028804568759524475, + "loss": 1.8661, + "step": 4878 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028804085197355007, + "loss": 1.7284, + "step": 4879 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028803601541463423, + "loss": 1.7954, + "step": 4880 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028803117791852996, + "loss": 1.8159, + "step": 4881 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002880263394852702, + "loss": 1.8074, + "step": 4882 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002880215001148878, + "loss": 1.7905, + "step": 4883 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002880166598074155, + "loss": 1.7942, + "step": 4884 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028801181856288633, + "loss": 1.8394, + "step": 4885 + }, + { + "epoch": 0.38, + "learning_rate": 0.000288006976381333, + "loss": 1.7735, + "step": 4886 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028800213326278854, + "loss": 1.7868, + "step": 4887 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002879972892072857, + "loss": 1.773, + "step": 4888 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002879924442148574, + "loss": 1.8594, + "step": 4889 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028798759828553653, + "loss": 1.8087, + "step": 4890 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002879827514193561, + "loss": 1.7892, + "step": 4891 + }, + { + "epoch": 0.38, + "learning_rate": 0.00028797790361634887, + "loss": 1.8169, + "step": 4892 + }, + { + "epoch": 0.38, + "learning_rate": 0.0002879730548765478, + "loss": 1.8144, + "step": 4893 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002879682051999859, + "loss": 1.8025, + "step": 4894 + }, + { + "epoch": 0.39, + "learning_rate": 0.000287963354586696, + "loss": 1.7879, + "step": 4895 + }, + { + "epoch": 0.39, + "learning_rate": 0.000287958503036711, + "loss": 1.7033, + "step": 4896 + }, + { + "epoch": 0.39, + "learning_rate": 0.000287953650550064, + "loss": 1.7853, + "step": 4897 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002879487971267878, + "loss": 1.8166, + "step": 4898 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028794394276691535, + "loss": 1.8124, + "step": 4899 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028793908747047967, + "loss": 1.7731, + "step": 4900 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028793423123751373, + "loss": 1.8326, + "step": 4901 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002879293740680505, + "loss": 1.7531, + "step": 4902 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002879245159621229, + "loss": 1.7644, + "step": 4903 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028791965691976395, + "loss": 1.8506, + "step": 4904 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028791479694100663, + "loss": 1.8337, + "step": 4905 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028790993602588396, + "loss": 1.8197, + "step": 4906 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028790507417442894, + "loss": 1.7607, + "step": 4907 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028790021138667455, + "loss": 1.8464, + "step": 4908 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028789534766265385, + "loss": 1.7903, + "step": 4909 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002878904830023998, + "loss": 1.7956, + "step": 4910 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028788561740594553, + "loss": 1.8348, + "step": 4911 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028788075087332393, + "loss": 1.7572, + "step": 4912 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028787588340456813, + "loss": 1.8169, + "step": 4913 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002878710149997112, + "loss": 1.7958, + "step": 4914 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002878661456587862, + "loss": 1.7938, + "step": 4915 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028786127538182605, + "loss": 1.8069, + "step": 4916 + }, + { + "epoch": 0.39, + "learning_rate": 0.000287856404168864, + "loss": 1.7881, + "step": 4917 + }, + { + "epoch": 0.39, + "learning_rate": 0.000287851532019933, + "loss": 1.8497, + "step": 4918 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002878466589350662, + "loss": 1.8019, + "step": 4919 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002878417849142966, + "loss": 1.7965, + "step": 4920 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028783690995765743, + "loss": 1.8031, + "step": 4921 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002878320340651817, + "loss": 1.7523, + "step": 4922 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002878271572369025, + "loss": 1.7838, + "step": 4923 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028782227947285287, + "loss": 1.821, + "step": 4924 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002878174007730661, + "loss": 1.8081, + "step": 4925 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028781252113757523, + "loss": 1.8133, + "step": 4926 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002878076405664134, + "loss": 1.8079, + "step": 4927 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028780275905961375, + "loss": 1.7654, + "step": 4928 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002877978766172094, + "loss": 1.7837, + "step": 4929 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028779299323923347, + "loss": 1.7296, + "step": 4930 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002877881089257192, + "loss": 1.7745, + "step": 4931 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002877832236766997, + "loss": 1.7196, + "step": 4932 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028777833749220815, + "loss": 1.7784, + "step": 4933 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002877734503722777, + "loss": 1.7748, + "step": 4934 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002877685623169416, + "loss": 1.746, + "step": 4935 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002877636733262329, + "loss": 1.7767, + "step": 4936 + }, + { + "epoch": 0.39, + "learning_rate": 0.000287758783400185, + "loss": 1.7796, + "step": 4937 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002877538925388309, + "loss": 1.7607, + "step": 4938 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002877490007422039, + "loss": 1.7866, + "step": 4939 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002877441080103372, + "loss": 1.7853, + "step": 4940 + }, + { + "epoch": 0.39, + "learning_rate": 0.000287739214343264, + "loss": 1.784, + "step": 4941 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002877343197410176, + "loss": 1.7738, + "step": 4942 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002877294242036311, + "loss": 1.7849, + "step": 4943 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002877245277311379, + "loss": 1.742, + "step": 4944 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028771963032357114, + "loss": 1.7943, + "step": 4945 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028771473198096407, + "loss": 1.8224, + "step": 4946 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028770983270335, + "loss": 1.8021, + "step": 4947 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028770493249076213, + "loss": 1.7702, + "step": 4948 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002877000313432337, + "loss": 1.7285, + "step": 4949 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028769512926079817, + "loss": 1.7677, + "step": 4950 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028769022624348863, + "loss": 1.7977, + "step": 4951 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028768532229133845, + "loss": 1.8346, + "step": 4952 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002876804174043809, + "loss": 1.7731, + "step": 4953 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028767551158264933, + "loss": 1.7777, + "step": 4954 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028767060482617695, + "loss": 1.809, + "step": 4955 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002876656971349972, + "loss": 1.7922, + "step": 4956 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002876607885091433, + "loss": 1.7829, + "step": 4957 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002876558789486486, + "loss": 1.7998, + "step": 4958 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002876509684535465, + "loss": 1.7789, + "step": 4959 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002876460570238703, + "loss": 1.7699, + "step": 4960 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002876411446596532, + "loss": 1.7757, + "step": 4961 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002876362313609288, + "loss": 1.8406, + "step": 4962 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002876313171277303, + "loss": 1.7933, + "step": 4963 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028762640196009116, + "loss": 1.7499, + "step": 4964 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028762148585804466, + "loss": 1.748, + "step": 4965 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002876165688216242, + "loss": 1.7864, + "step": 4966 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028761165085086323, + "loss": 1.7634, + "step": 4967 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028760673194579503, + "loss": 1.7976, + "step": 4968 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002876018121064531, + "loss": 1.8359, + "step": 4969 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002875968913328708, + "loss": 1.8033, + "step": 4970 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002875919696250815, + "loss": 1.7293, + "step": 4971 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028758704698311874, + "loss": 1.8518, + "step": 4972 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028758212340701577, + "loss": 1.7522, + "step": 4973 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028757719889680616, + "loss": 1.7683, + "step": 4974 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028757227345252326, + "loss": 1.8087, + "step": 4975 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028756734707420056, + "loss": 1.8332, + "step": 4976 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028756241976187147, + "loss": 1.8648, + "step": 4977 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002875574915155695, + "loss": 1.7956, + "step": 4978 + }, + { + "epoch": 0.39, + "learning_rate": 0.000287552562335328, + "loss": 1.7902, + "step": 4979 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028754763222118055, + "loss": 1.7765, + "step": 4980 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002875427011731606, + "loss": 1.7793, + "step": 4981 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002875377691913016, + "loss": 1.7469, + "step": 4982 + }, + { + "epoch": 0.39, + "learning_rate": 0.000287532836275637, + "loss": 1.7882, + "step": 4983 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028752790242620043, + "loss": 1.7714, + "step": 4984 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002875229676430253, + "loss": 1.7446, + "step": 4985 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028751803192614506, + "loss": 1.7489, + "step": 4986 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002875130952755933, + "loss": 1.7698, + "step": 4987 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002875081576914034, + "loss": 1.7588, + "step": 4988 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002875032191736091, + "loss": 1.8215, + "step": 4989 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002874982797222438, + "loss": 1.7644, + "step": 4990 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028749333933734104, + "loss": 1.7709, + "step": 4991 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002874883980189344, + "loss": 1.7327, + "step": 4992 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028748345576705745, + "loss": 1.8171, + "step": 4993 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002874785125817437, + "loss": 1.8141, + "step": 4994 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002874735684630266, + "loss": 1.8399, + "step": 4995 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028746862341093993, + "loss": 1.7655, + "step": 4996 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028746367742551717, + "loss": 1.8171, + "step": 4997 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028745873050679187, + "loss": 1.8, + "step": 4998 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002874537826547977, + "loss": 1.7688, + "step": 4999 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028744883386956817, + "loss": 1.8219, + "step": 5000 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028744388415113687, + "loss": 1.7348, + "step": 5001 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028743893349953743, + "loss": 1.7209, + "step": 5002 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028743398191480356, + "loss": 1.7841, + "step": 5003 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028742902939696876, + "loss": 1.7538, + "step": 5004 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028742407594606665, + "loss": 1.7618, + "step": 5005 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028741912156213093, + "loss": 1.7619, + "step": 5006 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002874141662451952, + "loss": 1.8046, + "step": 5007 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028740920999529315, + "loss": 1.8282, + "step": 5008 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028740425281245836, + "loss": 1.8163, + "step": 5009 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002873992946967245, + "loss": 1.7597, + "step": 5010 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002873943356481253, + "loss": 1.7948, + "step": 5011 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002873893756666944, + "loss": 1.7605, + "step": 5012 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028738441475246535, + "loss": 1.7911, + "step": 5013 + }, + { + "epoch": 0.39, + "learning_rate": 0.000287379452905472, + "loss": 1.7897, + "step": 5014 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028737449012574806, + "loss": 1.7753, + "step": 5015 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028736952641332704, + "loss": 1.7807, + "step": 5016 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028736456176824273, + "loss": 1.7865, + "step": 5017 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002873595961905289, + "loss": 1.7954, + "step": 5018 + }, + { + "epoch": 0.39, + "learning_rate": 0.00028735462968021923, + "loss": 1.7662, + "step": 5019 + }, + { + "epoch": 0.39, + "learning_rate": 0.0002873496622373474, + "loss": 1.8498, + "step": 5020 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028734469386194715, + "loss": 1.6987, + "step": 5021 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002873397245540522, + "loss": 1.7412, + "step": 5022 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028733475431369634, + "loss": 1.8328, + "step": 5023 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002873297831409133, + "loss": 1.8273, + "step": 5024 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028732481103573677, + "loss": 1.8212, + "step": 5025 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002873198379982006, + "loss": 1.8613, + "step": 5026 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028731486402833845, + "loss": 1.7316, + "step": 5027 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002873098891261842, + "loss": 1.8405, + "step": 5028 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028730491329177164, + "loss": 1.7525, + "step": 5029 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002872999365251344, + "loss": 1.795, + "step": 5030 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028729495882630633, + "loss": 1.7502, + "step": 5031 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002872899801953213, + "loss": 1.8218, + "step": 5032 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002872850006322131, + "loss": 1.75, + "step": 5033 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002872800201370155, + "loss": 1.7791, + "step": 5034 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028727503870976226, + "loss": 1.7304, + "step": 5035 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002872700563504873, + "loss": 1.7654, + "step": 5036 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002872650730592244, + "loss": 1.8018, + "step": 5037 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002872600888360074, + "loss": 1.7871, + "step": 5038 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002872551036808702, + "loss": 1.809, + "step": 5039 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002872501175938465, + "loss": 1.8053, + "step": 5040 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002872451305749703, + "loss": 1.76, + "step": 5041 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028724014262427537, + "loss": 1.7399, + "step": 5042 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028723515374179566, + "loss": 1.7887, + "step": 5043 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028723016392756496, + "loss": 1.8079, + "step": 5044 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002872251731816171, + "loss": 1.7979, + "step": 5045 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028722018150398613, + "loss": 1.7651, + "step": 5046 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002872151888947059, + "loss": 1.6973, + "step": 5047 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002872101953538102, + "loss": 1.8021, + "step": 5048 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002872052008813329, + "loss": 1.7737, + "step": 5049 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028720020547730817, + "loss": 1.7758, + "step": 5050 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002871952091417697, + "loss": 1.8059, + "step": 5051 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002871902118747514, + "loss": 1.7646, + "step": 5052 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002871852136762873, + "loss": 1.8582, + "step": 5053 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028718021454641134, + "loss": 1.8179, + "step": 5054 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028717521448515736, + "loss": 1.8118, + "step": 5055 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002871702134925594, + "loss": 1.777, + "step": 5056 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002871652115686514, + "loss": 1.8057, + "step": 5057 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028716020871346736, + "loss": 1.7761, + "step": 5058 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028715520492704114, + "loss": 1.7549, + "step": 5059 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002871502002094068, + "loss": 1.7664, + "step": 5060 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028714519456059825, + "loss": 1.8068, + "step": 5061 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002871401879806495, + "loss": 1.8126, + "step": 5062 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028713518046959456, + "loss": 1.8563, + "step": 5063 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002871301720274675, + "loss": 1.7647, + "step": 5064 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028712516265430214, + "loss": 1.8037, + "step": 5065 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028712015235013265, + "loss": 1.7889, + "step": 5066 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028711514111499296, + "loss": 1.7822, + "step": 5067 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028711012894891717, + "loss": 1.7445, + "step": 5068 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028710511585193927, + "loss": 1.7453, + "step": 5069 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002871001018240933, + "loss": 1.7528, + "step": 5070 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002870950868654132, + "loss": 1.8327, + "step": 5071 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028709007097593324, + "loss": 1.7278, + "step": 5072 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002870850541556873, + "loss": 1.7863, + "step": 5073 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002870800364047095, + "loss": 1.8337, + "step": 5074 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002870750177230339, + "loss": 1.7688, + "step": 5075 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028706999811069456, + "loss": 1.8003, + "step": 5076 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028706497756772557, + "loss": 1.7959, + "step": 5077 + }, + { + "epoch": 0.4, + "learning_rate": 0.000287059956094161, + "loss": 1.7479, + "step": 5078 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028705493369003503, + "loss": 1.7948, + "step": 5079 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002870499103553816, + "loss": 1.8292, + "step": 5080 + }, + { + "epoch": 0.4, + "learning_rate": 0.000287044886090235, + "loss": 1.8242, + "step": 5081 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028703986089462924, + "loss": 1.7769, + "step": 5082 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002870348347685984, + "loss": 1.7756, + "step": 5083 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002870298077121767, + "loss": 1.8318, + "step": 5084 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002870247797253982, + "loss": 1.8246, + "step": 5085 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028701975080829706, + "loss": 1.7686, + "step": 5086 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028701472096090744, + "loss": 1.7749, + "step": 5087 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002870096901832635, + "loss": 1.8261, + "step": 5088 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002870046584753993, + "loss": 1.7398, + "step": 5089 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028699962583734914, + "loss": 1.7793, + "step": 5090 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002869945922691471, + "loss": 1.8203, + "step": 5091 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002869895577708274, + "loss": 1.7906, + "step": 5092 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028698452234242414, + "loss": 1.7509, + "step": 5093 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002869794859839716, + "loss": 1.8262, + "step": 5094 + }, + { + "epoch": 0.4, + "learning_rate": 0.000286974448695504, + "loss": 1.8095, + "step": 5095 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028696941047705543, + "loss": 1.7394, + "step": 5096 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002869643713286601, + "loss": 1.7691, + "step": 5097 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028695933125035233, + "loss": 1.7925, + "step": 5098 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028695429024216626, + "loss": 1.7781, + "step": 5099 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028694924830413614, + "loss": 1.8364, + "step": 5100 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002869442054362962, + "loss": 1.7683, + "step": 5101 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028693916163868074, + "loss": 1.7797, + "step": 5102 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028693411691132386, + "loss": 1.7223, + "step": 5103 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002869290712542599, + "loss": 1.7508, + "step": 5104 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028692402466752316, + "loss": 1.7255, + "step": 5105 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002869189771511478, + "loss": 1.7461, + "step": 5106 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002869139287051682, + "loss": 1.7666, + "step": 5107 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002869088793296185, + "loss": 1.7804, + "step": 5108 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028690382902453313, + "loss": 1.737, + "step": 5109 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002868987777899463, + "loss": 1.7358, + "step": 5110 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002868937256258923, + "loss": 1.768, + "step": 5111 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002868886725324054, + "loss": 1.8124, + "step": 5112 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028688361850952006, + "loss": 1.7219, + "step": 5113 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002868785635572704, + "loss": 1.7367, + "step": 5114 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028687350767569086, + "loss": 1.8006, + "step": 5115 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028686845086481577, + "loss": 1.7572, + "step": 5116 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002868633931246794, + "loss": 1.7994, + "step": 5117 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002868583344553161, + "loss": 1.8174, + "step": 5118 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028685327485676024, + "loss": 1.8445, + "step": 5119 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002868482143290462, + "loss": 1.8135, + "step": 5120 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002868431528722083, + "loss": 1.7811, + "step": 5121 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002868380904862809, + "loss": 1.8013, + "step": 5122 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002868330271712983, + "loss": 1.7718, + "step": 5123 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028682796292729505, + "loss": 1.7952, + "step": 5124 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002868228977543054, + "loss": 1.8517, + "step": 5125 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028681783165236376, + "loss": 1.84, + "step": 5126 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002868127646215046, + "loss": 1.7625, + "step": 5127 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002868076966617623, + "loss": 1.7845, + "step": 5128 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028680262777317113, + "loss": 1.8194, + "step": 5129 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028679755795576567, + "loss": 1.7806, + "step": 5130 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002867924872095803, + "loss": 1.8059, + "step": 5131 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002867874155346494, + "loss": 1.7681, + "step": 5132 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028678234293100745, + "loss": 1.8383, + "step": 5133 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028677726939868884, + "loss": 1.7672, + "step": 5134 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002867721949377281, + "loss": 1.7919, + "step": 5135 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028676711954815957, + "loss": 1.716, + "step": 5136 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028676204323001785, + "loss": 1.7588, + "step": 5137 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028675696598333726, + "loss": 1.7852, + "step": 5138 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028675188780815237, + "loss": 1.804, + "step": 5139 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002867468087044976, + "loss": 1.7505, + "step": 5140 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028674172867240754, + "loss": 1.7448, + "step": 5141 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028673664771191655, + "loss": 1.7705, + "step": 5142 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028673156582305917, + "loss": 1.787, + "step": 5143 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002867264830058699, + "loss": 1.7888, + "step": 5144 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002867213992603833, + "loss": 1.772, + "step": 5145 + }, + { + "epoch": 0.4, + "learning_rate": 0.0002867163145866338, + "loss": 1.7731, + "step": 5146 + }, + { + "epoch": 0.4, + "learning_rate": 0.00028671122898465604, + "loss": 1.7967, + "step": 5147 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002867061424544845, + "loss": 1.7574, + "step": 5148 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028670105499615356, + "loss": 1.8336, + "step": 5149 + }, + { + "epoch": 0.41, + "learning_rate": 0.000286695966609698, + "loss": 1.7346, + "step": 5150 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028669087729515225, + "loss": 1.77, + "step": 5151 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028668578705255086, + "loss": 1.7903, + "step": 5152 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002866806958819284, + "loss": 1.7663, + "step": 5153 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002866756037833194, + "loss": 1.7773, + "step": 5154 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028667051075675855, + "loss": 1.7954, + "step": 5155 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002866654168022803, + "loss": 1.7735, + "step": 5156 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002866603219199193, + "loss": 1.7922, + "step": 5157 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002866552261097102, + "loss": 1.8076, + "step": 5158 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028665012937168746, + "loss": 1.8073, + "step": 5159 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002866450317058857, + "loss": 1.7082, + "step": 5160 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028663993311233967, + "loss": 1.7821, + "step": 5161 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002866348335910839, + "loss": 1.768, + "step": 5162 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028662973314215294, + "loss": 1.7245, + "step": 5163 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002866246317655815, + "loss": 1.7772, + "step": 5164 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002866195294614043, + "loss": 1.7526, + "step": 5165 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028661442622965577, + "loss": 1.7753, + "step": 5166 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028660932207037076, + "loss": 1.8182, + "step": 5167 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002866042169835838, + "loss": 1.7516, + "step": 5168 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028659911096932966, + "loss": 1.7636, + "step": 5169 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028659400402764284, + "loss": 1.7672, + "step": 5170 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002865888961585581, + "loss": 1.7824, + "step": 5171 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002865837873621103, + "loss": 1.8158, + "step": 5172 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028657867763833374, + "loss": 1.7887, + "step": 5173 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028657356698726344, + "loss": 1.81, + "step": 5174 + }, + { + "epoch": 0.41, + "learning_rate": 0.000286568455408934, + "loss": 1.7677, + "step": 5175 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002865633429033801, + "loss": 1.8336, + "step": 5176 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002865582294706364, + "loss": 1.752, + "step": 5177 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002865531151107378, + "loss": 1.7691, + "step": 5178 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002865479998237188, + "loss": 1.7426, + "step": 5179 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002865428836096143, + "loss": 1.8265, + "step": 5180 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002865377664684589, + "loss": 1.7875, + "step": 5181 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028653264840028744, + "loss": 1.805, + "step": 5182 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002865275294051347, + "loss": 1.7871, + "step": 5183 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028652240948303536, + "loss": 1.7659, + "step": 5184 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028651728863402415, + "loss": 1.7531, + "step": 5185 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002865121668581359, + "loss": 1.7512, + "step": 5186 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002865070441554054, + "loss": 1.7357, + "step": 5187 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002865019205258674, + "loss": 1.81, + "step": 5188 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002864967959695566, + "loss": 1.7725, + "step": 5189 + }, + { + "epoch": 0.41, + "learning_rate": 0.000286491670486508, + "loss": 1.7357, + "step": 5190 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002864865440767562, + "loss": 1.7566, + "step": 5191 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028648141674033614, + "loss": 1.8229, + "step": 5192 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028647628847728256, + "loss": 1.7403, + "step": 5193 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002864711592876303, + "loss": 1.8231, + "step": 5194 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002864660291714142, + "loss": 1.7895, + "step": 5195 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028646089812866903, + "loss": 1.7552, + "step": 5196 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028645576615942965, + "loss": 1.7638, + "step": 5197 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028645063326373095, + "loss": 1.7812, + "step": 5198 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002864454994416077, + "loss": 1.7022, + "step": 5199 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028644036469309484, + "loss": 1.779, + "step": 5200 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028643522901822727, + "loss": 1.7618, + "step": 5201 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002864300924170397, + "loss": 1.7891, + "step": 5202 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002864249548895671, + "loss": 1.7278, + "step": 5203 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002864198164358444, + "loss": 1.8143, + "step": 5204 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002864146770559064, + "loss": 1.7599, + "step": 5205 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028640953674978796, + "loss": 1.8218, + "step": 5206 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002864043955175241, + "loss": 1.7488, + "step": 5207 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028639925335914964, + "loss": 1.7534, + "step": 5208 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028639411027469956, + "loss": 1.7911, + "step": 5209 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002863889662642087, + "loss": 1.738, + "step": 5210 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002863838213277121, + "loss": 1.8333, + "step": 5211 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028637867546524456, + "loss": 1.7458, + "step": 5212 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028637352867684105, + "loss": 1.7433, + "step": 5213 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002863683809625366, + "loss": 1.7387, + "step": 5214 + }, + { + "epoch": 0.41, + "learning_rate": 0.000286363232322366, + "loss": 1.7804, + "step": 5215 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002863580827563644, + "loss": 1.7713, + "step": 5216 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002863529322645666, + "loss": 1.7611, + "step": 5217 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002863477808470077, + "loss": 1.7624, + "step": 5218 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028634262850372257, + "loss": 1.7214, + "step": 5219 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002863374752347462, + "loss": 1.7381, + "step": 5220 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002863323210401137, + "loss": 1.7534, + "step": 5221 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002863271659198599, + "loss": 1.8259, + "step": 5222 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002863220098740199, + "loss": 1.8065, + "step": 5223 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028631685290262873, + "loss": 1.7642, + "step": 5224 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028631169500572124, + "loss": 1.7528, + "step": 5225 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028630653618333266, + "loss": 1.7849, + "step": 5226 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002863013764354979, + "loss": 1.8312, + "step": 5227 + }, + { + "epoch": 0.41, + "learning_rate": 0.000286296215762252, + "loss": 1.712, + "step": 5228 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028629105416363, + "loss": 1.8153, + "step": 5229 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028628589163966694, + "loss": 1.8157, + "step": 5230 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028628072819039793, + "loss": 1.769, + "step": 5231 + }, + { + "epoch": 0.41, + "learning_rate": 0.000286275563815858, + "loss": 1.7769, + "step": 5232 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028627039851608215, + "loss": 1.7471, + "step": 5233 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028626523229110547, + "loss": 1.772, + "step": 5234 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028626006514096314, + "loss": 1.7836, + "step": 5235 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028625489706569007, + "loss": 1.8032, + "step": 5236 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002862497280653215, + "loss": 1.7078, + "step": 5237 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028624455813989244, + "loss": 1.7216, + "step": 5238 + }, + { + "epoch": 0.41, + "learning_rate": 0.000286239387289438, + "loss": 1.8074, + "step": 5239 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002862342155139933, + "loss": 1.8136, + "step": 5240 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028622904281359353, + "loss": 1.8197, + "step": 5241 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028622386918827366, + "loss": 1.7926, + "step": 5242 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028621869463806894, + "loss": 1.7396, + "step": 5243 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028621351916301445, + "loss": 1.7375, + "step": 5244 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002862083427631453, + "loss": 1.7534, + "step": 5245 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028620316543849673, + "loss": 1.7555, + "step": 5246 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028619798718910376, + "loss": 1.7413, + "step": 5247 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002861928080150017, + "loss": 1.7935, + "step": 5248 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028618762791622556, + "loss": 1.7482, + "step": 5249 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002861824468928106, + "loss": 1.803, + "step": 5250 + }, + { + "epoch": 0.41, + "learning_rate": 0.000286177264944792, + "loss": 1.7508, + "step": 5251 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002861720820722049, + "loss": 1.7834, + "step": 5252 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028616689827508444, + "loss": 1.7677, + "step": 5253 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028616171355346593, + "loss": 1.786, + "step": 5254 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002861565279073846, + "loss": 1.7864, + "step": 5255 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028615134133687554, + "loss": 1.8466, + "step": 5256 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028614615384197397, + "loss": 1.7694, + "step": 5257 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002861409654227152, + "loss": 1.7892, + "step": 5258 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028613577607913436, + "loss": 1.7503, + "step": 5259 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028613058581126674, + "loss": 1.8474, + "step": 5260 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028612539461914756, + "loss": 1.7386, + "step": 5261 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002861202025028121, + "loss": 1.7654, + "step": 5262 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028611500946229557, + "loss": 1.8201, + "step": 5263 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002861098154976332, + "loss": 1.7867, + "step": 5264 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002861046206088603, + "loss": 1.7593, + "step": 5265 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002860994247960122, + "loss": 1.7778, + "step": 5266 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002860942280591241, + "loss": 1.7458, + "step": 5267 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028608903039823125, + "loss": 1.8195, + "step": 5268 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028608383181336896, + "loss": 1.7908, + "step": 5269 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002860786323045726, + "loss": 1.7124, + "step": 5270 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028607343187187737, + "loss": 1.8383, + "step": 5271 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028606823051531875, + "loss": 1.7792, + "step": 5272 + }, + { + "epoch": 0.41, + "learning_rate": 0.0002860630282349318, + "loss": 1.7683, + "step": 5273 + }, + { + "epoch": 0.41, + "learning_rate": 0.00028605782503075204, + "loss": 1.785, + "step": 5274 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002860526209028147, + "loss": 1.7586, + "step": 5275 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028604741585115515, + "loss": 1.8067, + "step": 5276 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028604220987580876, + "loss": 1.7819, + "step": 5277 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002860370029768108, + "loss": 1.8147, + "step": 5278 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002860317951541967, + "loss": 1.7689, + "step": 5279 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028602658640800174, + "loss": 1.7261, + "step": 5280 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002860213767382613, + "loss": 1.7918, + "step": 5281 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002860161661450109, + "loss": 1.8202, + "step": 5282 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028601095462828566, + "loss": 1.7486, + "step": 5283 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028600574218812117, + "loss": 1.7372, + "step": 5284 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002860005288245527, + "loss": 1.8298, + "step": 5285 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002859953145376157, + "loss": 1.8113, + "step": 5286 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002859900993273456, + "loss": 1.8106, + "step": 5287 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028598488319377775, + "loss": 1.7415, + "step": 5288 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028597966613694753, + "loss": 1.7283, + "step": 5289 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002859744481568905, + "loss": 1.787, + "step": 5290 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002859692292536419, + "loss": 1.8049, + "step": 5291 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028596400942723735, + "loss": 1.7788, + "step": 5292 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002859587886777122, + "loss": 1.8316, + "step": 5293 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002859535670051019, + "loss": 1.6998, + "step": 5294 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002859483444094419, + "loss": 1.7538, + "step": 5295 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028594312089076765, + "loss": 1.7893, + "step": 5296 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028593789644911464, + "loss": 1.8007, + "step": 5297 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002859326710845184, + "loss": 1.789, + "step": 5298 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002859274447970142, + "loss": 1.7597, + "step": 5299 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028592221758663776, + "loss": 1.7418, + "step": 5300 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002859169894534244, + "loss": 1.7365, + "step": 5301 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028591176039740977, + "loss": 1.7535, + "step": 5302 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028590653041862926, + "loss": 1.7362, + "step": 5303 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002859012995171184, + "loss": 1.7626, + "step": 5304 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002858960676929127, + "loss": 1.7725, + "step": 5305 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002858908349460477, + "loss": 1.7693, + "step": 5306 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002858856012765589, + "loss": 1.7346, + "step": 5307 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002858803666844819, + "loss": 1.8291, + "step": 5308 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028587513116985216, + "loss": 1.7628, + "step": 5309 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028586989473270525, + "loss": 1.7922, + "step": 5310 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028586465737307675, + "loss": 1.7141, + "step": 5311 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002858594190910022, + "loss": 1.7533, + "step": 5312 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002858541798865172, + "loss": 1.7816, + "step": 5313 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002858489397596573, + "loss": 1.7814, + "step": 5314 + }, + { + "epoch": 0.42, + "learning_rate": 0.000285843698710458, + "loss": 1.7586, + "step": 5315 + }, + { + "epoch": 0.42, + "learning_rate": 0.000285838456738955, + "loss": 1.6995, + "step": 5316 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028583321384518384, + "loss": 1.7469, + "step": 5317 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002858279700291801, + "loss": 1.7228, + "step": 5318 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002858227252909794, + "loss": 1.7466, + "step": 5319 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028581747963061735, + "loss": 1.7603, + "step": 5320 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028581223304812955, + "loss": 1.7831, + "step": 5321 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028580698554355166, + "loss": 1.7946, + "step": 5322 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028580173711691923, + "loss": 1.7855, + "step": 5323 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028579648776826805, + "loss": 1.8172, + "step": 5324 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028579123749763357, + "loss": 1.8387, + "step": 5325 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028578598630505156, + "loss": 1.7711, + "step": 5326 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028578073419055765, + "loss": 1.7273, + "step": 5327 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028577548115418745, + "loss": 1.7554, + "step": 5328 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028577022719597663, + "loss": 1.7882, + "step": 5329 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028576497231596096, + "loss": 1.7631, + "step": 5330 + }, + { + "epoch": 0.42, + "learning_rate": 0.000285759716514176, + "loss": 1.6488, + "step": 5331 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002857544597906575, + "loss": 1.8296, + "step": 5332 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028574920214544114, + "loss": 1.8361, + "step": 5333 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002857439435785626, + "loss": 1.7403, + "step": 5334 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002857386840900576, + "loss": 1.8627, + "step": 5335 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028573342367996187, + "loss": 1.8164, + "step": 5336 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002857281623483111, + "loss": 1.8016, + "step": 5337 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002857229000951409, + "loss": 1.7573, + "step": 5338 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002857176369204872, + "loss": 1.7137, + "step": 5339 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028571237282438565, + "loss": 1.7381, + "step": 5340 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028570710780687194, + "loss": 1.7898, + "step": 5341 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028570184186798187, + "loss": 1.7784, + "step": 5342 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002856965750077512, + "loss": 1.8016, + "step": 5343 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002856913072262157, + "loss": 1.7725, + "step": 5344 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028568603852341097, + "loss": 1.775, + "step": 5345 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028568076889937306, + "loss": 1.7429, + "step": 5346 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028567549835413757, + "loss": 1.7592, + "step": 5347 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002856702268877402, + "loss": 1.8076, + "step": 5348 + }, + { + "epoch": 0.42, + "learning_rate": 0.000285664954500217, + "loss": 1.7915, + "step": 5349 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002856596811916036, + "loss": 1.7854, + "step": 5350 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002856544069619358, + "loss": 1.7694, + "step": 5351 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028564913181124943, + "loss": 1.768, + "step": 5352 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028564385573958035, + "loss": 1.8167, + "step": 5353 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002856385787469643, + "loss": 1.7779, + "step": 5354 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002856333008334372, + "loss": 1.795, + "step": 5355 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002856280219990348, + "loss": 1.7551, + "step": 5356 + }, + { + "epoch": 0.42, + "learning_rate": 0.000285622742243793, + "loss": 1.8142, + "step": 5357 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028561746156774756, + "loss": 1.8006, + "step": 5358 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028561217997093445, + "loss": 1.7735, + "step": 5359 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002856068974533895, + "loss": 1.7413, + "step": 5360 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002856016140151485, + "loss": 1.7811, + "step": 5361 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002855963296562474, + "loss": 1.7915, + "step": 5362 + }, + { + "epoch": 0.42, + "learning_rate": 0.000285591044376722, + "loss": 1.7884, + "step": 5363 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002855857581766083, + "loss": 1.7301, + "step": 5364 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002855804710559421, + "loss": 1.7426, + "step": 5365 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002855751830147593, + "loss": 1.7577, + "step": 5366 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028556989405309583, + "loss": 1.8295, + "step": 5367 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028556460417098763, + "loss": 1.7762, + "step": 5368 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028555931336847056, + "loss": 1.7732, + "step": 5369 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028555402164558055, + "loss": 1.7617, + "step": 5370 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002855487290023536, + "loss": 1.8117, + "step": 5371 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028554343543882543, + "loss": 1.7446, + "step": 5372 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028553814095503226, + "loss": 1.7583, + "step": 5373 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028553284555100987, + "loss": 1.7512, + "step": 5374 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028552754922679424, + "loss": 1.7919, + "step": 5375 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002855222519824214, + "loss": 1.8223, + "step": 5376 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002855169538179272, + "loss": 1.7305, + "step": 5377 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028551165473334774, + "loss": 1.7764, + "step": 5378 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002855063547287188, + "loss": 1.734, + "step": 5379 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028550105380407655, + "loss": 1.7133, + "step": 5380 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028549575195945697, + "loss": 1.7846, + "step": 5381 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028549044919489597, + "loss": 1.7865, + "step": 5382 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002854851455104296, + "loss": 1.8001, + "step": 5383 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028547984090609383, + "loss": 1.7215, + "step": 5384 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028547453538192475, + "loss": 1.8184, + "step": 5385 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028546922893795827, + "loss": 1.7833, + "step": 5386 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002854639215742305, + "loss": 1.7822, + "step": 5387 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002854586132907775, + "loss": 1.8311, + "step": 5388 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028545330408763525, + "loss": 1.7938, + "step": 5389 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002854479939648398, + "loss": 1.8029, + "step": 5390 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002854426829224272, + "loss": 1.8155, + "step": 5391 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002854373709604336, + "loss": 1.7583, + "step": 5392 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002854320580788949, + "loss": 1.7514, + "step": 5393 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028542674427784734, + "loss": 1.7528, + "step": 5394 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002854214295573269, + "loss": 1.7312, + "step": 5395 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028541611391736966, + "loss": 1.7452, + "step": 5396 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028541079735801175, + "loss": 1.7372, + "step": 5397 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028540547987928927, + "loss": 1.832, + "step": 5398 + }, + { + "epoch": 0.42, + "learning_rate": 0.00028540016148123826, + "loss": 1.7673, + "step": 5399 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002853948421638949, + "loss": 1.7895, + "step": 5400 + }, + { + "epoch": 0.42, + "learning_rate": 0.0002853895219272953, + "loss": 1.7529, + "step": 5401 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002853842007714755, + "loss": 1.7536, + "step": 5402 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028537887869647174, + "loss": 1.7772, + "step": 5403 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002853735557023201, + "loss": 1.7656, + "step": 5404 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028536823178905673, + "loss": 1.7377, + "step": 5405 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028536290695671773, + "loss": 1.7402, + "step": 5406 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002853575812053393, + "loss": 1.765, + "step": 5407 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028535225453495757, + "loss": 1.7293, + "step": 5408 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002853469269456088, + "loss": 1.7529, + "step": 5409 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028534159843732903, + "loss": 1.7844, + "step": 5410 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002853362690101545, + "loss": 1.7208, + "step": 5411 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002853309386641214, + "loss": 1.7058, + "step": 5412 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028532560739926593, + "loss": 1.7506, + "step": 5413 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002853202752156242, + "loss": 1.7777, + "step": 5414 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028531494211323253, + "loss": 1.7935, + "step": 5415 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028530960809212703, + "loss": 1.7833, + "step": 5416 + }, + { + "epoch": 0.43, + "learning_rate": 0.000285304273152344, + "loss": 1.7986, + "step": 5417 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028529893729391963, + "loss": 1.7971, + "step": 5418 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002852936005168901, + "loss": 1.7834, + "step": 5419 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002852882628212917, + "loss": 1.7771, + "step": 5420 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028528292420716066, + "loss": 1.8097, + "step": 5421 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028527758467453325, + "loss": 1.7389, + "step": 5422 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028527224422344565, + "loss": 1.7747, + "step": 5423 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002852669028539342, + "loss": 1.7963, + "step": 5424 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002852615605660351, + "loss": 1.7608, + "step": 5425 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028525621735978464, + "loss": 1.7877, + "step": 5426 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028525087323521913, + "loss": 1.7734, + "step": 5427 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002852455281923748, + "loss": 1.7754, + "step": 5428 + }, + { + "epoch": 0.43, + "learning_rate": 0.000285240182231288, + "loss": 1.7534, + "step": 5429 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002852348353519949, + "loss": 1.8209, + "step": 5430 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028522948755453203, + "loss": 1.738, + "step": 5431 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002852241388389355, + "loss": 1.7723, + "step": 5432 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002852187892052417, + "loss": 1.7189, + "step": 5433 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028521343865348694, + "loss": 1.7449, + "step": 5434 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028520808718370753, + "loss": 1.7392, + "step": 5435 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028520273479593983, + "loss": 1.838, + "step": 5436 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002851973814902202, + "loss": 1.77, + "step": 5437 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028519202726658496, + "loss": 1.7456, + "step": 5438 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002851866721250704, + "loss": 1.7617, + "step": 5439 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028518131606571296, + "loss": 1.8237, + "step": 5440 + }, + { + "epoch": 0.43, + "learning_rate": 0.000285175959088549, + "loss": 1.7948, + "step": 5441 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002851706011936149, + "loss": 1.7875, + "step": 5442 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028516524238094695, + "loss": 1.7442, + "step": 5443 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028515988265058164, + "loss": 1.7516, + "step": 5444 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002851545220025553, + "loss": 1.7531, + "step": 5445 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002851491604369044, + "loss": 1.7123, + "step": 5446 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002851437979536652, + "loss": 1.7695, + "step": 5447 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002851384345528742, + "loss": 1.7631, + "step": 5448 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002851330702345678, + "loss": 1.7434, + "step": 5449 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002851277049987825, + "loss": 1.7635, + "step": 5450 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002851223388455546, + "loss": 1.7425, + "step": 5451 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028511697177492054, + "loss": 1.8299, + "step": 5452 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028511160378691684, + "loss": 1.7585, + "step": 5453 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028510623488157993, + "loss": 1.775, + "step": 5454 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028510086505894623, + "loss": 1.727, + "step": 5455 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002850954943190522, + "loss": 1.7398, + "step": 5456 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028509012266193437, + "loss": 1.7321, + "step": 5457 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002850847500876291, + "loss": 1.7883, + "step": 5458 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002850793765961729, + "loss": 1.7911, + "step": 5459 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028507400218760233, + "loss": 1.6898, + "step": 5460 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002850686268619538, + "loss": 1.7579, + "step": 5461 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002850632506192639, + "loss": 1.7504, + "step": 5462 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028505787345956896, + "loss": 1.7991, + "step": 5463 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028505249538290564, + "loss": 1.7785, + "step": 5464 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002850471163893104, + "loss": 1.851, + "step": 5465 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028504173647881975, + "loss": 1.7945, + "step": 5466 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028503635565147026, + "loss": 1.8289, + "step": 5467 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002850309739072984, + "loss": 1.7579, + "step": 5468 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002850255912463408, + "loss": 1.7373, + "step": 5469 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002850202076686339, + "loss": 1.8047, + "step": 5470 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028501482317421433, + "loss": 1.7606, + "step": 5471 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002850094377631186, + "loss": 1.7851, + "step": 5472 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002850040514353833, + "loss": 1.8154, + "step": 5473 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028499866419104495, + "loss": 1.8063, + "step": 5474 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002849932760301402, + "loss": 1.7435, + "step": 5475 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002849878869527056, + "loss": 1.6951, + "step": 5476 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028498249695877776, + "loss": 1.7634, + "step": 5477 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002849771060483932, + "loss": 1.7441, + "step": 5478 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028497171422158863, + "loss": 1.812, + "step": 5479 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002849663214784006, + "loss": 1.7733, + "step": 5480 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002849609278188657, + "loss": 1.7971, + "step": 5481 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002849555332430206, + "loss": 1.7654, + "step": 5482 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002849501377509019, + "loss": 1.7983, + "step": 5483 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028494474134254624, + "loss": 1.7674, + "step": 5484 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028493934401799026, + "loss": 1.7621, + "step": 5485 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002849339457772706, + "loss": 1.7941, + "step": 5486 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002849285466204239, + "loss": 1.7642, + "step": 5487 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002849231465474868, + "loss": 1.7631, + "step": 5488 + }, + { + "epoch": 0.43, + "learning_rate": 0.000284917745558496, + "loss": 1.7804, + "step": 5489 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028491234365348817, + "loss": 1.7204, + "step": 5490 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028490694083250004, + "loss": 1.7214, + "step": 5491 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028490153709556816, + "loss": 1.8211, + "step": 5492 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028489613244272934, + "loss": 1.7949, + "step": 5493 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028489072687402017, + "loss": 1.7205, + "step": 5494 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028488532038947745, + "loss": 1.7198, + "step": 5495 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002848799129891378, + "loss": 1.7365, + "step": 5496 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028487450467303796, + "loss": 1.7533, + "step": 5497 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002848690954412147, + "loss": 1.7726, + "step": 5498 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002848636852937047, + "loss": 1.7724, + "step": 5499 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002848582742305447, + "loss": 1.75, + "step": 5500 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028485286225177144, + "loss": 1.7832, + "step": 5501 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002848474493574216, + "loss": 1.7258, + "step": 5502 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002848420355475321, + "loss": 1.8306, + "step": 5503 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028483662082213953, + "loss": 1.7778, + "step": 5504 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028483120518128075, + "loss": 1.7619, + "step": 5505 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028482578862499246, + "loss": 1.786, + "step": 5506 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028482037115331145, + "loss": 1.8107, + "step": 5507 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002848149527662746, + "loss": 1.787, + "step": 5508 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028480953346391856, + "loss": 1.7587, + "step": 5509 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002848041132462802, + "loss": 1.7506, + "step": 5510 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002847986921133963, + "loss": 1.787, + "step": 5511 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028479327006530365, + "loss": 1.7577, + "step": 5512 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028478784710203906, + "loss": 1.7206, + "step": 5513 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002847824232236394, + "loss": 1.7409, + "step": 5514 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002847769984301415, + "loss": 1.7694, + "step": 5515 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002847715727215821, + "loss": 1.7837, + "step": 5516 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002847661460979981, + "loss": 1.7812, + "step": 5517 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002847607185594264, + "loss": 1.7703, + "step": 5518 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028475529010590374, + "loss": 1.8262, + "step": 5519 + }, + { + "epoch": 0.43, + "learning_rate": 0.000284749860737467, + "loss": 1.7697, + "step": 5520 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028474443045415314, + "loss": 1.794, + "step": 5521 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002847389992559989, + "loss": 1.8139, + "step": 5522 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002847335671430412, + "loss": 1.7517, + "step": 5523 + }, + { + "epoch": 0.43, + "learning_rate": 0.000284728134115317, + "loss": 1.7891, + "step": 5524 + }, + { + "epoch": 0.43, + "learning_rate": 0.00028472270017286305, + "loss": 1.7384, + "step": 5525 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002847172653157163, + "loss": 1.7808, + "step": 5526 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002847118295439137, + "loss": 1.7894, + "step": 5527 + }, + { + "epoch": 0.43, + "learning_rate": 0.0002847063928574921, + "loss": 1.7938, + "step": 5528 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002847009552564884, + "loss": 1.7854, + "step": 5529 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028469551674093965, + "loss": 1.748, + "step": 5530 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002846900773108826, + "loss": 1.7661, + "step": 5531 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002846846369663543, + "loss": 1.8261, + "step": 5532 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028467919570739157, + "loss": 1.7546, + "step": 5533 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028467375353403144, + "loss": 1.7267, + "step": 5534 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028466831044631093, + "loss": 1.8035, + "step": 5535 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002846628664442668, + "loss": 1.7166, + "step": 5536 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028465742152793615, + "loss": 1.7348, + "step": 5537 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028465197569735594, + "loss": 1.6903, + "step": 5538 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002846465289525631, + "loss": 1.8084, + "step": 5539 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028464108129359466, + "loss": 1.785, + "step": 5540 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002846356327204876, + "loss": 1.7668, + "step": 5541 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028463018323327883, + "loss": 1.722, + "step": 5542 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002846247328320054, + "loss": 1.7894, + "step": 5543 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002846192815167044, + "loss": 1.7357, + "step": 5544 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002846138292874127, + "loss": 1.7978, + "step": 5545 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002846083761441674, + "loss": 1.767, + "step": 5546 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028460292208700556, + "loss": 1.7703, + "step": 5547 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002845974671159641, + "loss": 1.7564, + "step": 5548 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028459201123108015, + "loss": 1.7464, + "step": 5549 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028458655443239065, + "loss": 1.7376, + "step": 5550 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002845810967199328, + "loss": 1.6681, + "step": 5551 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028457563809374355, + "loss": 1.7194, + "step": 5552 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028457017855385995, + "loss": 1.6932, + "step": 5553 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002845647181003191, + "loss": 1.8475, + "step": 5554 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028455925673315815, + "loss": 1.7013, + "step": 5555 + }, + { + "epoch": 0.44, + "learning_rate": 0.000284553794452414, + "loss": 1.7472, + "step": 5556 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028454833125812393, + "loss": 1.7513, + "step": 5557 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002845428671503249, + "loss": 1.7009, + "step": 5558 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028453740212905403, + "loss": 1.7531, + "step": 5559 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002845319361943485, + "loss": 1.7463, + "step": 5560 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002845264693462453, + "loss": 1.7527, + "step": 5561 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028452100158478166, + "loss": 1.75, + "step": 5562 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002845155329099946, + "loss": 1.7319, + "step": 5563 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002845100633219213, + "loss": 1.7536, + "step": 5564 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028450459282059896, + "loss": 1.7094, + "step": 5565 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028449912140606463, + "loss": 1.791, + "step": 5566 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002844936490783555, + "loss": 1.7285, + "step": 5567 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002844881758375087, + "loss": 1.7461, + "step": 5568 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002844827016835614, + "loss": 1.7533, + "step": 5569 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028447722661655077, + "loss": 1.7665, + "step": 5570 + }, + { + "epoch": 0.44, + "learning_rate": 0.000284471750636514, + "loss": 1.8111, + "step": 5571 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028446627374348826, + "loss": 1.7533, + "step": 5572 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002844607959375107, + "loss": 1.7661, + "step": 5573 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002844553172186186, + "loss": 1.8473, + "step": 5574 + }, + { + "epoch": 0.44, + "learning_rate": 0.000284449837586849, + "loss": 1.7877, + "step": 5575 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002844443570422392, + "loss": 1.8129, + "step": 5576 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028443887558482646, + "loss": 1.7782, + "step": 5577 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002844333932146479, + "loss": 1.7673, + "step": 5578 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002844279099317408, + "loss": 1.7422, + "step": 5579 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028442242573614246, + "loss": 1.7842, + "step": 5580 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028441694062788993, + "loss": 1.7385, + "step": 5581 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002844114546070206, + "loss": 1.7277, + "step": 5582 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002844059676735716, + "loss": 1.7883, + "step": 5583 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002844004798275803, + "loss": 1.7101, + "step": 5584 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028439499106908394, + "loss": 1.7103, + "step": 5585 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002843895013981197, + "loss": 1.8038, + "step": 5586 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002843840108147249, + "loss": 1.7531, + "step": 5587 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002843785193189369, + "loss": 1.7961, + "step": 5588 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028437302691079286, + "loss": 1.7089, + "step": 5589 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002843675335903301, + "loss": 1.7704, + "step": 5590 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028436203935758596, + "loss": 1.7399, + "step": 5591 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028435654421259777, + "loss": 1.7981, + "step": 5592 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002843510481554027, + "loss": 1.7534, + "step": 5593 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002843455511860382, + "loss": 1.7652, + "step": 5594 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028434005330454156, + "loss": 1.6997, + "step": 5595 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002843345545109501, + "loss": 1.7387, + "step": 5596 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028432905480530113, + "loss": 1.7178, + "step": 5597 + }, + { + "epoch": 0.44, + "learning_rate": 0.000284323554187632, + "loss": 1.7162, + "step": 5598 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028431805265798007, + "loss": 1.7747, + "step": 5599 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028431255021638265, + "loss": 1.7294, + "step": 5600 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028430704686287716, + "loss": 1.7239, + "step": 5601 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028430154259750093, + "loss": 1.7379, + "step": 5602 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028429603742029133, + "loss": 1.7418, + "step": 5603 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002842905313312858, + "loss": 1.7781, + "step": 5604 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028428502433052165, + "loss": 1.7584, + "step": 5605 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028427951641803623, + "loss": 1.7401, + "step": 5606 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028427400759386705, + "loss": 1.7219, + "step": 5607 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002842684978580515, + "loss": 1.7553, + "step": 5608 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028426298721062685, + "loss": 1.7212, + "step": 5609 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028425747565163066, + "loss": 1.7838, + "step": 5610 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002842519631811003, + "loss": 1.7903, + "step": 5611 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002842464497990732, + "loss": 1.796, + "step": 5612 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002842409355055868, + "loss": 1.7426, + "step": 5613 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028423542030067846, + "loss": 1.7612, + "step": 5614 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002842299041843857, + "loss": 1.7338, + "step": 5615 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002842243871567461, + "loss": 1.7703, + "step": 5616 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028421886921779684, + "loss": 1.7707, + "step": 5617 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028421335036757557, + "loss": 1.6947, + "step": 5618 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002842078306061197, + "loss": 1.7164, + "step": 5619 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028420230993346675, + "loss": 1.7273, + "step": 5620 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002841967883496542, + "loss": 1.768, + "step": 5621 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002841912658547194, + "loss": 1.7268, + "step": 5622 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028418574244870007, + "loss": 1.7282, + "step": 5623 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028418021813163356, + "loss": 1.7357, + "step": 5624 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002841746929035574, + "loss": 1.7542, + "step": 5625 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002841691667645092, + "loss": 1.7145, + "step": 5626 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002841636397145263, + "loss": 1.7535, + "step": 5627 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002841581117536464, + "loss": 1.7263, + "step": 5628 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002841525828819069, + "loss": 1.8061, + "step": 5629 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002841470530993454, + "loss": 1.7372, + "step": 5630 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028414152240599944, + "loss": 1.7583, + "step": 5631 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002841359908019066, + "loss": 1.7421, + "step": 5632 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028413045828710434, + "loss": 1.7744, + "step": 5633 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002841249248616304, + "loss": 1.7501, + "step": 5634 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002841193905255221, + "loss": 1.7295, + "step": 5635 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028411385527881723, + "loss": 1.7487, + "step": 5636 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002841083191215533, + "loss": 1.7862, + "step": 5637 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002841027820537678, + "loss": 1.7278, + "step": 5638 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002840972440754985, + "loss": 1.7418, + "step": 5639 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002840917051867829, + "loss": 1.7718, + "step": 5640 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028408616538765866, + "loss": 1.7874, + "step": 5641 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028408062467816334, + "loss": 1.7958, + "step": 5642 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002840750830583345, + "loss": 1.7427, + "step": 5643 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002840695405282099, + "loss": 1.8179, + "step": 5644 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028406399708782705, + "loss": 1.7859, + "step": 5645 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002840584527372237, + "loss": 1.7789, + "step": 5646 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002840529074764374, + "loss": 1.7767, + "step": 5647 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002840473613055058, + "loss": 1.8074, + "step": 5648 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028404181422446667, + "loss": 1.7618, + "step": 5649 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028403626623335756, + "loss": 1.7828, + "step": 5650 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028403071733221615, + "loss": 1.7641, + "step": 5651 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028402516752108016, + "loss": 1.7566, + "step": 5652 + }, + { + "epoch": 0.44, + "learning_rate": 0.0002840196167999872, + "loss": 1.7505, + "step": 5653 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028401406516897506, + "loss": 1.7285, + "step": 5654 + }, + { + "epoch": 0.44, + "learning_rate": 0.00028400851262808135, + "loss": 1.8047, + "step": 5655 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002840029591773438, + "loss": 1.746, + "step": 5656 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028399740481680006, + "loss": 1.7788, + "step": 5657 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002839918495464879, + "loss": 1.7521, + "step": 5658 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028398629336644503, + "loss": 1.6955, + "step": 5659 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002839807362767092, + "loss": 1.7568, + "step": 5660 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002839751782773181, + "loss": 1.6827, + "step": 5661 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002839696193683094, + "loss": 1.7588, + "step": 5662 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028396405954972105, + "loss": 1.7498, + "step": 5663 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028395849882159054, + "loss": 1.7852, + "step": 5664 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028395293718395584, + "loss": 1.7424, + "step": 5665 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002839473746368546, + "loss": 1.747, + "step": 5666 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028394181118032453, + "loss": 1.7713, + "step": 5667 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028393624681440354, + "loss": 1.7662, + "step": 5668 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028393068153912933, + "loss": 1.7482, + "step": 5669 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002839251153545397, + "loss": 1.7983, + "step": 5670 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002839195482606725, + "loss": 1.7277, + "step": 5671 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028391398025756534, + "loss": 1.7389, + "step": 5672 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002839084113452563, + "loss": 1.6993, + "step": 5673 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028390284152378294, + "loss": 1.7232, + "step": 5674 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002838972707931832, + "loss": 1.7244, + "step": 5675 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002838916991534949, + "loss": 1.6969, + "step": 5676 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002838861266047559, + "loss": 1.7743, + "step": 5677 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028388055314700387, + "loss": 1.7841, + "step": 5678 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028387497878027687, + "loss": 1.7378, + "step": 5679 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028386940350461255, + "loss": 1.7664, + "step": 5680 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002838638273200489, + "loss": 1.7751, + "step": 5681 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028385825022662377, + "loss": 1.7228, + "step": 5682 + }, + { + "epoch": 0.45, + "learning_rate": 0.000283852672224375, + "loss": 1.7516, + "step": 5683 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002838470933133404, + "loss": 1.7363, + "step": 5684 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002838415134935579, + "loss": 1.6928, + "step": 5685 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028383593276506535, + "loss": 1.6959, + "step": 5686 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028383035112790073, + "loss": 1.7759, + "step": 5687 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002838247685821019, + "loss": 1.7249, + "step": 5688 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028381918512770666, + "loss": 1.741, + "step": 5689 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028381360076475305, + "loss": 1.7614, + "step": 5690 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028380801549327895, + "loss": 1.7305, + "step": 5691 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028380242931332224, + "loss": 1.7761, + "step": 5692 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002837968422249209, + "loss": 1.8307, + "step": 5693 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002837912542281128, + "loss": 1.7658, + "step": 5694 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028378566532293595, + "loss": 1.7519, + "step": 5695 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028378007550942827, + "loss": 1.7479, + "step": 5696 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028377448478762767, + "loss": 1.732, + "step": 5697 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028376889315757215, + "loss": 1.7833, + "step": 5698 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028376330061929966, + "loss": 1.804, + "step": 5699 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002837577071728482, + "loss": 1.7489, + "step": 5700 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028375211281825573, + "loss": 1.7838, + "step": 5701 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002837465175555601, + "loss": 1.7723, + "step": 5702 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002837409213847996, + "loss": 1.7778, + "step": 5703 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028373532430601197, + "loss": 1.7513, + "step": 5704 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028372972631923526, + "loss": 1.7986, + "step": 5705 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028372412742450753, + "loss": 1.7059, + "step": 5706 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002837185276218668, + "loss": 1.7452, + "step": 5707 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028371292691135104, + "loss": 1.7699, + "step": 5708 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002837073252929983, + "loss": 1.7875, + "step": 5709 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028370172276684656, + "loss": 1.7451, + "step": 5710 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028369611933293394, + "loss": 1.7751, + "step": 5711 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002836905149912985, + "loss": 1.6999, + "step": 5712 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002836849097419781, + "loss": 1.766, + "step": 5713 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002836793035850111, + "loss": 1.7244, + "step": 5714 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002836736965204353, + "loss": 1.7591, + "step": 5715 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002836680885482889, + "loss": 1.7189, + "step": 5716 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028366247966860996, + "loss": 1.7841, + "step": 5717 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002836568698814365, + "loss": 1.7912, + "step": 5718 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028365125918680667, + "loss": 1.7726, + "step": 5719 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028364564758475856, + "loss": 1.7983, + "step": 5720 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028364003507533027, + "loss": 1.7505, + "step": 5721 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028363442165855985, + "loss": 1.7568, + "step": 5722 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028362880733448547, + "loss": 1.7721, + "step": 5723 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028362319210314523, + "loss": 1.7586, + "step": 5724 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028361757596457725, + "loss": 1.7901, + "step": 5725 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002836119589188197, + "loss": 1.7695, + "step": 5726 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002836063409659106, + "loss": 1.7329, + "step": 5727 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002836007221058882, + "loss": 1.7158, + "step": 5728 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028359510233879064, + "loss": 1.6727, + "step": 5729 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028358948166465613, + "loss": 1.6923, + "step": 5730 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002835838600835227, + "loss": 1.8064, + "step": 5731 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028357823759542856, + "loss": 1.7706, + "step": 5732 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028357261420041194, + "loss": 1.7537, + "step": 5733 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028356698989851094, + "loss": 1.7257, + "step": 5734 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002835613646897638, + "loss": 1.7715, + "step": 5735 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002835557385742087, + "loss": 1.724, + "step": 5736 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028355011155188387, + "loss": 1.7564, + "step": 5737 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002835444836228274, + "loss": 1.7195, + "step": 5738 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002835388547870776, + "loss": 1.8489, + "step": 5739 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028353322504467277, + "loss": 1.7512, + "step": 5740 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002835275943956509, + "loss": 1.7488, + "step": 5741 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002835219628400505, + "loss": 1.7738, + "step": 5742 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028351633037790953, + "loss": 1.7144, + "step": 5743 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028351069700926644, + "loss": 1.7711, + "step": 5744 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002835050627341593, + "loss": 1.7423, + "step": 5745 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028349942755262654, + "loss": 1.7522, + "step": 5746 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028349379146470633, + "loss": 1.7726, + "step": 5747 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002834881544704369, + "loss": 1.7595, + "step": 5748 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028348251656985655, + "loss": 1.7061, + "step": 5749 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002834768777630037, + "loss": 1.7545, + "step": 5750 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002834712380499164, + "loss": 1.7419, + "step": 5751 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028346559743063307, + "loss": 1.786, + "step": 5752 + }, + { + "epoch": 0.45, + "learning_rate": 0.000283459955905192, + "loss": 1.8005, + "step": 5753 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002834543134736314, + "loss": 1.7811, + "step": 5754 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002834486701359898, + "loss": 1.7368, + "step": 5755 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028344302589230526, + "loss": 1.7161, + "step": 5756 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002834373807426162, + "loss": 1.6974, + "step": 5757 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028343173468696107, + "loss": 1.7741, + "step": 5758 + }, + { + "epoch": 0.45, + "learning_rate": 0.000283426087725378, + "loss": 1.7655, + "step": 5759 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028342043985790546, + "loss": 1.7166, + "step": 5760 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002834147910845818, + "loss": 1.7039, + "step": 5761 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002834091414054453, + "loss": 1.7741, + "step": 5762 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028340349082053433, + "loss": 1.8258, + "step": 5763 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002833978393298873, + "loss": 1.8011, + "step": 5764 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002833921869335425, + "loss": 1.7801, + "step": 5765 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002833865336315384, + "loss": 1.7179, + "step": 5766 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028338087942391337, + "loss": 1.7158, + "step": 5767 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002833752243107058, + "loss": 1.7789, + "step": 5768 + }, + { + "epoch": 0.45, + "learning_rate": 0.000283369568291954, + "loss": 1.7765, + "step": 5769 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002833639113676965, + "loss": 1.778, + "step": 5770 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028335825353797153, + "loss": 1.7731, + "step": 5771 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002833525948028177, + "loss": 1.807, + "step": 5772 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002833469351622733, + "loss": 1.8399, + "step": 5773 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028334127461637684, + "loss": 1.7909, + "step": 5774 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028333561316516665, + "loss": 1.7203, + "step": 5775 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028332995080868127, + "loss": 1.7137, + "step": 5776 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028332428754695906, + "loss": 1.8245, + "step": 5777 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002833186233800386, + "loss": 1.7043, + "step": 5778 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028331295830795813, + "loss": 1.7199, + "step": 5779 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028330729233075634, + "loss": 1.7488, + "step": 5780 + }, + { + "epoch": 0.45, + "learning_rate": 0.00028330162544847157, + "loss": 1.7223, + "step": 5781 + }, + { + "epoch": 0.45, + "learning_rate": 0.0002832959576611423, + "loss": 1.7393, + "step": 5782 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002832902889688071, + "loss": 1.7445, + "step": 5783 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028328461937150435, + "loss": 1.7209, + "step": 5784 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002832789488692726, + "loss": 1.786, + "step": 5785 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028327327746215027, + "loss": 1.7588, + "step": 5786 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028326760515017603, + "loss": 1.7391, + "step": 5787 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028326193193338824, + "loss": 1.7547, + "step": 5788 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002832562578118255, + "loss": 1.7407, + "step": 5789 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002832505827855263, + "loss": 1.7628, + "step": 5790 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002832449068545292, + "loss": 1.7346, + "step": 5791 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002832392300188726, + "loss": 1.7203, + "step": 5792 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002832335522785953, + "loss": 1.7586, + "step": 5793 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002832278736337356, + "loss": 1.7596, + "step": 5794 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028322219408433223, + "loss": 1.756, + "step": 5795 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028321651363042365, + "loss": 1.7617, + "step": 5796 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002832108322720484, + "loss": 1.8447, + "step": 5797 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028320515000924523, + "loss": 1.8204, + "step": 5798 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002831994668420525, + "loss": 1.7361, + "step": 5799 + }, + { + "epoch": 0.46, + "learning_rate": 0.000283193782770509, + "loss": 1.7862, + "step": 5800 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002831880977946531, + "loss": 1.797, + "step": 5801 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002831824119145236, + "loss": 1.72, + "step": 5802 + }, + { + "epoch": 0.46, + "learning_rate": 0.000283176725130159, + "loss": 1.747, + "step": 5803 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002831710374415979, + "loss": 1.752, + "step": 5804 + }, + { + "epoch": 0.46, + "learning_rate": 0.000283165348848879, + "loss": 1.8023, + "step": 5805 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002831596593520408, + "loss": 1.7759, + "step": 5806 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028315396895112205, + "loss": 1.7615, + "step": 5807 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028314827764616126, + "loss": 1.7967, + "step": 5808 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002831425854371972, + "loss": 1.7357, + "step": 5809 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002831368923242685, + "loss": 1.7686, + "step": 5810 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028313119830741367, + "loss": 1.7653, + "step": 5811 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028312550338667155, + "loss": 1.7987, + "step": 5812 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002831198075620807, + "loss": 1.7577, + "step": 5813 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002831141108336798, + "loss": 1.738, + "step": 5814 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002831084132015076, + "loss": 1.755, + "step": 5815 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028310271466560266, + "loss": 1.7782, + "step": 5816 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002830970152260038, + "loss": 1.7861, + "step": 5817 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002830913148827496, + "loss": 1.7542, + "step": 5818 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028308561363587885, + "loss": 1.8072, + "step": 5819 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028307991148543026, + "loss": 1.7424, + "step": 5820 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028307420843144243, + "loss": 1.7708, + "step": 5821 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002830685044739542, + "loss": 1.7454, + "step": 5822 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002830627996130043, + "loss": 1.7777, + "step": 5823 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028305709384863136, + "loss": 1.7144, + "step": 5824 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002830513871808742, + "loss": 1.7414, + "step": 5825 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028304567960977156, + "loss": 1.7461, + "step": 5826 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002830399711353622, + "loss": 1.7013, + "step": 5827 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002830342617576848, + "loss": 1.7324, + "step": 5828 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028302855147677814, + "loss": 1.7198, + "step": 5829 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002830228402926811, + "loss": 1.7489, + "step": 5830 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028301712820543237, + "loss": 1.6915, + "step": 5831 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028301141521507077, + "loss": 1.7466, + "step": 5832 + }, + { + "epoch": 0.46, + "learning_rate": 0.000283005701321635, + "loss": 1.7427, + "step": 5833 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028299998652516395, + "loss": 1.7652, + "step": 5834 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002829942708256964, + "loss": 1.7718, + "step": 5835 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028298855422327114, + "loss": 1.7657, + "step": 5836 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028298283671792697, + "loss": 1.7428, + "step": 5837 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002829771183097027, + "loss": 1.7426, + "step": 5838 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002829713989986372, + "loss": 1.812, + "step": 5839 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002829656787847693, + "loss": 1.7145, + "step": 5840 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002829599576681378, + "loss": 1.7772, + "step": 5841 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028295423564878155, + "loss": 1.7236, + "step": 5842 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002829485127267394, + "loss": 1.7365, + "step": 5843 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002829427889020503, + "loss": 1.7083, + "step": 5844 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028293706417475295, + "loss": 1.7294, + "step": 5845 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028293133854488634, + "loss": 1.7473, + "step": 5846 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028292561201248925, + "loss": 1.7058, + "step": 5847 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028291988457760064, + "loss": 1.7552, + "step": 5848 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028291415624025933, + "loss": 1.7927, + "step": 5849 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002829084270005043, + "loss": 1.7293, + "step": 5850 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028290269685837436, + "loss": 1.7065, + "step": 5851 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002828969658139085, + "loss": 1.7332, + "step": 5852 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002828912338671455, + "loss": 1.7918, + "step": 5853 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002828855010181244, + "loss": 1.809, + "step": 5854 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002828797672668841, + "loss": 1.7228, + "step": 5855 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002828740326134635, + "loss": 1.7241, + "step": 5856 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028286829705790153, + "loss": 1.6957, + "step": 5857 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002828625606002371, + "loss": 1.7006, + "step": 5858 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028285682324050924, + "loss": 1.6802, + "step": 5859 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002828510849787569, + "loss": 1.7942, + "step": 5860 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028284534581501903, + "loss": 1.7433, + "step": 5861 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002828396057493345, + "loss": 1.7092, + "step": 5862 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002828338647817424, + "loss": 1.6962, + "step": 5863 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028282812291228164, + "loss": 1.734, + "step": 5864 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028282238014099123, + "loss": 1.7522, + "step": 5865 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028281663646791014, + "loss": 1.7451, + "step": 5866 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002828108918930774, + "loss": 1.8301, + "step": 5867 + }, + { + "epoch": 0.46, + "learning_rate": 0.000282805146416532, + "loss": 1.7581, + "step": 5868 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028279940003831294, + "loss": 1.7312, + "step": 5869 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028279365275845925, + "loss": 1.7344, + "step": 5870 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028278790457700987, + "loss": 1.7213, + "step": 5871 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028278215549400393, + "loss": 1.7604, + "step": 5872 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028277640550948053, + "loss": 1.7778, + "step": 5873 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002827706546234785, + "loss": 1.8177, + "step": 5874 + }, + { + "epoch": 0.46, + "learning_rate": 0.000282764902836037, + "loss": 1.7496, + "step": 5875 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002827591501471951, + "loss": 1.7593, + "step": 5876 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002827533965569919, + "loss": 1.7531, + "step": 5877 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002827476420654663, + "loss": 1.7603, + "step": 5878 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002827418866726575, + "loss": 1.7327, + "step": 5879 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002827361303786045, + "loss": 1.7316, + "step": 5880 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028273037318334645, + "loss": 1.7118, + "step": 5881 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028272461508692246, + "loss": 1.7085, + "step": 5882 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028271885608937154, + "loss": 1.7868, + "step": 5883 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002827130961907328, + "loss": 1.7373, + "step": 5884 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028270733539104544, + "loss": 1.783, + "step": 5885 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028270157369034843, + "loss": 1.7772, + "step": 5886 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028269581108868104, + "loss": 1.7721, + "step": 5887 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002826900475860823, + "loss": 1.7806, + "step": 5888 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028268428318259137, + "loss": 1.7484, + "step": 5889 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002826785178782473, + "loss": 1.7267, + "step": 5890 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002826727516730894, + "loss": 1.7253, + "step": 5891 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028266698456715664, + "loss": 1.7475, + "step": 5892 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028266121656048837, + "loss": 1.7583, + "step": 5893 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002826554476531236, + "loss": 1.7744, + "step": 5894 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028264967784510155, + "loss": 1.7089, + "step": 5895 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002826439071364614, + "loss": 1.7784, + "step": 5896 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002826381355272423, + "loss": 1.8067, + "step": 5897 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002826323630174834, + "loss": 1.749, + "step": 5898 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028262658960722406, + "loss": 1.7851, + "step": 5899 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028262081529650335, + "loss": 1.7517, + "step": 5900 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028261504008536044, + "loss": 1.761, + "step": 5901 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002826092639738346, + "loss": 1.6759, + "step": 5902 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002826034869619651, + "loss": 1.7585, + "step": 5903 + }, + { + "epoch": 0.46, + "learning_rate": 0.000282597709049791, + "loss": 1.8012, + "step": 5904 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028259193023735167, + "loss": 1.7643, + "step": 5905 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028258615052468634, + "loss": 1.693, + "step": 5906 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002825803699118341, + "loss": 1.7844, + "step": 5907 + }, + { + "epoch": 0.46, + "learning_rate": 0.00028257458839883444, + "loss": 1.7447, + "step": 5908 + }, + { + "epoch": 0.46, + "learning_rate": 0.0002825688059857264, + "loss": 1.7118, + "step": 5909 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028256302267254944, + "loss": 1.7281, + "step": 5910 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002825572384593426, + "loss": 1.7033, + "step": 5911 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002825514533461453, + "loss": 1.7728, + "step": 5912 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002825456673329968, + "loss": 1.7453, + "step": 5913 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028253988041993634, + "loss": 1.758, + "step": 5914 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002825340926070032, + "loss": 1.7223, + "step": 5915 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028252830389423675, + "loss": 1.7399, + "step": 5916 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002825225142816763, + "loss": 1.7667, + "step": 5917 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028251672376936103, + "loss": 1.6907, + "step": 5918 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028251093235733037, + "loss": 1.7817, + "step": 5919 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028250514004562354, + "loss": 1.7041, + "step": 5920 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028249934683428, + "loss": 1.7445, + "step": 5921 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028249355272333903, + "loss": 1.7472, + "step": 5922 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002824877577128399, + "loss": 1.7564, + "step": 5923 + }, + { + "epoch": 0.47, + "learning_rate": 0.000282481961802822, + "loss": 1.7069, + "step": 5924 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028247616499332476, + "loss": 1.7561, + "step": 5925 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002824703672843874, + "loss": 1.7708, + "step": 5926 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002824645686760494, + "loss": 1.7869, + "step": 5927 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002824587691683501, + "loss": 1.7465, + "step": 5928 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002824529687613288, + "loss": 1.8167, + "step": 5929 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028244716745502496, + "loss": 1.7559, + "step": 5930 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028244136524947794, + "loss": 1.815, + "step": 5931 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002824355621447271, + "loss": 1.7111, + "step": 5932 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002824297581408119, + "loss": 1.7495, + "step": 5933 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002824239532377717, + "loss": 1.7243, + "step": 5934 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028241814743564593, + "loss": 1.7171, + "step": 5935 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002824123407344741, + "loss": 1.7218, + "step": 5936 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028240653313429547, + "loss": 1.8036, + "step": 5937 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028240072463514955, + "loss": 1.7522, + "step": 5938 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002823949152370758, + "loss": 1.7295, + "step": 5939 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028238910494011364, + "loss": 1.6867, + "step": 5940 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002823832937443025, + "loss": 1.7602, + "step": 5941 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002823774816496819, + "loss": 1.74, + "step": 5942 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002823716686562912, + "loss": 1.7181, + "step": 5943 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028236585476416995, + "loss": 1.7738, + "step": 5944 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002823600399733575, + "loss": 1.7303, + "step": 5945 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028235422428389355, + "loss": 1.7125, + "step": 5946 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028234840769581735, + "loss": 1.7598, + "step": 5947 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028234259020916853, + "loss": 1.7187, + "step": 5948 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002823367718239866, + "loss": 1.7014, + "step": 5949 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028233095254031097, + "loss": 1.7412, + "step": 5950 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028232513235818126, + "loss": 1.7449, + "step": 5951 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028231931127763686, + "loss": 1.7449, + "step": 5952 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028231348929871734, + "loss": 1.8149, + "step": 5953 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002823076664214623, + "loss": 1.7204, + "step": 5954 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002823018426459112, + "loss": 1.7082, + "step": 5955 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028229601797210365, + "loss": 1.7224, + "step": 5956 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002822901924000791, + "loss": 1.7829, + "step": 5957 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002822843659298771, + "loss": 1.688, + "step": 5958 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002822785385615373, + "loss": 1.7462, + "step": 5959 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028227271029509924, + "loss": 1.7409, + "step": 5960 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028226688113060244, + "loss": 1.7247, + "step": 5961 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002822610510680865, + "loss": 1.757, + "step": 5962 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028225522010759104, + "loss": 1.695, + "step": 5963 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028224938824915563, + "loss": 1.7502, + "step": 5964 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002822435554928198, + "loss": 1.7504, + "step": 5965 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028223772183862323, + "loss": 1.7479, + "step": 5966 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028223188728660555, + "loss": 1.7924, + "step": 5967 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002822260518368063, + "loss": 1.8104, + "step": 5968 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028222021548926507, + "loss": 1.7742, + "step": 5969 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002822143782440216, + "loss": 1.7279, + "step": 5970 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002822085401011154, + "loss": 1.6748, + "step": 5971 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028220270106058627, + "loss": 1.7378, + "step": 5972 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002821968611224737, + "loss": 1.7403, + "step": 5973 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002821910202868174, + "loss": 1.7597, + "step": 5974 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028218517855365706, + "loss": 1.7459, + "step": 5975 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028217933592303225, + "loss": 1.6828, + "step": 5976 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002821734923949827, + "loss": 1.709, + "step": 5977 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002821676479695481, + "loss": 1.7441, + "step": 5978 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028216180264676807, + "loss": 1.7052, + "step": 5979 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028215595642668234, + "loss": 1.7512, + "step": 5980 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028215010930933063, + "loss": 1.6881, + "step": 5981 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002821442612947526, + "loss": 1.7449, + "step": 5982 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002821384123829879, + "loss": 1.7585, + "step": 5983 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028213256257407634, + "loss": 1.7852, + "step": 5984 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002821267118680576, + "loss": 1.7157, + "step": 5985 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002821208602649714, + "loss": 1.7362, + "step": 5986 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002821150077648575, + "loss": 1.6737, + "step": 5987 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028210915436775556, + "loss": 1.7969, + "step": 5988 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002821033000737054, + "loss": 1.7283, + "step": 5989 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002820974448827467, + "loss": 1.7579, + "step": 5990 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002820915887949192, + "loss": 1.7856, + "step": 5991 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028208573181026284, + "loss": 1.7261, + "step": 5992 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002820798739288172, + "loss": 1.7512, + "step": 5993 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002820740151506221, + "loss": 1.7857, + "step": 5994 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002820681554757172, + "loss": 1.7364, + "step": 5995 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002820622949041425, + "loss": 1.7692, + "step": 5996 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002820564334359378, + "loss": 1.7385, + "step": 5997 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002820505710711427, + "loss": 1.7543, + "step": 5998 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028204470780979706, + "loss": 1.7145, + "step": 5999 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028203884365194076, + "loss": 1.7802, + "step": 6000 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002820329785976136, + "loss": 1.7078, + "step": 6001 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002820271126468553, + "loss": 1.7503, + "step": 6002 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002820212457997058, + "loss": 1.6863, + "step": 6003 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028201537805620493, + "loss": 1.7566, + "step": 6004 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028200950941639243, + "loss": 1.7958, + "step": 6005 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028200363988030826, + "loss": 1.7451, + "step": 6006 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002819977694479922, + "loss": 1.7641, + "step": 6007 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028199189811948416, + "loss": 1.7198, + "step": 6008 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028198602589482396, + "loss": 1.7844, + "step": 6009 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002819801527740515, + "loss": 1.7489, + "step": 6010 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028197427875720655, + "loss": 1.7228, + "step": 6011 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028196840384432913, + "loss": 1.7081, + "step": 6012 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002819625280354591, + "loss": 1.7148, + "step": 6013 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028195665133063627, + "loss": 1.7223, + "step": 6014 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002819507737299006, + "loss": 1.7607, + "step": 6015 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002819448952332921, + "loss": 1.7018, + "step": 6016 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002819390158408505, + "loss": 1.7631, + "step": 6017 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002819331355526158, + "loss": 1.7815, + "step": 6018 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002819272543686279, + "loss": 1.7034, + "step": 6019 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002819213722889267, + "loss": 1.7529, + "step": 6020 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002819154893135523, + "loss": 1.74, + "step": 6021 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028190960544254446, + "loss": 1.7343, + "step": 6022 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002819037206759432, + "loss": 1.7279, + "step": 6023 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028189783501378845, + "loss": 1.7349, + "step": 6024 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028189194845612016, + "loss": 1.7588, + "step": 6025 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002818860610029784, + "loss": 1.7529, + "step": 6026 + }, + { + "epoch": 0.47, + "learning_rate": 0.000281880172654403, + "loss": 1.7834, + "step": 6027 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028187428341043406, + "loss": 1.7683, + "step": 6028 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002818683932711115, + "loss": 1.8212, + "step": 6029 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028186250223647525, + "loss": 1.7206, + "step": 6030 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028185661030656546, + "loss": 1.7137, + "step": 6031 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028185071748142203, + "loss": 1.7347, + "step": 6032 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028184482376108496, + "loss": 1.7052, + "step": 6033 + }, + { + "epoch": 0.47, + "learning_rate": 0.0002818389291455943, + "loss": 1.739, + "step": 6034 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028183303363499013, + "loss": 1.7502, + "step": 6035 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028182713722931234, + "loss": 1.7279, + "step": 6036 + }, + { + "epoch": 0.47, + "learning_rate": 0.00028182123992860105, + "loss": 1.7379, + "step": 6037 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002818153417328963, + "loss": 1.7222, + "step": 6038 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028180944264223813, + "loss": 1.7478, + "step": 6039 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002818035426566666, + "loss": 1.7194, + "step": 6040 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002817976417762217, + "loss": 1.7428, + "step": 6041 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002817917400009436, + "loss": 1.7971, + "step": 6042 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002817858373308723, + "loss": 1.7293, + "step": 6043 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028177993376604784, + "loss": 1.7019, + "step": 6044 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002817740293065104, + "loss": 1.7469, + "step": 6045 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002817681239523, + "loss": 1.7403, + "step": 6046 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028176221770345673, + "loss": 1.7446, + "step": 6047 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002817563105600207, + "loss": 1.7682, + "step": 6048 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002817504025220321, + "loss": 1.7888, + "step": 6049 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028174449358953096, + "loss": 1.712, + "step": 6050 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002817385837625574, + "loss": 1.7811, + "step": 6051 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028173267304115154, + "loss": 1.7094, + "step": 6052 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028172676142535353, + "loss": 1.7465, + "step": 6053 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028172084891520355, + "loss": 1.765, + "step": 6054 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028171493551074165, + "loss": 1.7443, + "step": 6055 + }, + { + "epoch": 0.48, + "learning_rate": 0.000281709021212008, + "loss": 1.7379, + "step": 6056 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028170310601904284, + "loss": 1.6928, + "step": 6057 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002816971899318862, + "loss": 1.7364, + "step": 6058 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028169127295057836, + "loss": 1.7368, + "step": 6059 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002816853550751595, + "loss": 1.7039, + "step": 6060 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028167943630566966, + "loss": 1.7439, + "step": 6061 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002816735166421491, + "loss": 1.7575, + "step": 6062 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002816675960846381, + "loss": 1.7966, + "step": 6063 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002816616746331768, + "loss": 1.7449, + "step": 6064 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002816557522878053, + "loss": 1.6841, + "step": 6065 + }, + { + "epoch": 0.48, + "learning_rate": 0.000281649829048564, + "loss": 1.7261, + "step": 6066 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002816439049154929, + "loss": 1.7703, + "step": 6067 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002816379798886324, + "loss": 1.7271, + "step": 6068 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002816320539680226, + "loss": 1.7275, + "step": 6069 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002816261271537039, + "loss": 1.8034, + "step": 6070 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028162019944571635, + "loss": 1.7319, + "step": 6071 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002816142708441003, + "loss": 1.6624, + "step": 6072 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028160834134889596, + "loss": 1.7423, + "step": 6073 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002816024109601437, + "loss": 1.7165, + "step": 6074 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002815964796778836, + "loss": 1.7225, + "step": 6075 + }, + { + "epoch": 0.48, + "learning_rate": 0.000281590547502156, + "loss": 1.7804, + "step": 6076 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028158461443300126, + "loss": 1.7656, + "step": 6077 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002815786804704596, + "loss": 1.7634, + "step": 6078 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002815727456145713, + "loss": 1.7508, + "step": 6079 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028156680986537666, + "loss": 1.7425, + "step": 6080 + }, + { + "epoch": 0.48, + "learning_rate": 0.000281560873222916, + "loss": 1.7223, + "step": 6081 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002815549356872296, + "loss": 1.7071, + "step": 6082 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002815489972583578, + "loss": 1.7575, + "step": 6083 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002815430579363409, + "loss": 1.6968, + "step": 6084 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002815371177212192, + "loss": 1.7515, + "step": 6085 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002815311766130331, + "loss": 1.7067, + "step": 6086 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002815252346118229, + "loss": 1.7349, + "step": 6087 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002815192917176289, + "loss": 1.6768, + "step": 6088 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002815133479304915, + "loss": 1.7331, + "step": 6089 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028150740325045106, + "loss": 1.7947, + "step": 6090 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002815014576775479, + "loss": 1.6965, + "step": 6091 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002814955112118224, + "loss": 1.6943, + "step": 6092 + }, + { + "epoch": 0.48, + "learning_rate": 0.000281489563853315, + "loss": 1.7619, + "step": 6093 + }, + { + "epoch": 0.48, + "learning_rate": 0.000281483615602066, + "loss": 1.7339, + "step": 6094 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002814776664581158, + "loss": 1.7435, + "step": 6095 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028147171642150474, + "loss": 1.6698, + "step": 6096 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028146576549227336, + "loss": 1.6833, + "step": 6097 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028145981367046197, + "loss": 1.7384, + "step": 6098 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028145386095611096, + "loss": 1.7458, + "step": 6099 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028144790734926077, + "loss": 1.793, + "step": 6100 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002814419528499519, + "loss": 1.6815, + "step": 6101 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002814359974582246, + "loss": 1.7132, + "step": 6102 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002814300411741195, + "loss": 1.6975, + "step": 6103 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028142408399767693, + "loss": 1.7, + "step": 6104 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028141812592893733, + "loss": 1.7282, + "step": 6105 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002814121669679412, + "loss": 1.7541, + "step": 6106 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028140620711472895, + "loss": 1.7665, + "step": 6107 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028140024636934106, + "loss": 1.7076, + "step": 6108 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028139428473181806, + "loss": 1.7058, + "step": 6109 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028138832220220034, + "loss": 1.7582, + "step": 6110 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028138235878052845, + "loss": 1.7524, + "step": 6111 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002813763944668428, + "loss": 1.7315, + "step": 6112 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028137042926118397, + "loss": 1.7164, + "step": 6113 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002813644631635924, + "loss": 1.7359, + "step": 6114 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028135849617410863, + "loss": 1.7564, + "step": 6115 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028135252829277315, + "loss": 1.685, + "step": 6116 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002813465595196265, + "loss": 1.7915, + "step": 6117 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028134058985470917, + "loss": 1.7385, + "step": 6118 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002813346192980618, + "loss": 1.7581, + "step": 6119 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028132864784972467, + "loss": 1.7604, + "step": 6120 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028132267550973867, + "loss": 1.7564, + "step": 6121 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002813167022781441, + "loss": 1.6957, + "step": 6122 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028131072815498157, + "loss": 1.7351, + "step": 6123 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002813047531402917, + "loss": 1.7092, + "step": 6124 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028129877723411493, + "loss": 1.7522, + "step": 6125 + }, + { + "epoch": 0.48, + "learning_rate": 0.000281292800436492, + "loss": 1.7533, + "step": 6126 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002812868227474634, + "loss": 1.7893, + "step": 6127 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028128084416706976, + "loss": 1.7232, + "step": 6128 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002812748646953516, + "loss": 1.7314, + "step": 6129 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028126888433234953, + "loss": 1.7247, + "step": 6130 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028126290307810416, + "loss": 1.688, + "step": 6131 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028125692093265616, + "loss": 1.7822, + "step": 6132 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028125093789604607, + "loss": 1.7528, + "step": 6133 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028124495396831455, + "loss": 1.7363, + "step": 6134 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028123896914950225, + "loss": 1.6881, + "step": 6135 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002812329834396497, + "loss": 1.773, + "step": 6136 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002812269968387977, + "loss": 1.7654, + "step": 6137 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002812210093469868, + "loss": 1.6834, + "step": 6138 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002812150209642576, + "loss": 1.7041, + "step": 6139 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028120903169065085, + "loss": 1.7341, + "step": 6140 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028120304152620717, + "loss": 1.6551, + "step": 6141 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028119705047096726, + "loss": 1.701, + "step": 6142 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002811910585249718, + "loss": 1.6974, + "step": 6143 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002811850656882614, + "loss": 1.7449, + "step": 6144 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002811790719608768, + "loss": 1.7485, + "step": 6145 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028117307734285875, + "loss": 1.683, + "step": 6146 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002811670818342478, + "loss": 1.6956, + "step": 6147 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002811610854350848, + "loss": 1.7484, + "step": 6148 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028115508814541046, + "loss": 1.7748, + "step": 6149 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002811490899652654, + "loss": 1.743, + "step": 6150 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002811430908946904, + "loss": 1.7348, + "step": 6151 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028113709093372614, + "loss": 1.6675, + "step": 6152 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002811310900824135, + "loss": 1.7234, + "step": 6153 + }, + { + "epoch": 0.48, + "learning_rate": 0.000281125088340793, + "loss": 1.767, + "step": 6154 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028111908570890555, + "loss": 1.6916, + "step": 6155 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002811130821867919, + "loss": 1.7496, + "step": 6156 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028110707777449274, + "loss": 1.7454, + "step": 6157 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028110107247204894, + "loss": 1.7291, + "step": 6158 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002810950662795011, + "loss": 1.7677, + "step": 6159 + }, + { + "epoch": 0.48, + "learning_rate": 0.0002810890591968902, + "loss": 1.746, + "step": 6160 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028108305122425694, + "loss": 1.6873, + "step": 6161 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028107704236164205, + "loss": 1.7179, + "step": 6162 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028107103260908636, + "loss": 1.7373, + "step": 6163 + }, + { + "epoch": 0.48, + "learning_rate": 0.00028106502196663066, + "loss": 1.7913, + "step": 6164 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028105901043431585, + "loss": 1.6983, + "step": 6165 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002810529980121827, + "loss": 1.7446, + "step": 6166 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028104698470027197, + "loss": 1.7262, + "step": 6167 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002810409704986246, + "loss": 1.7148, + "step": 6168 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002810349554072812, + "loss": 1.7531, + "step": 6169 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002810289394262829, + "loss": 1.7398, + "step": 6170 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002810229225556704, + "loss": 1.7371, + "step": 6171 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002810169047954845, + "loss": 1.7498, + "step": 6172 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002810108861457662, + "loss": 1.7428, + "step": 6173 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002810048666065562, + "loss": 1.7016, + "step": 6174 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028099884617789546, + "loss": 1.7825, + "step": 6175 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002809928248598249, + "loss": 1.7414, + "step": 6176 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002809868026523853, + "loss": 1.8137, + "step": 6177 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028098077955561766, + "loss": 1.775, + "step": 6178 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002809747555695627, + "loss": 1.7211, + "step": 6179 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028096873069426154, + "loss": 1.8102, + "step": 6180 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002809627049297549, + "loss": 1.7098, + "step": 6181 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002809566782760838, + "loss": 1.7974, + "step": 6182 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002809506507332891, + "loss": 1.7155, + "step": 6183 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002809446223014118, + "loss": 1.7136, + "step": 6184 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002809385929804927, + "loss": 1.7356, + "step": 6185 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028093256277057283, + "loss": 1.7836, + "step": 6186 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028092653167169314, + "loss": 1.719, + "step": 6187 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002809204996838945, + "loss": 1.7578, + "step": 6188 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028091446680721794, + "loss": 1.7333, + "step": 6189 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028090843304170445, + "loss": 1.7255, + "step": 6190 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002809023983873949, + "loss": 1.7043, + "step": 6191 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028089636284433025, + "loss": 1.7229, + "step": 6192 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002808903264125516, + "loss": 1.7692, + "step": 6193 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028088428909209983, + "loss": 1.8104, + "step": 6194 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028087825088301594, + "loss": 1.7348, + "step": 6195 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028087221178534104, + "loss": 1.7982, + "step": 6196 + }, + { + "epoch": 0.49, + "learning_rate": 0.000280866171799116, + "loss": 1.73, + "step": 6197 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028086013092438187, + "loss": 1.7639, + "step": 6198 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002808540891611796, + "loss": 1.7554, + "step": 6199 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002808480465095504, + "loss": 1.7697, + "step": 6200 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002808420029695351, + "loss": 1.6884, + "step": 6201 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002808359585411748, + "loss": 1.7261, + "step": 6202 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028082991322451057, + "loss": 1.7619, + "step": 6203 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002808238670195834, + "loss": 1.7615, + "step": 6204 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002808178199264344, + "loss": 1.7188, + "step": 6205 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002808117719451045, + "loss": 1.747, + "step": 6206 + }, + { + "epoch": 0.49, + "learning_rate": 0.000280805723075635, + "loss": 1.7393, + "step": 6207 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028079967331806675, + "loss": 1.7482, + "step": 6208 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002807936226724409, + "loss": 1.7509, + "step": 6209 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028078757113879853, + "loss": 1.7088, + "step": 6210 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002807815187171807, + "loss": 1.7358, + "step": 6211 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002807754654076286, + "loss": 1.7239, + "step": 6212 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002807694112101832, + "loss": 1.7528, + "step": 6213 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002807633561248857, + "loss": 1.689, + "step": 6214 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028075730015177715, + "loss": 1.7306, + "step": 6215 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028075124329089864, + "loss": 1.732, + "step": 6216 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002807451855422915, + "loss": 1.701, + "step": 6217 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002807391269059965, + "loss": 1.7309, + "step": 6218 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028073306738205515, + "loss": 1.7088, + "step": 6219 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002807270069705083, + "loss": 1.692, + "step": 6220 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028072094567139724, + "loss": 1.6638, + "step": 6221 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028071488348476315, + "loss": 1.7203, + "step": 6222 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002807088204106471, + "loss": 1.7302, + "step": 6223 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002807027564490903, + "loss": 1.6807, + "step": 6224 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028069669160013386, + "loss": 1.7711, + "step": 6225 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028069062586381905, + "loss": 1.7591, + "step": 6226 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028068455924018705, + "loss": 1.7772, + "step": 6227 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002806784917292789, + "loss": 1.7381, + "step": 6228 + }, + { + "epoch": 0.49, + "learning_rate": 0.000280672423331136, + "loss": 1.6998, + "step": 6229 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002806663540457994, + "loss": 1.7914, + "step": 6230 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028066028387331045, + "loss": 1.7664, + "step": 6231 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002806542128137102, + "loss": 1.7424, + "step": 6232 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028064814086703997, + "loss": 1.6753, + "step": 6233 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028064206803334095, + "loss": 1.6829, + "step": 6234 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002806359943126544, + "loss": 1.7317, + "step": 6235 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002806299197050215, + "loss": 1.7572, + "step": 6236 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002806238442104836, + "loss": 1.8075, + "step": 6237 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002806177678290818, + "loss": 1.7425, + "step": 6238 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002806116905608575, + "loss": 1.7287, + "step": 6239 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002806056124058519, + "loss": 1.7177, + "step": 6240 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002805995333641063, + "loss": 1.7469, + "step": 6241 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028059345343566184, + "loss": 1.7101, + "step": 6242 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028058737262055995, + "loss": 1.7482, + "step": 6243 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002805812909188418, + "loss": 1.6973, + "step": 6244 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002805752083305488, + "loss": 1.6837, + "step": 6245 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002805691248557222, + "loss": 1.7621, + "step": 6246 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028056304049440335, + "loss": 1.6998, + "step": 6247 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002805569552466334, + "loss": 1.7209, + "step": 6248 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028055086911245384, + "loss": 1.7213, + "step": 6249 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002805447820919059, + "loss": 1.731, + "step": 6250 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028053869418503095, + "loss": 1.7525, + "step": 6251 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002805326053918703, + "loss": 1.7279, + "step": 6252 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028052651571246526, + "loss": 1.6719, + "step": 6253 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028052042514685726, + "loss": 1.7389, + "step": 6254 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028051433369508756, + "loss": 1.7217, + "step": 6255 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002805082413571975, + "loss": 1.7081, + "step": 6256 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028050214813322863, + "loss": 1.6749, + "step": 6257 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002804960540232221, + "loss": 1.772, + "step": 6258 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028048995902721943, + "loss": 1.7273, + "step": 6259 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028048386314526196, + "loss": 1.7053, + "step": 6260 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028047776637739097, + "loss": 1.7285, + "step": 6261 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028047166872364804, + "loss": 1.7409, + "step": 6262 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028046557018407447, + "loss": 1.7133, + "step": 6263 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028045947075871163, + "loss": 1.7332, + "step": 6264 + }, + { + "epoch": 0.49, + "learning_rate": 0.000280453370447601, + "loss": 1.7776, + "step": 6265 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028044726925078396, + "loss": 1.7339, + "step": 6266 + }, + { + "epoch": 0.49, + "learning_rate": 0.000280441167168302, + "loss": 1.7182, + "step": 6267 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002804350642001965, + "loss": 1.654, + "step": 6268 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028042896034650885, + "loss": 1.7025, + "step": 6269 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002804228556072805, + "loss": 1.7331, + "step": 6270 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028041674998255297, + "loss": 1.721, + "step": 6271 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002804106434723677, + "loss": 1.7909, + "step": 6272 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002804045360767661, + "loss": 1.7442, + "step": 6273 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028039842779578974, + "loss": 1.7249, + "step": 6274 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028039231862947986, + "loss": 1.6706, + "step": 6275 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002803862085778782, + "loss": 1.7599, + "step": 6276 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002803800976410261, + "loss": 1.7306, + "step": 6277 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028037398581896514, + "loss": 1.7468, + "step": 6278 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002803678731117368, + "loss": 1.7281, + "step": 6279 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002803617595193824, + "loss": 1.7935, + "step": 6280 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002803556450419437, + "loss": 1.7549, + "step": 6281 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028034952967946207, + "loss": 1.7556, + "step": 6282 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002803434134319791, + "loss": 1.7802, + "step": 6283 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028033729629953625, + "loss": 1.7577, + "step": 6284 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028033117828217503, + "loss": 1.7551, + "step": 6285 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002803250593799371, + "loss": 1.6604, + "step": 6286 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002803189395928639, + "loss": 1.7723, + "step": 6287 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028031281892099705, + "loss": 1.7216, + "step": 6288 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028030669736437807, + "loss": 1.7348, + "step": 6289 + }, + { + "epoch": 0.49, + "learning_rate": 0.0002803005749230485, + "loss": 1.7448, + "step": 6290 + }, + { + "epoch": 0.49, + "learning_rate": 0.00028029445159705, + "loss": 1.7529, + "step": 6291 + }, + { + "epoch": 0.5, + "learning_rate": 0.000280288327386424, + "loss": 1.6949, + "step": 6292 + }, + { + "epoch": 0.5, + "learning_rate": 0.00028028220229121223, + "loss": 1.7185, + "step": 6293 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002802760763114561, + "loss": 1.7771, + "step": 6294 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002802699494471974, + "loss": 1.7277, + "step": 6295 + }, + { + "epoch": 0.5, + "learning_rate": 0.00028026382169847754, + "loss": 1.7292, + "step": 6296 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002802576930653383, + "loss": 1.7001, + "step": 6297 + }, + { + "epoch": 0.5, + "learning_rate": 0.00028025156354782117, + "loss": 1.7637, + "step": 6298 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002802454331459678, + "loss": 1.7713, + "step": 6299 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002802393018598198, + "loss": 1.7067, + "step": 6300 + }, + { + "epoch": 0.5, + "learning_rate": 0.00028023316968941883, + "loss": 1.7554, + "step": 6301 + }, + { + "epoch": 0.5, + "learning_rate": 0.00028022703663480654, + "loss": 1.7438, + "step": 6302 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002802209026960245, + "loss": 1.725, + "step": 6303 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002802147678731144, + "loss": 1.7597, + "step": 6304 + }, + { + "epoch": 0.5, + "learning_rate": 0.00028020863216611785, + "loss": 1.7168, + "step": 6305 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002802024955750766, + "loss": 1.734, + "step": 6306 + }, + { + "epoch": 0.5, + "learning_rate": 0.00028019635810003224, + "loss": 1.7382, + "step": 6307 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002801902197410264, + "loss": 1.7324, + "step": 6308 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002801840804981009, + "loss": 1.7409, + "step": 6309 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002801779403712973, + "loss": 1.6836, + "step": 6310 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002801717993606573, + "loss": 1.7021, + "step": 6311 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002801656574662226, + "loss": 1.7473, + "step": 6312 + }, + { + "epoch": 0.5, + "learning_rate": 0.00028015951468803496, + "loss": 1.7324, + "step": 6313 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002801533710261361, + "loss": 1.7486, + "step": 6314 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002801472264805676, + "loss": 1.7344, + "step": 6315 + }, + { + "epoch": 0.5, + "learning_rate": 0.00028014108105137126, + "loss": 1.6802, + "step": 6316 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002801349347385888, + "loss": 1.7148, + "step": 6317 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002801287875422619, + "loss": 1.7526, + "step": 6318 + }, + { + "epoch": 0.5, + "learning_rate": 0.00028012263946243244, + "loss": 1.7327, + "step": 6319 + }, + { + "epoch": 0.5, + "learning_rate": 0.00028011649049914197, + "loss": 1.7071, + "step": 6320 + }, + { + "epoch": 0.5, + "learning_rate": 0.00028011034065243245, + "loss": 1.7458, + "step": 6321 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002801041899223454, + "loss": 1.7569, + "step": 6322 + }, + { + "epoch": 0.5, + "learning_rate": 0.00028009803830892277, + "loss": 1.813, + "step": 6323 + }, + { + "epoch": 0.5, + "learning_rate": 0.00028009188581220625, + "loss": 1.7048, + "step": 6324 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002800857324322376, + "loss": 1.818, + "step": 6325 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002800795781690586, + "loss": 1.7902, + "step": 6326 + }, + { + "epoch": 0.5, + "learning_rate": 0.00028007342302271103, + "loss": 1.7313, + "step": 6327 + }, + { + "epoch": 0.5, + "learning_rate": 0.00028006726699323676, + "loss": 1.6926, + "step": 6328 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002800611100806775, + "loss": 1.7295, + "step": 6329 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002800549522850751, + "loss": 1.7065, + "step": 6330 + }, + { + "epoch": 0.5, + "learning_rate": 0.00028004879360647126, + "loss": 1.7145, + "step": 6331 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002800426340449079, + "loss": 1.6929, + "step": 6332 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002800364736004269, + "loss": 1.7912, + "step": 6333 + }, + { + "epoch": 0.5, + "learning_rate": 0.00028003031227306994, + "loss": 1.717, + "step": 6334 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002800241500628789, + "loss": 1.717, + "step": 6335 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002800179869698957, + "loss": 1.7337, + "step": 6336 + }, + { + "epoch": 0.5, + "learning_rate": 0.00028001182299416206, + "loss": 1.7268, + "step": 6337 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002800056581357199, + "loss": 1.7323, + "step": 6338 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002799994923946111, + "loss": 1.7303, + "step": 6339 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002799933257708774, + "loss": 1.7364, + "step": 6340 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002799871582645609, + "loss": 1.7077, + "step": 6341 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002799809898757032, + "loss": 1.7403, + "step": 6342 + }, + { + "epoch": 0.5, + "learning_rate": 0.00027997482060434636, + "loss": 1.7504, + "step": 6343 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002799686504505322, + "loss": 1.7716, + "step": 6344 + }, + { + "epoch": 0.5, + "learning_rate": 0.00027996247941430266, + "loss": 1.7628, + "step": 6345 + }, + { + "epoch": 0.5, + "learning_rate": 0.00027995630749569957, + "loss": 1.7, + "step": 6346 + }, + { + "epoch": 0.5, + "learning_rate": 0.00027995013469476484, + "loss": 1.6764, + "step": 6347 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002799439610115405, + "loss": 1.7131, + "step": 6348 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002799377864460683, + "loss": 1.7505, + "step": 6349 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002799316109983902, + "loss": 1.7455, + "step": 6350 + }, + { + "epoch": 0.5, + "learning_rate": 0.00027992543466854827, + "loss": 1.7098, + "step": 6351 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002799192574565842, + "loss": 1.7231, + "step": 6352 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002799130793625402, + "loss": 1.7053, + "step": 6353 + }, + { + "epoch": 0.5, + "learning_rate": 0.00027990690038645806, + "loss": 1.7165, + "step": 6354 + }, + { + "epoch": 0.5, + "learning_rate": 0.00027990072052837966, + "loss": 1.776, + "step": 6355 + }, + { + "epoch": 0.5, + "learning_rate": 0.00027989453978834715, + "loss": 1.7236, + "step": 6356 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002798883581664024, + "loss": 1.6895, + "step": 6357 + }, + { + "epoch": 0.5, + "learning_rate": 0.00027988217566258736, + "loss": 1.6676, + "step": 6358 + }, + { + "epoch": 0.5, + "learning_rate": 0.00027987599227694395, + "loss": 1.7377, + "step": 6359 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002798698080095143, + "loss": 1.7201, + "step": 6360 + }, + { + "epoch": 0.5, + "learning_rate": 0.00027986362286034033, + "loss": 1.7368, + "step": 6361 + }, + { + "epoch": 0.5, + "learning_rate": 0.000279857436829464, + "loss": 1.7611, + "step": 6362 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002798512499169273, + "loss": 1.721, + "step": 6363 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002798450621227723, + "loss": 1.7011, + "step": 6364 + }, + { + "epoch": 0.5, + "learning_rate": 0.000279838873447041, + "loss": 1.7073, + "step": 6365 + }, + { + "epoch": 0.5, + "learning_rate": 0.00027983268388977536, + "loss": 1.7653, + "step": 6366 + }, + { + "epoch": 0.5, + "learning_rate": 0.00027982649345101746, + "loss": 1.6634, + "step": 6367 + }, + { + "epoch": 0.5, + "learning_rate": 0.00027982030213080937, + "loss": 1.7163, + "step": 6368 + }, + { + "epoch": 0.5, + "learning_rate": 0.000279814109929193, + "loss": 1.7438, + "step": 6369 + }, + { + "epoch": 0.5, + "learning_rate": 0.00027980791684621047, + "loss": 1.6752, + "step": 6370 + }, + { + "epoch": 0.5, + "learning_rate": 0.00027980172288190385, + "loss": 1.6947, + "step": 6371 + }, + { + "epoch": 0.5, + "learning_rate": 0.00027979552803631514, + "loss": 1.7305, + "step": 6372 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002797893323094864, + "loss": 1.7077, + "step": 6373 + }, + { + "epoch": 0.5, + "learning_rate": 0.00027978313570145975, + "loss": 1.7576, + "step": 6374 + }, + { + "epoch": 0.5, + "learning_rate": 0.00027977693821227726, + "loss": 1.7551, + "step": 6375 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002797707398419809, + "loss": 1.7285, + "step": 6376 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002797645405906129, + "loss": 1.7573, + "step": 6377 + }, + { + "epoch": 0.5, + "learning_rate": 0.00027975834045821524, + "loss": 1.7459, + "step": 6378 + }, + { + "epoch": 0.5, + "learning_rate": 0.00027975213944483006, + "loss": 1.7425, + "step": 6379 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002797459375504995, + "loss": 1.7546, + "step": 6380 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002797397347752656, + "loss": 1.7541, + "step": 6381 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002797335311191704, + "loss": 1.7514, + "step": 6382 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002797273265822562, + "loss": 1.7805, + "step": 6383 + }, + { + "epoch": 0.5, + "learning_rate": 0.00027972112116456506, + "loss": 1.7244, + "step": 6384 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002797149148661391, + "loss": 1.6954, + "step": 6385 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002797087076870204, + "loss": 1.7489, + "step": 6386 + }, + { + "epoch": 0.5, + "learning_rate": 0.00027970249962725114, + "loss": 1.7813, + "step": 6387 + }, + { + "epoch": 0.5, + "learning_rate": 0.00027969629068687357, + "loss": 1.7301, + "step": 6388 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002796900808659297, + "loss": 1.7295, + "step": 6389 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002796838701644617, + "loss": 1.7665, + "step": 6390 + }, + { + "epoch": 0.5, + "learning_rate": 0.00027967765858251186, + "loss": 1.7328, + "step": 6391 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002796714461201223, + "loss": 1.7264, + "step": 6392 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002796652327773351, + "loss": 1.6307, + "step": 6393 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002796590185541926, + "loss": 1.7393, + "step": 6394 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002796528034507369, + "loss": 1.6998, + "step": 6395 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002796465874670102, + "loss": 1.6921, + "step": 6396 + }, + { + "epoch": 0.5, + "learning_rate": 0.00027964037060305475, + "loss": 1.7419, + "step": 6397 + }, + { + "epoch": 0.5, + "learning_rate": 0.00027963415285891266, + "loss": 1.6931, + "step": 6398 + }, + { + "epoch": 0.5, + "learning_rate": 0.00027962793423462625, + "loss": 1.7914, + "step": 6399 + }, + { + "epoch": 0.5, + "learning_rate": 0.00027962171473023764, + "loss": 1.6819, + "step": 6400 + }, + { + "epoch": 0.5, + "learning_rate": 0.00027961549434578917, + "loss": 1.723, + "step": 6401 + }, + { + "epoch": 0.5, + "learning_rate": 0.000279609273081323, + "loss": 1.6826, + "step": 6402 + }, + { + "epoch": 0.5, + "learning_rate": 0.00027960305093688146, + "loss": 1.7493, + "step": 6403 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002795968279125067, + "loss": 1.7227, + "step": 6404 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002795906040082409, + "loss": 1.7463, + "step": 6405 + }, + { + "epoch": 0.5, + "learning_rate": 0.00027958437922412653, + "loss": 1.748, + "step": 6406 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002795781535602057, + "loss": 1.7243, + "step": 6407 + }, + { + "epoch": 0.5, + "learning_rate": 0.00027957192701652067, + "loss": 1.6791, + "step": 6408 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002795656995931138, + "loss": 1.7301, + "step": 6409 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002795594712900274, + "loss": 1.6999, + "step": 6410 + }, + { + "epoch": 0.5, + "learning_rate": 0.00027955324210730354, + "loss": 1.6761, + "step": 6411 + }, + { + "epoch": 0.5, + "learning_rate": 0.00027954701204498475, + "loss": 1.6959, + "step": 6412 + }, + { + "epoch": 0.5, + "learning_rate": 0.00027954078110311323, + "loss": 1.651, + "step": 6413 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002795345492817313, + "loss": 1.7039, + "step": 6414 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002795283165808812, + "loss": 1.6764, + "step": 6415 + }, + { + "epoch": 0.5, + "learning_rate": 0.00027952208300060534, + "loss": 1.6986, + "step": 6416 + }, + { + "epoch": 0.5, + "learning_rate": 0.00027951584854094604, + "loss": 1.7201, + "step": 6417 + }, + { + "epoch": 0.5, + "learning_rate": 0.0002795096132019456, + "loss": 1.7204, + "step": 6418 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002795033769836463, + "loss": 1.7246, + "step": 6419 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002794971398860906, + "loss": 1.7147, + "step": 6420 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027949090190932074, + "loss": 1.7625, + "step": 6421 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027948466305337917, + "loss": 1.8001, + "step": 6422 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027947842331830814, + "loss": 1.7558, + "step": 6423 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002794721827041501, + "loss": 1.6814, + "step": 6424 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002794659412109474, + "loss": 1.7182, + "step": 6425 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002794596988387424, + "loss": 1.7447, + "step": 6426 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002794534555875774, + "loss": 1.7521, + "step": 6427 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027944721145749496, + "loss": 1.746, + "step": 6428 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027944096644853735, + "loss": 1.778, + "step": 6429 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002794347205607471, + "loss": 1.7368, + "step": 6430 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002794284737941664, + "loss": 1.7175, + "step": 6431 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027942222614883787, + "loss": 1.6786, + "step": 6432 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002794159776248038, + "loss": 1.6717, + "step": 6433 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027940972822210663, + "loss": 1.7345, + "step": 6434 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002794034779407889, + "loss": 1.7289, + "step": 6435 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027939722678089297, + "loss": 1.6706, + "step": 6436 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027939097474246125, + "loss": 1.7483, + "step": 6437 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027938472182553617, + "loss": 1.7264, + "step": 6438 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027937846803016025, + "loss": 1.723, + "step": 6439 + }, + { + "epoch": 0.51, + "learning_rate": 0.000279372213356376, + "loss": 1.7328, + "step": 6440 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027936595780422575, + "loss": 1.6919, + "step": 6441 + }, + { + "epoch": 0.51, + "learning_rate": 0.000279359701373752, + "loss": 1.7078, + "step": 6442 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002793534440649973, + "loss": 1.7308, + "step": 6443 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027934718587800417, + "loss": 1.749, + "step": 6444 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027934092681281496, + "loss": 1.7148, + "step": 6445 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002793346668694722, + "loss": 1.738, + "step": 6446 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027932840604801847, + "loss": 1.7988, + "step": 6447 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027932214434849624, + "loss": 1.7712, + "step": 6448 + }, + { + "epoch": 0.51, + "learning_rate": 0.000279315881770948, + "loss": 1.6733, + "step": 6449 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002793096183154163, + "loss": 1.7283, + "step": 6450 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027930335398194364, + "loss": 1.73, + "step": 6451 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002792970887705725, + "loss": 1.6999, + "step": 6452 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002792908226813456, + "loss": 1.7126, + "step": 6453 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002792845557143053, + "loss": 1.6731, + "step": 6454 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027927828786949424, + "loss": 1.7258, + "step": 6455 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002792720191469549, + "loss": 1.698, + "step": 6456 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027926574954672986, + "loss": 1.6815, + "step": 6457 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027925947906886175, + "loss": 1.7246, + "step": 6458 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002792532077133932, + "loss": 1.7025, + "step": 6459 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002792469354803666, + "loss": 1.7481, + "step": 6460 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027924066236982467, + "loss": 1.7517, + "step": 6461 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002792343883818099, + "loss": 1.7243, + "step": 6462 + }, + { + "epoch": 0.51, + "learning_rate": 0.000279228113516365, + "loss": 1.702, + "step": 6463 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027922183777353253, + "loss": 1.7976, + "step": 6464 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002792155611533551, + "loss": 1.6861, + "step": 6465 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027920928365587525, + "loss": 1.6724, + "step": 6466 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002792030052811358, + "loss": 1.7223, + "step": 6467 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002791967260291791, + "loss": 1.7722, + "step": 6468 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027919044590004797, + "loss": 1.7211, + "step": 6469 + }, + { + "epoch": 0.51, + "learning_rate": 0.000279184164893785, + "loss": 1.6966, + "step": 6470 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027917788301043287, + "loss": 1.7232, + "step": 6471 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027917160025003423, + "loss": 1.7423, + "step": 6472 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002791653166126317, + "loss": 1.7043, + "step": 6473 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027915903209826785, + "loss": 1.7739, + "step": 6474 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027915274670698554, + "loss": 1.6869, + "step": 6475 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027914646043882734, + "loss": 1.7173, + "step": 6476 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002791401732938359, + "loss": 1.705, + "step": 6477 + }, + { + "epoch": 0.51, + "learning_rate": 0.000279133885272054, + "loss": 1.7384, + "step": 6478 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027912759637352424, + "loss": 1.767, + "step": 6479 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002791213065982894, + "loss": 1.7043, + "step": 6480 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027911501594639213, + "loss": 1.7626, + "step": 6481 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027910872441787516, + "loss": 1.6991, + "step": 6482 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027910243201278117, + "loss": 1.6855, + "step": 6483 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002790961387311529, + "loss": 1.7112, + "step": 6484 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027908984457303314, + "loss": 1.7663, + "step": 6485 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027908354953846455, + "loss": 1.6907, + "step": 6486 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002790772536274899, + "loss": 1.7255, + "step": 6487 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027907095684015195, + "loss": 1.7331, + "step": 6488 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002790646591764934, + "loss": 1.7509, + "step": 6489 + }, + { + "epoch": 0.51, + "learning_rate": 0.000279058360636557, + "loss": 1.7532, + "step": 6490 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002790520612203856, + "loss": 1.6756, + "step": 6491 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027904576092802194, + "loss": 1.7715, + "step": 6492 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027903945975950875, + "loss": 1.7358, + "step": 6493 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027903315771488877, + "loss": 1.794, + "step": 6494 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027902685479420496, + "loss": 1.7656, + "step": 6495 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027902055099749995, + "loss": 1.6967, + "step": 6496 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027901424632481667, + "loss": 1.7021, + "step": 6497 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002790079407761978, + "loss": 1.6688, + "step": 6498 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027900163435168616, + "loss": 1.7222, + "step": 6499 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002789953270513247, + "loss": 1.6959, + "step": 6500 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002789890188751561, + "loss": 1.6891, + "step": 6501 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027898270982322325, + "loss": 1.7416, + "step": 6502 + }, + { + "epoch": 0.51, + "learning_rate": 0.000278976399895569, + "loss": 1.6971, + "step": 6503 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027897008909223616, + "loss": 1.6435, + "step": 6504 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027896377741326757, + "loss": 1.7754, + "step": 6505 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027895746485870614, + "loss": 1.7301, + "step": 6506 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027895115142859465, + "loss": 1.6806, + "step": 6507 + }, + { + "epoch": 0.51, + "learning_rate": 0.000278944837122976, + "loss": 1.7272, + "step": 6508 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027893852194189303, + "loss": 1.7342, + "step": 6509 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002789322058853887, + "loss": 1.7646, + "step": 6510 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002789258889535059, + "loss": 1.7782, + "step": 6511 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027891957114628736, + "loss": 1.7032, + "step": 6512 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002789132524637761, + "loss": 1.7216, + "step": 6513 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027890693290601507, + "loss": 1.7721, + "step": 6514 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027890061247304705, + "loss": 1.7192, + "step": 6515 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027889429116491495, + "loss": 1.7449, + "step": 6516 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027888796898166185, + "loss": 1.7559, + "step": 6517 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002788816459233305, + "loss": 1.669, + "step": 6518 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027887532198996387, + "loss": 1.7113, + "step": 6519 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027886899718160496, + "loss": 1.7367, + "step": 6520 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002788626714982967, + "loss": 1.7003, + "step": 6521 + }, + { + "epoch": 0.51, + "learning_rate": 0.000278856344940082, + "loss": 1.7205, + "step": 6522 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002788500175070038, + "loss": 1.736, + "step": 6523 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002788436891991051, + "loss": 1.74, + "step": 6524 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002788373600164288, + "loss": 1.6851, + "step": 6525 + }, + { + "epoch": 0.51, + "learning_rate": 0.000278831029959018, + "loss": 1.7153, + "step": 6526 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002788246990269156, + "loss": 1.6971, + "step": 6527 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027881836722016455, + "loss": 1.7596, + "step": 6528 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027881203453880793, + "loss": 1.7591, + "step": 6529 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002788057009828886, + "loss": 1.7202, + "step": 6530 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002787993665524497, + "loss": 1.7645, + "step": 6531 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002787930312475341, + "loss": 1.7292, + "step": 6532 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027878669506818497, + "loss": 1.7523, + "step": 6533 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027878035801444525, + "loss": 1.6762, + "step": 6534 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002787740200863579, + "loss": 1.7102, + "step": 6535 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002787676812839661, + "loss": 1.7355, + "step": 6536 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002787613416073128, + "loss": 1.742, + "step": 6537 + }, + { + "epoch": 0.51, + "learning_rate": 0.000278755001056441, + "loss": 1.6556, + "step": 6538 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002787486596313938, + "loss": 1.6981, + "step": 6539 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002787423173322142, + "loss": 1.7037, + "step": 6540 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002787359741589454, + "loss": 1.7417, + "step": 6541 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002787296301116304, + "loss": 1.7035, + "step": 6542 + }, + { + "epoch": 0.51, + "learning_rate": 0.00027872328519031216, + "loss": 1.777, + "step": 6543 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002787169393950339, + "loss": 1.73, + "step": 6544 + }, + { + "epoch": 0.51, + "learning_rate": 0.0002787105927258386, + "loss": 1.7654, + "step": 6545 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002787042451827695, + "loss": 1.6976, + "step": 6546 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002786978967658695, + "loss": 1.7034, + "step": 6547 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027869154747518185, + "loss": 1.7517, + "step": 6548 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027868519731074964, + "loss": 1.7139, + "step": 6549 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027867884627261587, + "loss": 1.7455, + "step": 6550 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002786724943608238, + "loss": 1.7106, + "step": 6551 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027866614157541654, + "loss": 1.7166, + "step": 6552 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002786597879164372, + "loss": 1.6647, + "step": 6553 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027865343338392875, + "loss": 1.7183, + "step": 6554 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027864707797793463, + "loss": 1.7466, + "step": 6555 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027864072169849776, + "loss": 1.6588, + "step": 6556 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027863436454566144, + "loss": 1.7044, + "step": 6557 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027862800651946867, + "loss": 1.6899, + "step": 6558 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002786216476199628, + "loss": 1.7101, + "step": 6559 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002786152878471869, + "loss": 1.7285, + "step": 6560 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002786089272011842, + "loss": 1.7483, + "step": 6561 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027860256568199785, + "loss": 1.6971, + "step": 6562 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027859620328967105, + "loss": 1.7548, + "step": 6563 + }, + { + "epoch": 0.52, + "learning_rate": 0.000278589840024247, + "loss": 1.6768, + "step": 6564 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027858347588576883, + "loss": 1.7085, + "step": 6565 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002785771108742799, + "loss": 1.7269, + "step": 6566 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002785707449898233, + "loss": 1.7005, + "step": 6567 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027856437823244224, + "loss": 1.7143, + "step": 6568 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027855801060218014, + "loss": 1.733, + "step": 6569 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027855164209908, + "loss": 1.7112, + "step": 6570 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002785452727231851, + "loss": 1.6473, + "step": 6571 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027853890247453883, + "loss": 1.693, + "step": 6572 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027853253135318433, + "loss": 1.7095, + "step": 6573 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027852615935916483, + "loss": 1.7471, + "step": 6574 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002785197864925237, + "loss": 1.7225, + "step": 6575 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027851341275330406, + "loss": 1.6914, + "step": 6576 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002785070381415493, + "loss": 1.7763, + "step": 6577 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002785006626573027, + "loss": 1.6899, + "step": 6578 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027849428630060747, + "loss": 1.6986, + "step": 6579 + }, + { + "epoch": 0.52, + "learning_rate": 0.000278487909071507, + "loss": 1.7473, + "step": 6580 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002784815309700445, + "loss": 1.7203, + "step": 6581 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027847515199626327, + "loss": 1.6784, + "step": 6582 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002784687721502067, + "loss": 1.6678, + "step": 6583 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027846239143191807, + "loss": 1.7429, + "step": 6584 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027845600984144066, + "loss": 1.6504, + "step": 6585 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027844962737881785, + "loss": 1.7155, + "step": 6586 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027844324404409295, + "loss": 1.6812, + "step": 6587 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027843685983730933, + "loss": 1.714, + "step": 6588 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027843047475851026, + "loss": 1.7454, + "step": 6589 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002784240888077392, + "loss": 1.7672, + "step": 6590 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002784177019850394, + "loss": 1.7039, + "step": 6591 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002784113142904543, + "loss": 1.6814, + "step": 6592 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002784049257240272, + "loss": 1.7421, + "step": 6593 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027839853628580153, + "loss": 1.7038, + "step": 6594 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027839214597582065, + "loss": 1.6524, + "step": 6595 + }, + { + "epoch": 0.52, + "learning_rate": 0.000278385754794128, + "loss": 1.7291, + "step": 6596 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002783793627407668, + "loss": 1.7463, + "step": 6597 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002783729698157807, + "loss": 1.7277, + "step": 6598 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002783665760192129, + "loss": 1.7246, + "step": 6599 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027836018135110694, + "loss": 1.7199, + "step": 6600 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002783537858115062, + "loss": 1.7504, + "step": 6601 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027834738940045407, + "loss": 1.6706, + "step": 6602 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027834099211799395, + "loss": 1.7471, + "step": 6603 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002783345939641694, + "loss": 1.7631, + "step": 6604 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002783281949390237, + "loss": 1.7094, + "step": 6605 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002783217950426004, + "loss": 1.7173, + "step": 6606 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002783153942749429, + "loss": 1.7045, + "step": 6607 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002783089926360947, + "loss": 1.6935, + "step": 6608 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002783025901260992, + "loss": 1.6977, + "step": 6609 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027829618674500003, + "loss": 1.7072, + "step": 6610 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027828978249284047, + "loss": 1.7201, + "step": 6611 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002782833773696641, + "loss": 1.7124, + "step": 6612 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002782769713755144, + "loss": 1.7481, + "step": 6613 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002782705645104348, + "loss": 1.7306, + "step": 6614 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002782641567744689, + "loss": 1.7558, + "step": 6615 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002782577481676602, + "loss": 1.7206, + "step": 6616 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002782513386900521, + "loss": 1.7527, + "step": 6617 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027824492834168827, + "loss": 1.6809, + "step": 6618 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002782385171226121, + "loss": 1.7148, + "step": 6619 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002782321050328671, + "loss": 1.7761, + "step": 6620 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002782256920724969, + "loss": 1.7334, + "step": 6621 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002782192782415451, + "loss": 1.7266, + "step": 6622 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027821286354005507, + "loss": 1.7076, + "step": 6623 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002782064479680705, + "loss": 1.692, + "step": 6624 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027820003152563484, + "loss": 1.7214, + "step": 6625 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002781936142127918, + "loss": 1.7074, + "step": 6626 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027818719602958476, + "loss": 1.7009, + "step": 6627 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002781807769760575, + "loss": 1.7311, + "step": 6628 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002781743570522534, + "loss": 1.7322, + "step": 6629 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002781679362582162, + "loss": 1.6982, + "step": 6630 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002781615145939894, + "loss": 1.656, + "step": 6631 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002781550920596167, + "loss": 1.7172, + "step": 6632 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027814866865514165, + "loss": 1.6937, + "step": 6633 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002781422443806078, + "loss": 1.73, + "step": 6634 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027813581923605887, + "loss": 1.783, + "step": 6635 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027812939322153845, + "loss": 1.7431, + "step": 6636 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027812296633709016, + "loss": 1.7204, + "step": 6637 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027811653858275757, + "loss": 1.7376, + "step": 6638 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002781101099585844, + "loss": 1.7162, + "step": 6639 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002781036804646143, + "loss": 1.7299, + "step": 6640 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027809725010089094, + "loss": 1.6732, + "step": 6641 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002780908188674579, + "loss": 1.7362, + "step": 6642 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002780843867643589, + "loss": 1.6963, + "step": 6643 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002780779537916376, + "loss": 1.764, + "step": 6644 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027807151994933767, + "loss": 1.7137, + "step": 6645 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027806508523750274, + "loss": 1.7017, + "step": 6646 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027805864965617665, + "loss": 1.7497, + "step": 6647 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002780522132054029, + "loss": 1.756, + "step": 6648 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027804577588522536, + "loss": 1.6898, + "step": 6649 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027803933769568766, + "loss": 1.7316, + "step": 6650 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002780328986368335, + "loss": 1.652, + "step": 6651 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002780264587087066, + "loss": 1.8018, + "step": 6652 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027802001791135065, + "loss": 1.7478, + "step": 6653 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002780135762448095, + "loss": 1.7146, + "step": 6654 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002780071337091268, + "loss": 1.7546, + "step": 6655 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027800069030434627, + "loss": 1.7529, + "step": 6656 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002779942460305117, + "loss": 1.748, + "step": 6657 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002779878008876669, + "loss": 1.752, + "step": 6658 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002779813548758555, + "loss": 1.8219, + "step": 6659 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002779749079951213, + "loss": 1.7758, + "step": 6660 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002779684602455082, + "loss": 1.7223, + "step": 6661 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027796201162705975, + "loss": 1.7127, + "step": 6662 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002779555621398199, + "loss": 1.6688, + "step": 6663 + }, + { + "epoch": 0.52, + "learning_rate": 0.0002779491117838324, + "loss": 1.7415, + "step": 6664 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027794266055914107, + "loss": 1.7453, + "step": 6665 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027793620846578966, + "loss": 1.7489, + "step": 6666 + }, + { + "epoch": 0.52, + "learning_rate": 0.000277929755503822, + "loss": 1.6325, + "step": 6667 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027792330167328186, + "loss": 1.7024, + "step": 6668 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027791684697421316, + "loss": 1.6875, + "step": 6669 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027791039140665955, + "loss": 1.7483, + "step": 6670 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027790393497066504, + "loss": 1.7, + "step": 6671 + }, + { + "epoch": 0.52, + "learning_rate": 0.00027789747766627344, + "loss": 1.7463, + "step": 6672 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002778910194935285, + "loss": 1.6924, + "step": 6673 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002778845604524741, + "loss": 1.7316, + "step": 6674 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002778781005431541, + "loss": 1.7188, + "step": 6675 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002778716397656124, + "loss": 1.7501, + "step": 6676 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027786517811989283, + "loss": 1.7406, + "step": 6677 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027785871560603924, + "loss": 1.7205, + "step": 6678 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002778522522240956, + "loss": 1.7061, + "step": 6679 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002778457879741056, + "loss": 1.6583, + "step": 6680 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002778393228561133, + "loss": 1.7453, + "step": 6681 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002778328568701626, + "loss": 1.7636, + "step": 6682 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002778263900162973, + "loss": 1.7326, + "step": 6683 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027781992229456137, + "loss": 1.7128, + "step": 6684 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027781345370499867, + "loss": 1.7173, + "step": 6685 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002778069842476532, + "loss": 1.7456, + "step": 6686 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002778005139225688, + "loss": 1.7166, + "step": 6687 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002777940427297894, + "loss": 1.7527, + "step": 6688 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002777875706693591, + "loss": 1.7323, + "step": 6689 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002777810977413216, + "loss": 1.7366, + "step": 6690 + }, + { + "epoch": 0.53, + "learning_rate": 0.000277774623945721, + "loss": 1.7354, + "step": 6691 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002777681492826012, + "loss": 1.6613, + "step": 6692 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027776167375200624, + "loss": 1.71, + "step": 6693 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002777551973539799, + "loss": 1.7264, + "step": 6694 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002777487200885664, + "loss": 1.7381, + "step": 6695 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002777422419558095, + "loss": 1.7231, + "step": 6696 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002777357629557533, + "loss": 1.706, + "step": 6697 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027772928308844174, + "loss": 1.7122, + "step": 6698 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027772280235391887, + "loss": 1.7186, + "step": 6699 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002777163207522286, + "loss": 1.746, + "step": 6700 + }, + { + "epoch": 0.53, + "learning_rate": 0.000277709838283415, + "loss": 1.7045, + "step": 6701 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002777033549475222, + "loss": 1.7281, + "step": 6702 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027769687074459396, + "loss": 1.7153, + "step": 6703 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002776903856746744, + "loss": 1.701, + "step": 6704 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002776838997378077, + "loss": 1.7078, + "step": 6705 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027767741293403776, + "loss": 1.6796, + "step": 6706 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027767092526340863, + "loss": 1.7053, + "step": 6707 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027766443672596437, + "loss": 1.7652, + "step": 6708 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027765794732174904, + "loss": 1.7206, + "step": 6709 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027765145705080667, + "loss": 1.7203, + "step": 6710 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002776449659131814, + "loss": 1.6887, + "step": 6711 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002776384739089172, + "loss": 1.656, + "step": 6712 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002776319810380582, + "loss": 1.7712, + "step": 6713 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002776254873006485, + "loss": 1.7178, + "step": 6714 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002776189926967322, + "loss": 1.7181, + "step": 6715 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002776124972263533, + "loss": 1.7096, + "step": 6716 + }, + { + "epoch": 0.53, + "learning_rate": 0.000277606000889556, + "loss": 1.7278, + "step": 6717 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002775995036863844, + "loss": 1.7281, + "step": 6718 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002775930056168826, + "loss": 1.7324, + "step": 6719 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002775865066810946, + "loss": 1.6555, + "step": 6720 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002775800068790647, + "loss": 1.7297, + "step": 6721 + }, + { + "epoch": 0.53, + "learning_rate": 0.000277573506210837, + "loss": 1.7173, + "step": 6722 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002775670046764555, + "loss": 1.7076, + "step": 6723 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002775605022759645, + "loss": 1.7064, + "step": 6724 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027755399900940807, + "loss": 1.7229, + "step": 6725 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027754749487683033, + "loss": 1.7288, + "step": 6726 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027754098987827554, + "loss": 1.7743, + "step": 6727 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002775344840137878, + "loss": 1.6536, + "step": 6728 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002775279772834113, + "loss": 1.7238, + "step": 6729 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002775214696871902, + "loss": 1.706, + "step": 6730 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002775149612251687, + "loss": 1.6528, + "step": 6731 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027750845189739097, + "loss": 1.7394, + "step": 6732 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002775019417039012, + "loss": 1.7231, + "step": 6733 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027749543064474366, + "loss": 1.7642, + "step": 6734 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027748891871996246, + "loss": 1.6535, + "step": 6735 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027748240592960185, + "loss": 1.7214, + "step": 6736 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002774758922737061, + "loss": 1.73, + "step": 6737 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027746937775231936, + "loss": 1.7467, + "step": 6738 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002774628623654859, + "loss": 1.7334, + "step": 6739 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027745634611324997, + "loss": 1.7138, + "step": 6740 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002774498289956557, + "loss": 1.7306, + "step": 6741 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002774433110127475, + "loss": 1.6839, + "step": 6742 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002774367921645695, + "loss": 1.7248, + "step": 6743 + }, + { + "epoch": 0.53, + "learning_rate": 0.000277430272451166, + "loss": 1.6768, + "step": 6744 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027742375187258134, + "loss": 1.7145, + "step": 6745 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002774172304288597, + "loss": 1.685, + "step": 6746 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027741070812004536, + "loss": 1.755, + "step": 6747 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027740418494618264, + "loss": 1.6851, + "step": 6748 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002773976609073158, + "loss": 1.6851, + "step": 6749 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027739113600348917, + "loss": 1.7623, + "step": 6750 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027738461023474694, + "loss": 1.7391, + "step": 6751 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027737808360113356, + "loss": 1.7152, + "step": 6752 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002773715561026933, + "loss": 1.7103, + "step": 6753 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027736502773947045, + "loss": 1.69, + "step": 6754 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027735849851150937, + "loss": 1.6602, + "step": 6755 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027735196841885434, + "loss": 1.7107, + "step": 6756 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027734543746154975, + "loss": 1.7041, + "step": 6757 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027733890563963985, + "loss": 1.7574, + "step": 6758 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027733237295316914, + "loss": 1.722, + "step": 6759 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027732583940218186, + "loss": 1.7084, + "step": 6760 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027731930498672234, + "loss": 1.7444, + "step": 6761 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027731276970683504, + "loss": 1.734, + "step": 6762 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002773062335625643, + "loss": 1.7522, + "step": 6763 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027729969655395444, + "loss": 1.728, + "step": 6764 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027729315868105, + "loss": 1.7487, + "step": 6765 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002772866199438951, + "loss": 1.7091, + "step": 6766 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002772800803425344, + "loss": 1.7565, + "step": 6767 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002772735398770122, + "loss": 1.7214, + "step": 6768 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027726699854737285, + "loss": 1.7308, + "step": 6769 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002772604563536609, + "loss": 1.7541, + "step": 6770 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027725391329592054, + "loss": 1.7079, + "step": 6771 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027724736937419643, + "loss": 1.7237, + "step": 6772 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027724082458853287, + "loss": 1.7549, + "step": 6773 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027723427893897436, + "loss": 1.7365, + "step": 6774 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027722773242556525, + "loss": 1.7366, + "step": 6775 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002772211850483501, + "loss": 1.703, + "step": 6776 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002772146368073733, + "loss": 1.7129, + "step": 6777 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027720808770267935, + "loss": 1.6492, + "step": 6778 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002772015377343126, + "loss": 1.7078, + "step": 6779 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027719498690231766, + "loss": 1.7007, + "step": 6780 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002771884352067389, + "loss": 1.7191, + "step": 6781 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027718188264762094, + "loss": 1.6973, + "step": 6782 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002771753292250081, + "loss": 1.7514, + "step": 6783 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027716877493894505, + "loss": 1.7366, + "step": 6784 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027716221978947613, + "loss": 1.6782, + "step": 6785 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002771556637766459, + "loss": 1.7314, + "step": 6786 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002771491069004989, + "loss": 1.7407, + "step": 6787 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027714254916107964, + "loss": 1.6886, + "step": 6788 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002771359905584326, + "loss": 1.7309, + "step": 6789 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002771294310926024, + "loss": 1.6684, + "step": 6790 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002771228707636335, + "loss": 1.7344, + "step": 6791 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027711630957157047, + "loss": 1.7083, + "step": 6792 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002771097475164578, + "loss": 1.6901, + "step": 6793 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002771031845983401, + "loss": 1.6888, + "step": 6794 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002770966208172619, + "loss": 1.7514, + "step": 6795 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002770900561732679, + "loss": 1.725, + "step": 6796 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027708349066640244, + "loss": 1.7335, + "step": 6797 + }, + { + "epoch": 0.53, + "learning_rate": 0.00027707692429671026, + "loss": 1.7109, + "step": 6798 + }, + { + "epoch": 0.53, + "learning_rate": 0.0002770703570642358, + "loss": 1.7157, + "step": 6799 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002770637889690238, + "loss": 1.7145, + "step": 6800 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027705722001111885, + "loss": 1.7318, + "step": 6801 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027705065019056544, + "loss": 1.6894, + "step": 6802 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002770440795074082, + "loss": 1.6756, + "step": 6803 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002770375079616918, + "loss": 1.7443, + "step": 6804 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027703093555346087, + "loss": 1.672, + "step": 6805 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027702436228275995, + "loss": 1.6296, + "step": 6806 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027701778814963367, + "loss": 1.7238, + "step": 6807 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027701121315412675, + "loss": 1.7108, + "step": 6808 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027700463729628374, + "loss": 1.7094, + "step": 6809 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002769980605761494, + "loss": 1.6888, + "step": 6810 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002769914829937682, + "loss": 1.7023, + "step": 6811 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027698490454918504, + "loss": 1.7126, + "step": 6812 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027697832524244435, + "loss": 1.7322, + "step": 6813 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002769717450735909, + "loss": 1.6808, + "step": 6814 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002769651640426695, + "loss": 1.7052, + "step": 6815 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002769585821497246, + "loss": 1.7243, + "step": 6816 + }, + { + "epoch": 0.54, + "learning_rate": 0.000276951999394801, + "loss": 1.686, + "step": 6817 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002769454157779434, + "loss": 1.7047, + "step": 6818 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027693883129919643, + "loss": 1.7124, + "step": 6819 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002769322459586049, + "loss": 1.6934, + "step": 6820 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002769256597562135, + "loss": 1.6955, + "step": 6821 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027691907269206687, + "loss": 1.7141, + "step": 6822 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027691248476620974, + "loss": 1.7337, + "step": 6823 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027690589597868695, + "loss": 1.6953, + "step": 6824 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002768993063295431, + "loss": 1.7385, + "step": 6825 + }, + { + "epoch": 0.54, + "learning_rate": 0.000276892715818823, + "loss": 1.7263, + "step": 6826 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002768861244465714, + "loss": 1.7028, + "step": 6827 + }, + { + "epoch": 0.54, + "learning_rate": 0.000276879532212833, + "loss": 1.7515, + "step": 6828 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002768729391176526, + "loss": 1.7491, + "step": 6829 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027686634516107503, + "loss": 1.7145, + "step": 6830 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002768597503431449, + "loss": 1.6598, + "step": 6831 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002768531546639071, + "loss": 1.7571, + "step": 6832 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002768465581234064, + "loss": 1.6584, + "step": 6833 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027683996072168756, + "loss": 1.7214, + "step": 6834 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002768333624587954, + "loss": 1.7112, + "step": 6835 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002768267633347747, + "loss": 1.7303, + "step": 6836 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002768201633496702, + "loss": 1.7411, + "step": 6837 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002768135625035268, + "loss": 1.6945, + "step": 6838 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002768069607963894, + "loss": 1.6894, + "step": 6839 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002768003582283026, + "loss": 1.7243, + "step": 6840 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002767937547993114, + "loss": 1.7614, + "step": 6841 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027678715050946054, + "loss": 1.7279, + "step": 6842 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027678054535879487, + "loss": 1.7034, + "step": 6843 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002767739393473593, + "loss": 1.6552, + "step": 6844 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027676733247519866, + "loss": 1.7339, + "step": 6845 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002767607247423578, + "loss": 1.7431, + "step": 6846 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027675411614888146, + "loss": 1.7431, + "step": 6847 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002767475066948147, + "loss": 1.7251, + "step": 6848 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027674089638020236, + "loss": 1.7313, + "step": 6849 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002767342852050892, + "loss": 1.7774, + "step": 6850 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027672767316952023, + "loss": 1.7315, + "step": 6851 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027672106027354024, + "loss": 1.7438, + "step": 6852 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027671444651719427, + "loss": 1.7128, + "step": 6853 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027670783190052704, + "loss": 1.7129, + "step": 6854 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002767012164235836, + "loss": 1.7589, + "step": 6855 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002766946000864088, + "loss": 1.6906, + "step": 6856 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002766879828890476, + "loss": 1.741, + "step": 6857 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002766813648315449, + "loss": 1.7747, + "step": 6858 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027667474591394566, + "loss": 1.6846, + "step": 6859 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027666812613629476, + "loss": 1.7204, + "step": 6860 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002766615054986372, + "loss": 1.7305, + "step": 6861 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002766548840010179, + "loss": 1.712, + "step": 6862 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002766482616434819, + "loss": 1.6962, + "step": 6863 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027664163842607405, + "loss": 1.78, + "step": 6864 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027663501434883935, + "loss": 1.7327, + "step": 6865 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002766283894118228, + "loss": 1.7601, + "step": 6866 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027662176361506935, + "loss": 1.7068, + "step": 6867 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027661513695862404, + "loss": 1.6565, + "step": 6868 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027660850944253174, + "loss": 1.7151, + "step": 6869 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027660188106683756, + "loss": 1.6957, + "step": 6870 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027659525183158654, + "loss": 1.675, + "step": 6871 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027658862173682357, + "loss": 1.7233, + "step": 6872 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027658199078259375, + "loss": 1.681, + "step": 6873 + }, + { + "epoch": 0.54, + "learning_rate": 0.000276575358968942, + "loss": 1.719, + "step": 6874 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002765687262959135, + "loss": 1.7199, + "step": 6875 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027656209276355313, + "loss": 1.7243, + "step": 6876 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027655545837190597, + "loss": 1.7342, + "step": 6877 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027654882312101714, + "loss": 1.7169, + "step": 6878 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002765421870109316, + "loss": 1.6998, + "step": 6879 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002765355500416945, + "loss": 1.6621, + "step": 6880 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002765289122133508, + "loss": 1.7408, + "step": 6881 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002765222735259456, + "loss": 1.6668, + "step": 6882 + }, + { + "epoch": 0.54, + "learning_rate": 0.000276515633979524, + "loss": 1.6829, + "step": 6883 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002765089935741311, + "loss": 1.7657, + "step": 6884 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002765023523098119, + "loss": 1.7352, + "step": 6885 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027649571018661153, + "loss": 1.6866, + "step": 6886 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002764890672045751, + "loss": 1.6866, + "step": 6887 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027648242336374775, + "loss": 1.7646, + "step": 6888 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027647577866417446, + "loss": 1.7021, + "step": 6889 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027646913310590054, + "loss": 1.7139, + "step": 6890 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002764624866889709, + "loss": 1.6926, + "step": 6891 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027645583941343085, + "loss": 1.6871, + "step": 6892 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027644919127932534, + "loss": 1.7267, + "step": 6893 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027644254228669966, + "loss": 1.7336, + "step": 6894 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002764358924355989, + "loss": 1.7091, + "step": 6895 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027642924172606816, + "loss": 1.7114, + "step": 6896 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027642259015815267, + "loss": 1.6996, + "step": 6897 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002764159377318975, + "loss": 1.6798, + "step": 6898 + }, + { + "epoch": 0.54, + "learning_rate": 0.000276409284447348, + "loss": 1.7236, + "step": 6899 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027640263030454914, + "loss": 1.7044, + "step": 6900 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002763959753035461, + "loss": 1.7595, + "step": 6901 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027638931944438423, + "loss": 1.679, + "step": 6902 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027638266272710864, + "loss": 1.6613, + "step": 6903 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002763760051517645, + "loss": 1.655, + "step": 6904 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027636934671839704, + "loss": 1.6844, + "step": 6905 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002763626874270514, + "loss": 1.7382, + "step": 6906 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002763560272777729, + "loss": 1.7226, + "step": 6907 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002763493662706067, + "loss": 1.6828, + "step": 6908 + }, + { + "epoch": 0.54, + "learning_rate": 0.000276342704405598, + "loss": 1.7463, + "step": 6909 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027633604168279206, + "loss": 1.7174, + "step": 6910 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002763293781022341, + "loss": 1.7264, + "step": 6911 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002763227136639694, + "loss": 1.6589, + "step": 6912 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027631604836804316, + "loss": 1.6813, + "step": 6913 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002763093822145007, + "loss": 1.7818, + "step": 6914 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002763027152033872, + "loss": 1.7151, + "step": 6915 + }, + { + "epoch": 0.54, + "learning_rate": 0.000276296047334748, + "loss": 1.7381, + "step": 6916 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002762893786086283, + "loss": 1.7218, + "step": 6917 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002762827090250734, + "loss": 1.6786, + "step": 6918 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027627603858412867, + "loss": 1.6569, + "step": 6919 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027626936728583927, + "loss": 1.6893, + "step": 6920 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002762626951302505, + "loss": 1.6849, + "step": 6921 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002762560221174078, + "loss": 1.6641, + "step": 6922 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002762493482473563, + "loss": 1.7621, + "step": 6923 + }, + { + "epoch": 0.54, + "learning_rate": 0.00027624267352014146, + "loss": 1.6572, + "step": 6924 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002762359979358085, + "loss": 1.682, + "step": 6925 + }, + { + "epoch": 0.54, + "learning_rate": 0.0002762293214944028, + "loss": 1.6615, + "step": 6926 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027622264419596964, + "loss": 1.73, + "step": 6927 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027621596604055437, + "loss": 1.7212, + "step": 6928 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002762092870282024, + "loss": 1.6969, + "step": 6929 + }, + { + "epoch": 0.55, + "learning_rate": 0.000276202607158959, + "loss": 1.6757, + "step": 6930 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002761959264328695, + "loss": 1.7498, + "step": 6931 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027618924484997936, + "loss": 1.7078, + "step": 6932 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027618256241033383, + "loss": 1.6907, + "step": 6933 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027617587911397837, + "loss": 1.6965, + "step": 6934 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002761691949609583, + "loss": 1.7275, + "step": 6935 + }, + { + "epoch": 0.55, + "learning_rate": 0.000276162509951319, + "loss": 1.6994, + "step": 6936 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002761558240851059, + "loss": 1.7246, + "step": 6937 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027614913736236443, + "loss": 1.6536, + "step": 6938 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002761424497831399, + "loss": 1.7332, + "step": 6939 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002761357613474777, + "loss": 1.7046, + "step": 6940 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027612907205542327, + "loss": 1.6753, + "step": 6941 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002761223819070222, + "loss": 1.7171, + "step": 6942 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002761156909023196, + "loss": 1.6956, + "step": 6943 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002761089990413611, + "loss": 1.653, + "step": 6944 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002761023063241921, + "loss": 1.6632, + "step": 6945 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027609561275085805, + "loss": 1.7819, + "step": 6946 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027608891832140434, + "loss": 1.714, + "step": 6947 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002760822230358765, + "loss": 1.7401, + "step": 6948 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027607552689431987, + "loss": 1.7146, + "step": 6949 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027606882989678, + "loss": 1.7226, + "step": 6950 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002760621320433024, + "loss": 1.6873, + "step": 6951 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027605543333393247, + "loss": 1.7237, + "step": 6952 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027604873376871564, + "loss": 1.6683, + "step": 6953 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002760420333476976, + "loss": 1.7443, + "step": 6954 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002760353320709236, + "loss": 1.6814, + "step": 6955 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002760286299384393, + "loss": 1.6943, + "step": 6956 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002760219269502901, + "loss": 1.701, + "step": 6957 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002760152231065216, + "loss": 1.7409, + "step": 6958 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002760085184071793, + "loss": 1.7155, + "step": 6959 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027600181285230863, + "loss": 1.7862, + "step": 6960 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027599510644195526, + "loss": 1.6773, + "step": 6961 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002759883991761646, + "loss": 1.6984, + "step": 6962 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002759816910549823, + "loss": 1.692, + "step": 6963 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002759749820784537, + "loss": 1.702, + "step": 6964 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027596827224662463, + "loss": 1.7238, + "step": 6965 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027596156155954043, + "loss": 1.697, + "step": 6966 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027595485001724677, + "loss": 1.7191, + "step": 6967 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002759481376197892, + "loss": 1.7045, + "step": 6968 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002759414243672132, + "loss": 1.7422, + "step": 6969 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002759347102595646, + "loss": 1.6836, + "step": 6970 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027592799529688866, + "loss": 1.6986, + "step": 6971 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027592127947923114, + "loss": 1.7466, + "step": 6972 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027591456280663765, + "loss": 1.7445, + "step": 6973 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027590784527915373, + "loss": 1.784, + "step": 6974 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002759011268968251, + "loss": 1.7018, + "step": 6975 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027589440765969723, + "loss": 1.6726, + "step": 6976 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027588768756781583, + "loss": 1.7061, + "step": 6977 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027588096662122647, + "loss": 1.7027, + "step": 6978 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002758742448199749, + "loss": 1.7087, + "step": 6979 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027586752216410656, + "loss": 1.7004, + "step": 6980 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002758607986536673, + "loss": 1.7196, + "step": 6981 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002758540742887026, + "loss": 1.7186, + "step": 6982 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027584734906925827, + "loss": 1.7389, + "step": 6983 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002758406229953798, + "loss": 1.7082, + "step": 6984 + }, + { + "epoch": 0.55, + "learning_rate": 0.000275833896067113, + "loss": 1.7484, + "step": 6985 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027582716828450344, + "loss": 1.6895, + "step": 6986 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002758204396475969, + "loss": 1.738, + "step": 6987 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027581371015643894, + "loss": 1.69, + "step": 6988 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027580697981107534, + "loss": 1.5823, + "step": 6989 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027580024861155185, + "loss": 1.7508, + "step": 6990 + }, + { + "epoch": 0.55, + "learning_rate": 0.000275793516557914, + "loss": 1.6626, + "step": 6991 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002757867836502076, + "loss": 1.7423, + "step": 6992 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002757800498884784, + "loss": 1.6746, + "step": 6993 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027577331527277207, + "loss": 1.7043, + "step": 6994 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002757665798031343, + "loss": 1.6954, + "step": 6995 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027575984347961085, + "loss": 1.6967, + "step": 6996 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002757531063022475, + "loss": 1.6704, + "step": 6997 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027574636827109, + "loss": 1.7194, + "step": 6998 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027573962938618396, + "loss": 1.6873, + "step": 6999 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002757328896475753, + "loss": 1.6182, + "step": 7000 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002757261490553096, + "loss": 1.6519, + "step": 7001 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027571940760943276, + "loss": 1.7633, + "step": 7002 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002757126653099906, + "loss": 1.7525, + "step": 7003 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027570592215702875, + "loss": 1.7154, + "step": 7004 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027569917815059315, + "loss": 1.7136, + "step": 7005 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002756924332907294, + "loss": 1.7437, + "step": 7006 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027568568757748335, + "loss": 1.6922, + "step": 7007 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027567894101090094, + "loss": 1.719, + "step": 7008 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027567219359102784, + "loss": 1.7282, + "step": 7009 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002756654453179099, + "loss": 1.7205, + "step": 7010 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027565869619159295, + "loss": 1.6503, + "step": 7011 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002756519462121228, + "loss": 1.6643, + "step": 7012 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027564519537954526, + "loss": 1.6904, + "step": 7013 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027563844369390614, + "loss": 1.6951, + "step": 7014 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002756316911552514, + "loss": 1.7011, + "step": 7015 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027562493776362676, + "loss": 1.736, + "step": 7016 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002756181835190781, + "loss": 1.6697, + "step": 7017 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027561142842165133, + "loss": 1.7037, + "step": 7018 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027560467247139225, + "loss": 1.6921, + "step": 7019 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002755979156683468, + "loss": 1.6691, + "step": 7020 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027559115801256077, + "loss": 1.7762, + "step": 7021 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002755843995040801, + "loss": 1.7451, + "step": 7022 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002755776401429507, + "loss": 1.7366, + "step": 7023 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027557087992921835, + "loss": 1.7962, + "step": 7024 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027556411886292905, + "loss": 1.6746, + "step": 7025 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002755573569441287, + "loss": 1.7363, + "step": 7026 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002755505941728632, + "loss": 1.6771, + "step": 7027 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027554383054917837, + "loss": 1.738, + "step": 7028 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027553706607312024, + "loss": 1.6795, + "step": 7029 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027553030074473474, + "loss": 1.7375, + "step": 7030 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002755235345640678, + "loss": 1.7046, + "step": 7031 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027551676753116526, + "loss": 1.6994, + "step": 7032 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002755099996460732, + "loss": 1.7188, + "step": 7033 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027550323090883743, + "loss": 1.7179, + "step": 7034 + }, + { + "epoch": 0.55, + "learning_rate": 0.000275496461319504, + "loss": 1.7295, + "step": 7035 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027548969087811884, + "loss": 1.701, + "step": 7036 + }, + { + "epoch": 0.55, + "learning_rate": 0.000275482919584728, + "loss": 1.6783, + "step": 7037 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027547614743937736, + "loss": 1.7533, + "step": 7038 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027546937444211287, + "loss": 1.6904, + "step": 7039 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027546260059298065, + "loss": 1.7126, + "step": 7040 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027545582589202656, + "loss": 1.6889, + "step": 7041 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002754490503392966, + "loss": 1.7107, + "step": 7042 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002754422739348369, + "loss": 1.6761, + "step": 7043 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002754354966786933, + "loss": 1.6811, + "step": 7044 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027542871857091195, + "loss": 1.7036, + "step": 7045 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027542193961153883, + "loss": 1.7097, + "step": 7046 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027541515980061994, + "loss": 1.6582, + "step": 7047 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002754083791382013, + "loss": 1.6621, + "step": 7048 + }, + { + "epoch": 0.55, + "learning_rate": 0.000275401597624329, + "loss": 1.655, + "step": 7049 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027539481525904906, + "loss": 1.6941, + "step": 7050 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002753880320424075, + "loss": 1.7182, + "step": 7051 + }, + { + "epoch": 0.55, + "learning_rate": 0.0002753812479744504, + "loss": 1.68, + "step": 7052 + }, + { + "epoch": 0.55, + "learning_rate": 0.00027537446305522383, + "loss": 1.7235, + "step": 7053 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002753676772847739, + "loss": 1.7324, + "step": 7054 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002753608906631465, + "loss": 1.74, + "step": 7055 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027535410319038794, + "loss": 1.7361, + "step": 7056 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002753473148665441, + "loss": 1.7285, + "step": 7057 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002753405256916612, + "loss": 1.7201, + "step": 7058 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027533373566578534, + "loss": 1.7012, + "step": 7059 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027532694478896256, + "loss": 1.732, + "step": 7060 + }, + { + "epoch": 0.56, + "learning_rate": 0.000275320153061239, + "loss": 1.726, + "step": 7061 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002753133604826607, + "loss": 1.7224, + "step": 7062 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002753065670532739, + "loss": 1.7337, + "step": 7063 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027529977277312463, + "loss": 1.7393, + "step": 7064 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027529297764225904, + "loss": 1.7359, + "step": 7065 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002752861816607233, + "loss": 1.7072, + "step": 7066 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002752793848285635, + "loss": 1.6722, + "step": 7067 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027527258714582584, + "loss": 1.725, + "step": 7068 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002752657886125564, + "loss": 1.6411, + "step": 7069 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002752589892288014, + "loss": 1.7263, + "step": 7070 + }, + { + "epoch": 0.56, + "learning_rate": 0.000275252188994607, + "loss": 1.7484, + "step": 7071 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002752453879100194, + "loss": 1.6115, + "step": 7072 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027523858597508467, + "loss": 1.6346, + "step": 7073 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002752317831898491, + "loss": 1.714, + "step": 7074 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027522497955435876, + "loss": 1.7235, + "step": 7075 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027521817506866, + "loss": 1.7166, + "step": 7076 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002752113697327989, + "loss": 1.6951, + "step": 7077 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027520456354682165, + "loss": 1.7324, + "step": 7078 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002751977565107745, + "loss": 1.7113, + "step": 7079 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027519094862470377, + "loss": 1.724, + "step": 7080 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027518413988865555, + "loss": 1.7077, + "step": 7081 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027517733030267604, + "loss": 1.7046, + "step": 7082 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002751705198668116, + "loss": 1.7046, + "step": 7083 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002751637085811084, + "loss": 1.7354, + "step": 7084 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027515689644561265, + "loss": 1.6923, + "step": 7085 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027515008346037066, + "loss": 1.6874, + "step": 7086 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027514326962542864, + "loss": 1.6773, + "step": 7087 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027513645494083293, + "loss": 1.6428, + "step": 7088 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027512963940662974, + "loss": 1.6665, + "step": 7089 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027512282302286534, + "loss": 1.7623, + "step": 7090 + }, + { + "epoch": 0.56, + "learning_rate": 0.000275116005789586, + "loss": 1.7122, + "step": 7091 + }, + { + "epoch": 0.56, + "learning_rate": 0.000275109187706838, + "loss": 1.7169, + "step": 7092 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027510236877466775, + "loss": 1.6866, + "step": 7093 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002750955489931214, + "loss": 1.6789, + "step": 7094 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002750887283622453, + "loss": 1.7291, + "step": 7095 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027508190688208575, + "loss": 1.6356, + "step": 7096 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027507508455268913, + "loss": 1.6606, + "step": 7097 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002750682613741017, + "loss": 1.7075, + "step": 7098 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027506143734636973, + "loss": 1.7456, + "step": 7099 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027505461246953966, + "loss": 1.7374, + "step": 7100 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002750477867436578, + "loss": 1.7225, + "step": 7101 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027504096016877044, + "loss": 1.7296, + "step": 7102 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027503413274492395, + "loss": 1.7073, + "step": 7103 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002750273044721647, + "loss": 1.727, + "step": 7104 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002750204753505391, + "loss": 1.6974, + "step": 7105 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027501364538009345, + "loss": 1.6792, + "step": 7106 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002750068145608741, + "loss": 1.6584, + "step": 7107 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027499998289292753, + "loss": 1.7238, + "step": 7108 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002749931503763, + "loss": 1.696, + "step": 7109 + }, + { + "epoch": 0.56, + "learning_rate": 0.000274986317011038, + "loss": 1.7342, + "step": 7110 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002749794827971878, + "loss": 1.6997, + "step": 7111 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027497264773479593, + "loss": 1.7, + "step": 7112 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002749658118239088, + "loss": 1.688, + "step": 7113 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027495897506457265, + "loss": 1.7038, + "step": 7114 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027495213745683413, + "loss": 1.7227, + "step": 7115 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002749452990007395, + "loss": 1.7272, + "step": 7116 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027493845969633527, + "loss": 1.6635, + "step": 7117 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002749316195436678, + "loss": 1.6852, + "step": 7118 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002749247785427836, + "loss": 1.7519, + "step": 7119 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002749179366937291, + "loss": 1.6978, + "step": 7120 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027491109399655075, + "loss": 1.7611, + "step": 7121 + }, + { + "epoch": 0.56, + "learning_rate": 0.000274904250451295, + "loss": 1.667, + "step": 7122 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027489740605800826, + "loss": 1.7406, + "step": 7123 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027489056081673714, + "loss": 1.7218, + "step": 7124 + }, + { + "epoch": 0.56, + "learning_rate": 0.000274883714727528, + "loss": 1.7536, + "step": 7125 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002748768677904273, + "loss": 1.7492, + "step": 7126 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002748700200054817, + "loss": 1.7163, + "step": 7127 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002748631713727375, + "loss": 1.725, + "step": 7128 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027485632189224124, + "loss": 1.6479, + "step": 7129 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027484947156403947, + "loss": 1.6916, + "step": 7130 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027484262038817873, + "loss": 1.7334, + "step": 7131 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002748357683647055, + "loss": 1.6743, + "step": 7132 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027482891549366625, + "loss": 1.7078, + "step": 7133 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002748220617751076, + "loss": 1.6987, + "step": 7134 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027481520720907594, + "loss": 1.7193, + "step": 7135 + }, + { + "epoch": 0.56, + "learning_rate": 0.000274808351795618, + "loss": 1.6678, + "step": 7136 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002748014955347802, + "loss": 1.7213, + "step": 7137 + }, + { + "epoch": 0.56, + "learning_rate": 0.000274794638426609, + "loss": 1.6856, + "step": 7138 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002747877804711512, + "loss": 1.7042, + "step": 7139 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002747809216684532, + "loss": 1.6896, + "step": 7140 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027477406201856165, + "loss": 1.6152, + "step": 7141 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027476720152152303, + "loss": 1.7573, + "step": 7142 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027476034017738396, + "loss": 1.6789, + "step": 7143 + }, + { + "epoch": 0.56, + "learning_rate": 0.000274753477986191, + "loss": 1.7242, + "step": 7144 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002747466149479909, + "loss": 1.7252, + "step": 7145 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027473975106282996, + "loss": 1.6718, + "step": 7146 + }, + { + "epoch": 0.56, + "learning_rate": 0.000274732886330755, + "loss": 1.6937, + "step": 7147 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002747260207518126, + "loss": 1.7351, + "step": 7148 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002747191543260494, + "loss": 1.7141, + "step": 7149 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027471228705351186, + "loss": 1.7058, + "step": 7150 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027470541893424676, + "loss": 1.746, + "step": 7151 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002746985499683007, + "loss": 1.7033, + "step": 7152 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002746916801557203, + "loss": 1.7098, + "step": 7153 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002746848094965522, + "loss": 1.7052, + "step": 7154 + }, + { + "epoch": 0.56, + "learning_rate": 0.000274677937990843, + "loss": 1.7307, + "step": 7155 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002746710656386395, + "loss": 1.7294, + "step": 7156 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027466419243998814, + "loss": 1.7069, + "step": 7157 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002746573183949358, + "loss": 1.7524, + "step": 7158 + }, + { + "epoch": 0.56, + "learning_rate": 0.000274650443503529, + "loss": 1.7312, + "step": 7159 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027464356776581454, + "loss": 1.7324, + "step": 7160 + }, + { + "epoch": 0.56, + "learning_rate": 0.000274636691181839, + "loss": 1.6611, + "step": 7161 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027462981375164916, + "loss": 1.662, + "step": 7162 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002746229354752916, + "loss": 1.7474, + "step": 7163 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002746160563528131, + "loss": 1.7362, + "step": 7164 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002746091763842603, + "loss": 1.6331, + "step": 7165 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027460229556968004, + "loss": 1.7027, + "step": 7166 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027459541390911893, + "loss": 1.7335, + "step": 7167 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027458853140262365, + "loss": 1.6725, + "step": 7168 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027458164805024105, + "loss": 1.702, + "step": 7169 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027457476385201786, + "loss": 1.7045, + "step": 7170 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002745678788080007, + "loss": 1.6392, + "step": 7171 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027456099291823643, + "loss": 1.716, + "step": 7172 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002745541061827717, + "loss": 1.6506, + "step": 7173 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027454721860165337, + "loss": 1.6424, + "step": 7174 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002745403301749281, + "loss": 1.6725, + "step": 7175 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002745334409026428, + "loss": 1.691, + "step": 7176 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002745265507848441, + "loss": 1.6637, + "step": 7177 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002745196598215788, + "loss": 1.6703, + "step": 7178 + }, + { + "epoch": 0.56, + "learning_rate": 0.0002745127680128938, + "loss": 1.7103, + "step": 7179 + }, + { + "epoch": 0.56, + "learning_rate": 0.00027450587535883585, + "loss": 1.7012, + "step": 7180 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002744989818594516, + "loss": 1.7088, + "step": 7181 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027449208751478805, + "loss": 1.7116, + "step": 7182 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002744851923248919, + "loss": 1.751, + "step": 7183 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027447829628981, + "loss": 1.7358, + "step": 7184 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027447139940958915, + "loss": 1.688, + "step": 7185 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002744645016842762, + "loss": 1.6977, + "step": 7186 + }, + { + "epoch": 0.57, + "learning_rate": 0.000274457603113918, + "loss": 1.7358, + "step": 7187 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027445070369856126, + "loss": 1.6731, + "step": 7188 + }, + { + "epoch": 0.57, + "learning_rate": 0.000274443803438253, + "loss": 1.7612, + "step": 7189 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027443690233303997, + "loss": 1.7282, + "step": 7190 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027443000038296903, + "loss": 1.7321, + "step": 7191 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002744230975880871, + "loss": 1.6646, + "step": 7192 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027441619394844095, + "loss": 1.7344, + "step": 7193 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027440928946407747, + "loss": 1.7433, + "step": 7194 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027440238413504363, + "loss": 1.6871, + "step": 7195 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002743954779613862, + "loss": 1.7465, + "step": 7196 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002743885709431522, + "loss": 1.7622, + "step": 7197 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002743816630803884, + "loss": 1.7202, + "step": 7198 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002743747543731417, + "loss": 1.706, + "step": 7199 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002743678448214592, + "loss": 1.6755, + "step": 7200 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002743609344253875, + "loss": 1.743, + "step": 7201 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002743540231849738, + "loss": 1.6447, + "step": 7202 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002743471111002648, + "loss": 1.7041, + "step": 7203 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027434019817130763, + "loss": 1.6975, + "step": 7204 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002743332843981491, + "loss": 1.6761, + "step": 7205 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002743263697808362, + "loss": 1.6906, + "step": 7206 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027431945431941583, + "loss": 1.7098, + "step": 7207 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027431253801393497, + "loss": 1.7379, + "step": 7208 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027430562086444056, + "loss": 1.7465, + "step": 7209 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002742987028709796, + "loss": 1.7137, + "step": 7210 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002742917840335991, + "loss": 1.6391, + "step": 7211 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002742848643523459, + "loss": 1.6919, + "step": 7212 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027427794382726706, + "loss": 1.7165, + "step": 7213 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002742710224584096, + "loss": 1.6913, + "step": 7214 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027426410024582046, + "loss": 1.7072, + "step": 7215 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027425717718954665, + "loss": 1.7079, + "step": 7216 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002742502532896352, + "loss": 1.7005, + "step": 7217 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002742433285461331, + "loss": 1.7091, + "step": 7218 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027423640295908734, + "loss": 1.6715, + "step": 7219 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027422947652854494, + "loss": 1.6733, + "step": 7220 + }, + { + "epoch": 0.57, + "learning_rate": 0.000274222549254553, + "loss": 1.6844, + "step": 7221 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002742156211371585, + "loss": 1.6926, + "step": 7222 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027420869217640844, + "loss": 1.7072, + "step": 7223 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002742017623723499, + "loss": 1.6361, + "step": 7224 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027419483172502995, + "loss": 1.6924, + "step": 7225 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002741879002344957, + "loss": 1.737, + "step": 7226 + }, + { + "epoch": 0.57, + "learning_rate": 0.000274180967900794, + "loss": 1.6845, + "step": 7227 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027417403472397215, + "loss": 1.7363, + "step": 7228 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002741671007040771, + "loss": 1.649, + "step": 7229 + }, + { + "epoch": 0.57, + "learning_rate": 0.000274160165841156, + "loss": 1.7558, + "step": 7230 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027415323013525587, + "loss": 1.7086, + "step": 7231 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002741462935864238, + "loss": 1.7699, + "step": 7232 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002741393561947069, + "loss": 1.681, + "step": 7233 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002741324179601523, + "loss": 1.6729, + "step": 7234 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027412547888280706, + "loss": 1.6764, + "step": 7235 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002741185389627183, + "loss": 1.6911, + "step": 7236 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002741115981999332, + "loss": 1.7415, + "step": 7237 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002741046565944989, + "loss": 1.694, + "step": 7238 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002740977141464624, + "loss": 1.6839, + "step": 7239 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002740907708558709, + "loss": 1.694, + "step": 7240 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002740838267227715, + "loss": 1.6872, + "step": 7241 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027407688174721143, + "loss": 1.6714, + "step": 7242 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002740699359292378, + "loss": 1.7636, + "step": 7243 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002740629892688978, + "loss": 1.7375, + "step": 7244 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027405604176623853, + "loss": 1.7212, + "step": 7245 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027404909342130726, + "loss": 1.6814, + "step": 7246 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027404214423415105, + "loss": 1.7453, + "step": 7247 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002740351942048171, + "loss": 1.6563, + "step": 7248 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002740282433333527, + "loss": 1.7289, + "step": 7249 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027402129161980496, + "loss": 1.6788, + "step": 7250 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027401433906422103, + "loss": 1.6721, + "step": 7251 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027400738566664824, + "loss": 1.6991, + "step": 7252 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002740004314271337, + "loss": 1.7167, + "step": 7253 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002739934763457247, + "loss": 1.708, + "step": 7254 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027398652042246835, + "loss": 1.6674, + "step": 7255 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027397956365741196, + "loss": 1.6944, + "step": 7256 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002739726060506028, + "loss": 1.6932, + "step": 7257 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027396564760208804, + "loss": 1.6736, + "step": 7258 + }, + { + "epoch": 0.57, + "learning_rate": 0.000273958688311915, + "loss": 1.692, + "step": 7259 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027395172818013076, + "loss": 1.6457, + "step": 7260 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002739447672067828, + "loss": 1.6636, + "step": 7261 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027393780539191817, + "loss": 1.6826, + "step": 7262 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002739308427355843, + "loss": 1.7193, + "step": 7263 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027392387923782835, + "loss": 1.6984, + "step": 7264 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002739169148986977, + "loss": 1.6863, + "step": 7265 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002739099497182395, + "loss": 1.7484, + "step": 7266 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002739029836965012, + "loss": 1.7186, + "step": 7267 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027389601683353, + "loss": 1.7261, + "step": 7268 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027388904912937324, + "loss": 1.7251, + "step": 7269 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002738820805840781, + "loss": 1.6625, + "step": 7270 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002738751111976921, + "loss": 1.645, + "step": 7271 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002738681409702624, + "loss": 1.6945, + "step": 7272 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002738611699018364, + "loss": 1.6807, + "step": 7273 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002738541979924614, + "loss": 1.7028, + "step": 7274 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002738472252421848, + "loss": 1.7183, + "step": 7275 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002738402516510538, + "loss": 1.6715, + "step": 7276 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002738332772191159, + "loss": 1.6736, + "step": 7277 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027382630194641835, + "loss": 1.6983, + "step": 7278 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027381932583300854, + "loss": 1.7309, + "step": 7279 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027381234887893384, + "loss": 1.6717, + "step": 7280 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027380537108424163, + "loss": 1.6581, + "step": 7281 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027379839244897925, + "loss": 1.6988, + "step": 7282 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002737914129731941, + "loss": 1.7154, + "step": 7283 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002737844326569336, + "loss": 1.656, + "step": 7284 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027377745150024513, + "loss": 1.6587, + "step": 7285 + }, + { + "epoch": 0.57, + "learning_rate": 0.000273770469503176, + "loss": 1.7215, + "step": 7286 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002737634866657737, + "loss": 1.7035, + "step": 7287 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002737565029880857, + "loss": 1.7507, + "step": 7288 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027374951847015927, + "loss": 1.6739, + "step": 7289 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002737425331120419, + "loss": 1.7164, + "step": 7290 + }, + { + "epoch": 0.57, + "learning_rate": 0.000273735546913781, + "loss": 1.7387, + "step": 7291 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027372855987542406, + "loss": 1.6993, + "step": 7292 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002737215719970185, + "loss": 1.6979, + "step": 7293 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002737145832786117, + "loss": 1.6798, + "step": 7294 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027370759372025117, + "loss": 1.6757, + "step": 7295 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027370060332198437, + "loss": 1.6954, + "step": 7296 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002736936120838587, + "loss": 1.7194, + "step": 7297 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027368662000592164, + "loss": 1.7211, + "step": 7298 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027367962708822074, + "loss": 1.6754, + "step": 7299 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027367263333080336, + "loss": 1.6892, + "step": 7300 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002736656387337171, + "loss": 1.7016, + "step": 7301 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002736586432970094, + "loss": 1.7017, + "step": 7302 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027365164702072777, + "loss": 1.6597, + "step": 7303 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002736446499049196, + "loss": 1.7208, + "step": 7304 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027363765194963254, + "loss": 1.7203, + "step": 7305 + }, + { + "epoch": 0.57, + "learning_rate": 0.00027363065315491413, + "loss": 1.6773, + "step": 7306 + }, + { + "epoch": 0.57, + "learning_rate": 0.0002736236535208117, + "loss": 1.756, + "step": 7307 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002736166530473729, + "loss": 1.7135, + "step": 7308 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027360965173464527, + "loss": 1.7484, + "step": 7309 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027360264958267635, + "loss": 1.7042, + "step": 7310 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027359564659151363, + "loss": 1.6986, + "step": 7311 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002735886427612046, + "loss": 1.6595, + "step": 7312 + }, + { + "epoch": 0.58, + "learning_rate": 0.000273581638091797, + "loss": 1.6817, + "step": 7313 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002735746325833382, + "loss": 1.6621, + "step": 7314 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002735676262358759, + "loss": 1.7131, + "step": 7315 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027356061904945753, + "loss": 1.6775, + "step": 7316 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002735536110241308, + "loss": 1.633, + "step": 7317 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002735466021599432, + "loss": 1.6893, + "step": 7318 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002735395924569424, + "loss": 1.6531, + "step": 7319 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027353258191517587, + "loss": 1.7092, + "step": 7320 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027352557053469137, + "loss": 1.7188, + "step": 7321 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002735185583155364, + "loss": 1.6959, + "step": 7322 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002735115452577585, + "loss": 1.7081, + "step": 7323 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002735045313614054, + "loss": 1.7294, + "step": 7324 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002734975166265247, + "loss": 1.6498, + "step": 7325 + }, + { + "epoch": 0.58, + "learning_rate": 0.000273490501053164, + "loss": 1.7136, + "step": 7326 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027348348464137096, + "loss": 1.6797, + "step": 7327 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002734764673911932, + "loss": 1.6597, + "step": 7328 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002734694493026784, + "loss": 1.6858, + "step": 7329 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027346243037587413, + "loss": 1.6957, + "step": 7330 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002734554106108281, + "loss": 1.707, + "step": 7331 + }, + { + "epoch": 0.58, + "learning_rate": 0.000273448390007588, + "loss": 1.6612, + "step": 7332 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027344136856620135, + "loss": 1.6894, + "step": 7333 + }, + { + "epoch": 0.58, + "learning_rate": 0.000273434346286716, + "loss": 1.7276, + "step": 7334 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002734273231691796, + "loss": 1.7069, + "step": 7335 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002734202992136397, + "loss": 1.6988, + "step": 7336 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002734132744201441, + "loss": 1.7179, + "step": 7337 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027340624878874055, + "loss": 1.6774, + "step": 7338 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002733992223194766, + "loss": 1.7101, + "step": 7339 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002733921950124, + "loss": 1.6655, + "step": 7340 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002733851668675586, + "loss": 1.7331, + "step": 7341 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002733781378849999, + "loss": 1.6466, + "step": 7342 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027337110806477177, + "loss": 1.6617, + "step": 7343 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027336407740692186, + "loss": 1.7116, + "step": 7344 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027335704591149797, + "loss": 1.6811, + "step": 7345 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027335001357854785, + "loss": 1.6613, + "step": 7346 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027334298040811915, + "loss": 1.7293, + "step": 7347 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002733359464002597, + "loss": 1.706, + "step": 7348 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027332891155501727, + "loss": 1.7406, + "step": 7349 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027332187587243955, + "loss": 1.6606, + "step": 7350 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002733148393525744, + "loss": 1.6678, + "step": 7351 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027330780199546947, + "loss": 1.6643, + "step": 7352 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002733007638011726, + "loss": 1.6802, + "step": 7353 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027329372476973167, + "loss": 1.7152, + "step": 7354 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002732866849011944, + "loss": 1.6373, + "step": 7355 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027327964419560845, + "loss": 1.7166, + "step": 7356 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002732726026530218, + "loss": 1.7315, + "step": 7357 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027326556027348225, + "loss": 1.6591, + "step": 7358 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027325851705703756, + "loss": 1.7136, + "step": 7359 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027325147300373553, + "loss": 1.7133, + "step": 7360 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027324442811362405, + "loss": 1.6686, + "step": 7361 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027323738238675086, + "loss": 1.6545, + "step": 7362 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002732303358231639, + "loss": 1.668, + "step": 7363 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027322328842291094, + "loss": 1.7098, + "step": 7364 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027321624018603985, + "loss": 1.678, + "step": 7365 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002732091911125985, + "loss": 1.7293, + "step": 7366 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002732021412026347, + "loss": 1.6602, + "step": 7367 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002731950904561964, + "loss": 1.6711, + "step": 7368 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002731880388733314, + "loss": 1.6574, + "step": 7369 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002731809864540876, + "loss": 1.667, + "step": 7370 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027317393319851286, + "loss": 1.6663, + "step": 7371 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002731668791066551, + "loss": 1.7467, + "step": 7372 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027315982417856224, + "loss": 1.7269, + "step": 7373 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002731527684142821, + "loss": 1.7135, + "step": 7374 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002731457118138626, + "loss": 1.7304, + "step": 7375 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002731386543773517, + "loss": 1.6677, + "step": 7376 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002731315961047973, + "loss": 1.6231, + "step": 7377 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002731245369962473, + "loss": 1.6929, + "step": 7378 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027311747705174963, + "loss": 1.7472, + "step": 7379 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027311041627135226, + "loss": 1.7249, + "step": 7380 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027310335465510305, + "loss": 1.6644, + "step": 7381 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027309629220305, + "loss": 1.6636, + "step": 7382 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002730892289152411, + "loss": 1.6641, + "step": 7383 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002730821647917243, + "loss": 1.6093, + "step": 7384 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027307509983254746, + "loss": 1.6596, + "step": 7385 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002730680340377586, + "loss": 1.6534, + "step": 7386 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027306096740740575, + "loss": 1.6771, + "step": 7387 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002730538999415368, + "loss": 1.7429, + "step": 7388 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002730468316401998, + "loss": 1.6808, + "step": 7389 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027303976250344275, + "loss": 1.7538, + "step": 7390 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027303269253131353, + "loss": 1.73, + "step": 7391 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027302562172386026, + "loss": 1.7462, + "step": 7392 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002730185500811309, + "loss": 1.7653, + "step": 7393 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002730114776031735, + "loss": 1.697, + "step": 7394 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027300440429003605, + "loss": 1.7309, + "step": 7395 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027299733014176655, + "loss": 1.7191, + "step": 7396 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027299025515841303, + "loss": 1.7404, + "step": 7397 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002729831793400236, + "loss": 1.7365, + "step": 7398 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027297610268664627, + "loss": 1.648, + "step": 7399 + }, + { + "epoch": 0.58, + "learning_rate": 0.000272969025198329, + "loss": 1.6472, + "step": 7400 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027296194687511993, + "loss": 1.7005, + "step": 7401 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002729548677170671, + "loss": 1.7607, + "step": 7402 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002729477877242186, + "loss": 1.6589, + "step": 7403 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027294070689662245, + "loss": 1.7632, + "step": 7404 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027293362523432677, + "loss": 1.6916, + "step": 7405 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027292654273737956, + "loss": 1.7092, + "step": 7406 + }, + { + "epoch": 0.58, + "learning_rate": 0.000272919459405829, + "loss": 1.7189, + "step": 7407 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027291237523972313, + "loss": 1.6406, + "step": 7408 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027290529023911, + "loss": 1.6986, + "step": 7409 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002728982044040379, + "loss": 1.6349, + "step": 7410 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027289111773455473, + "loss": 1.6958, + "step": 7411 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002728840302307087, + "loss": 1.7451, + "step": 7412 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002728769418925479, + "loss": 1.7363, + "step": 7413 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002728698527201205, + "loss": 1.7257, + "step": 7414 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027286276271347464, + "loss": 1.6821, + "step": 7415 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002728556718726584, + "loss": 1.7299, + "step": 7416 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002728485801977199, + "loss": 1.6805, + "step": 7417 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002728414876887073, + "loss": 1.7392, + "step": 7418 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002728343943456689, + "loss": 1.7125, + "step": 7419 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002728273001686527, + "loss": 1.693, + "step": 7420 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002728202051577069, + "loss": 1.7288, + "step": 7421 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002728131093128797, + "loss": 1.7333, + "step": 7422 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002728060126342193, + "loss": 1.659, + "step": 7423 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002727989151217738, + "loss": 1.6812, + "step": 7424 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002727918167755914, + "loss": 1.6266, + "step": 7425 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002727847175957204, + "loss": 1.7365, + "step": 7426 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002727776175822089, + "loss": 1.6815, + "step": 7427 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002727705167351051, + "loss": 1.6792, + "step": 7428 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027276341505445725, + "loss": 1.6886, + "step": 7429 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027275631254031354, + "loss": 1.6489, + "step": 7430 + }, + { + "epoch": 0.58, + "learning_rate": 0.00027274920919272225, + "loss": 1.6632, + "step": 7431 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002727421050117316, + "loss": 1.6688, + "step": 7432 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002727349999973897, + "loss": 1.726, + "step": 7433 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002727278941497449, + "loss": 1.6739, + "step": 7434 + }, + { + "epoch": 0.58, + "learning_rate": 0.0002727207874688455, + "loss": 1.7166, + "step": 7435 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002727136799547396, + "loss": 1.6968, + "step": 7436 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002727065716074756, + "loss": 1.7008, + "step": 7437 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027269946242710166, + "loss": 1.7715, + "step": 7438 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027269235241366606, + "loss": 1.7009, + "step": 7439 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002726852415672171, + "loss": 1.6875, + "step": 7440 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002726781298878031, + "loss": 1.6621, + "step": 7441 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027267101737547226, + "loss": 1.747, + "step": 7442 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002726639040302729, + "loss": 1.6621, + "step": 7443 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027265678985225334, + "loss": 1.6542, + "step": 7444 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002726496748414618, + "loss": 1.6746, + "step": 7445 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027264255899794675, + "loss": 1.72, + "step": 7446 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002726354423217564, + "loss": 1.6879, + "step": 7447 + }, + { + "epoch": 0.59, + "learning_rate": 0.000272628324812939, + "loss": 1.6036, + "step": 7448 + }, + { + "epoch": 0.59, + "learning_rate": 0.000272621206471543, + "loss": 1.6652, + "step": 7449 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027261408729761663, + "loss": 1.6986, + "step": 7450 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027260696729120834, + "loss": 1.6844, + "step": 7451 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002725998464523663, + "loss": 1.6611, + "step": 7452 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027259272478113907, + "loss": 1.689, + "step": 7453 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027258560227757487, + "loss": 1.709, + "step": 7454 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027257847894172205, + "loss": 1.7184, + "step": 7455 + }, + { + "epoch": 0.59, + "learning_rate": 0.000272571354773629, + "loss": 1.677, + "step": 7456 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027256422977334406, + "loss": 1.7562, + "step": 7457 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002725571039409157, + "loss": 1.7093, + "step": 7458 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002725499772763922, + "loss": 1.7101, + "step": 7459 + }, + { + "epoch": 0.59, + "learning_rate": 0.000272542849779822, + "loss": 1.7496, + "step": 7460 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027253572145125347, + "loss": 1.6623, + "step": 7461 + }, + { + "epoch": 0.59, + "learning_rate": 0.000272528592290735, + "loss": 1.6913, + "step": 7462 + }, + { + "epoch": 0.59, + "learning_rate": 0.000272521462298315, + "loss": 1.6682, + "step": 7463 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002725143314740419, + "loss": 1.6638, + "step": 7464 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002725071998179641, + "loss": 1.6805, + "step": 7465 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027250006733013003, + "loss": 1.7034, + "step": 7466 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002724929340105881, + "loss": 1.6365, + "step": 7467 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002724857998593867, + "loss": 1.7336, + "step": 7468 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002724786648765743, + "loss": 1.758, + "step": 7469 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002724715290621995, + "loss": 1.7362, + "step": 7470 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002724643924163104, + "loss": 1.7271, + "step": 7471 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002724572549389558, + "loss": 1.6865, + "step": 7472 + }, + { + "epoch": 0.59, + "learning_rate": 0.000272450116630184, + "loss": 1.6176, + "step": 7473 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027244297749004346, + "loss": 1.642, + "step": 7474 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027243583751858266, + "loss": 1.6027, + "step": 7475 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027242869671585007, + "loss": 1.7254, + "step": 7476 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027242155508189425, + "loss": 1.6935, + "step": 7477 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002724144126167636, + "loss": 1.6866, + "step": 7478 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002724072693205066, + "loss": 1.6449, + "step": 7479 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027240012519317186, + "loss": 1.6805, + "step": 7480 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002723929802348078, + "loss": 1.7547, + "step": 7481 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002723858344454629, + "loss": 1.7058, + "step": 7482 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002723786878251858, + "loss": 1.6961, + "step": 7483 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027237154037402486, + "loss": 1.7095, + "step": 7484 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027236439209202875, + "loss": 1.7127, + "step": 7485 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002723572429792459, + "loss": 1.673, + "step": 7486 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027235009303572494, + "loss": 1.705, + "step": 7487 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002723429422615143, + "loss": 1.7004, + "step": 7488 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002723357906566627, + "loss": 1.6681, + "step": 7489 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027232863822121856, + "loss": 1.6708, + "step": 7490 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002723214849552304, + "loss": 1.6854, + "step": 7491 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027231433085874693, + "loss": 1.6313, + "step": 7492 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027230717593181665, + "loss": 1.6786, + "step": 7493 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002723000201744881, + "loss": 1.7119, + "step": 7494 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002722928635868099, + "loss": 1.6515, + "step": 7495 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002722857061688307, + "loss": 1.7052, + "step": 7496 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027227854792059896, + "loss": 1.6641, + "step": 7497 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002722713888421634, + "loss": 1.714, + "step": 7498 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002722642289335726, + "loss": 1.6976, + "step": 7499 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002722570681948752, + "loss": 1.6988, + "step": 7500 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002722499066261197, + "loss": 1.6927, + "step": 7501 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002722427442273548, + "loss": 1.6721, + "step": 7502 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027223558099862916, + "loss": 1.6471, + "step": 7503 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027222841693999133, + "loss": 1.6269, + "step": 7504 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027222125205149004, + "loss": 1.704, + "step": 7505 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027221408633317385, + "loss": 1.6941, + "step": 7506 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002722069197850915, + "loss": 1.7167, + "step": 7507 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002721997524072916, + "loss": 1.7624, + "step": 7508 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027219258419982283, + "loss": 1.6585, + "step": 7509 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002721854151627338, + "loss": 1.6781, + "step": 7510 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027217824529607326, + "loss": 1.6971, + "step": 7511 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002721710745998899, + "loss": 1.7003, + "step": 7512 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027216390307423233, + "loss": 1.7285, + "step": 7513 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002721567307191492, + "loss": 1.6951, + "step": 7514 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002721495575346894, + "loss": 1.7496, + "step": 7515 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002721423835209014, + "loss": 1.6229, + "step": 7516 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002721352086778341, + "loss": 1.6905, + "step": 7517 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027212803300553614, + "loss": 1.6032, + "step": 7518 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027212085650405615, + "loss": 1.71, + "step": 7519 + }, + { + "epoch": 0.59, + "learning_rate": 0.000272113679173443, + "loss": 1.7566, + "step": 7520 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027210650101374534, + "loss": 1.7173, + "step": 7521 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027209932202501195, + "loss": 1.6939, + "step": 7522 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002720921422072915, + "loss": 1.7184, + "step": 7523 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002720849615606328, + "loss": 1.7055, + "step": 7524 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027207778008508455, + "loss": 1.7349, + "step": 7525 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002720705977806956, + "loss": 1.6973, + "step": 7526 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002720634146475146, + "loss": 1.7144, + "step": 7527 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002720562306855904, + "loss": 1.7277, + "step": 7528 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027204904589497175, + "loss": 1.7266, + "step": 7529 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002720418602757075, + "loss": 1.7176, + "step": 7530 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002720346738278462, + "loss": 1.6831, + "step": 7531 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027202748655143693, + "loss": 1.6788, + "step": 7532 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027202029844652833, + "loss": 1.6641, + "step": 7533 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002720131095131693, + "loss": 1.6553, + "step": 7534 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002720059197514085, + "loss": 1.7215, + "step": 7535 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027199872916129495, + "loss": 1.6752, + "step": 7536 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002719915377428772, + "loss": 1.7179, + "step": 7537 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027198434549620436, + "loss": 1.6815, + "step": 7538 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002719771524213251, + "loss": 1.7041, + "step": 7539 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027196995851828823, + "loss": 1.7207, + "step": 7540 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002719627637871427, + "loss": 1.6795, + "step": 7541 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027195556822793724, + "loss": 1.6931, + "step": 7542 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027194837184072086, + "loss": 1.6665, + "step": 7543 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002719411746255423, + "loss": 1.7126, + "step": 7544 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027193397658245046, + "loss": 1.671, + "step": 7545 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002719267777114942, + "loss": 1.6831, + "step": 7546 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002719195780127224, + "loss": 1.678, + "step": 7547 + }, + { + "epoch": 0.59, + "learning_rate": 0.000271912377486184, + "loss": 1.6946, + "step": 7548 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027190517613192775, + "loss": 1.7116, + "step": 7549 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002718979739500027, + "loss": 1.6463, + "step": 7550 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027189077094045763, + "loss": 1.6066, + "step": 7551 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002718835671033415, + "loss": 1.6624, + "step": 7552 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002718763624387032, + "loss": 1.7158, + "step": 7553 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002718691569465917, + "loss": 1.6491, + "step": 7554 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027186195062705584, + "loss": 1.7374, + "step": 7555 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027185474348014456, + "loss": 1.743, + "step": 7556 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002718475355059069, + "loss": 1.6777, + "step": 7557 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002718403267043916, + "loss": 1.6868, + "step": 7558 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002718331170756478, + "loss": 1.6627, + "step": 7559 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027182590661972434, + "loss": 1.6575, + "step": 7560 + }, + { + "epoch": 0.59, + "learning_rate": 0.0002718186953366702, + "loss": 1.6577, + "step": 7561 + }, + { + "epoch": 0.59, + "learning_rate": 0.00027181148322653437, + "loss": 1.7298, + "step": 7562 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027180427028936576, + "loss": 1.6644, + "step": 7563 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002717970565252134, + "loss": 1.6828, + "step": 7564 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027178984193412624, + "loss": 1.6782, + "step": 7565 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027178262651615323, + "loss": 1.7056, + "step": 7566 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002717754102713434, + "loss": 1.7003, + "step": 7567 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027176819319974573, + "loss": 1.6483, + "step": 7568 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027176097530140925, + "loss": 1.6868, + "step": 7569 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027175375657638294, + "loss": 1.7036, + "step": 7570 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027174653702471583, + "loss": 1.6919, + "step": 7571 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002717393166464569, + "loss": 1.6507, + "step": 7572 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027173209544165513, + "loss": 1.6637, + "step": 7573 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002717248734103597, + "loss": 1.7043, + "step": 7574 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002717176505526195, + "loss": 1.7313, + "step": 7575 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027171042686848363, + "loss": 1.6536, + "step": 7576 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027170320235800116, + "loss": 1.6796, + "step": 7577 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027169597702122105, + "loss": 1.7097, + "step": 7578 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002716887508581925, + "loss": 1.6431, + "step": 7579 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002716815238689644, + "loss": 1.6832, + "step": 7580 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002716742960535859, + "loss": 1.6959, + "step": 7581 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027166706741210613, + "loss": 1.6647, + "step": 7582 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002716598379445741, + "loss": 1.7074, + "step": 7583 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002716526076510389, + "loss": 1.7063, + "step": 7584 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002716453765315496, + "loss": 1.6459, + "step": 7585 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002716381445861554, + "loss": 1.6759, + "step": 7586 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027163091181490524, + "loss": 1.6879, + "step": 7587 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027162367821784834, + "loss": 1.6841, + "step": 7588 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002716164437950338, + "loss": 1.729, + "step": 7589 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002716092085465107, + "loss": 1.6496, + "step": 7590 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002716019724723282, + "loss": 1.7051, + "step": 7591 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002715947355725354, + "loss": 1.6829, + "step": 7592 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027158749784718145, + "loss": 1.7166, + "step": 7593 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002715802592963155, + "loss": 1.6905, + "step": 7594 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027157301991998666, + "loss": 1.6995, + "step": 7595 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002715657797182441, + "loss": 1.7148, + "step": 7596 + }, + { + "epoch": 0.6, + "learning_rate": 0.000271558538691137, + "loss": 1.6967, + "step": 7597 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027155129683871455, + "loss": 1.6451, + "step": 7598 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002715440541610258, + "loss": 1.6819, + "step": 7599 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027153681065811996, + "loss": 1.6892, + "step": 7600 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027152956633004634, + "loss": 1.716, + "step": 7601 + }, + { + "epoch": 0.6, + "learning_rate": 0.000271522321176854, + "loss": 1.6712, + "step": 7602 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027151507519859215, + "loss": 1.6829, + "step": 7603 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027150782839530996, + "loss": 1.6926, + "step": 7604 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002715005807670567, + "loss": 1.6415, + "step": 7605 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002714933323138816, + "loss": 1.7427, + "step": 7606 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002714860830358338, + "loss": 1.7141, + "step": 7607 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027147883293296253, + "loss": 1.7217, + "step": 7608 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027147158200531695, + "loss": 1.6666, + "step": 7609 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002714643302529464, + "loss": 1.6895, + "step": 7610 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002714570776759001, + "loss": 1.7176, + "step": 7611 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027144982427422727, + "loss": 1.651, + "step": 7612 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002714425700479772, + "loss": 1.6567, + "step": 7613 + }, + { + "epoch": 0.6, + "learning_rate": 0.000271435314997199, + "loss": 1.6357, + "step": 7614 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027142805912194203, + "loss": 1.7244, + "step": 7615 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002714208024222556, + "loss": 1.6917, + "step": 7616 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027141354489818893, + "loss": 1.6865, + "step": 7617 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027140628654979124, + "loss": 1.664, + "step": 7618 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027139902737711194, + "loss": 1.6724, + "step": 7619 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002713917673802002, + "loss": 1.6994, + "step": 7620 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002713845065591053, + "loss": 1.7345, + "step": 7621 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002713772449138766, + "loss": 1.7213, + "step": 7622 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027136998244456346, + "loss": 1.6804, + "step": 7623 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027136271915121507, + "loss": 1.6839, + "step": 7624 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027135545503388083, + "loss": 1.6774, + "step": 7625 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027134819009261, + "loss": 1.7246, + "step": 7626 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027134092432745183, + "loss": 1.7027, + "step": 7627 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027133365773845584, + "loss": 1.6628, + "step": 7628 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002713263903256713, + "loss": 1.6895, + "step": 7629 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027131912208914745, + "loss": 1.7026, + "step": 7630 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002713118530289338, + "loss": 1.6778, + "step": 7631 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027130458314507947, + "loss": 1.6521, + "step": 7632 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002712973124376341, + "loss": 1.7371, + "step": 7633 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002712900409066468, + "loss": 1.7016, + "step": 7634 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027128276855216713, + "loss": 1.6897, + "step": 7635 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002712754953742444, + "loss": 1.7815, + "step": 7636 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027126822137292793, + "loss": 1.7339, + "step": 7637 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027126094654826723, + "loss": 1.7283, + "step": 7638 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027125367090031154, + "loss": 1.6899, + "step": 7639 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002712463944291104, + "loss": 1.7126, + "step": 7640 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002712391171347131, + "loss": 1.66, + "step": 7641 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027123183901716914, + "loss": 1.6935, + "step": 7642 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002712245600765279, + "loss": 1.6505, + "step": 7643 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002712172803128387, + "loss": 1.7, + "step": 7644 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002712099997261512, + "loss": 1.6673, + "step": 7645 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002712027183165146, + "loss": 1.726, + "step": 7646 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027119543608397845, + "loss": 1.6576, + "step": 7647 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002711881530285922, + "loss": 1.6803, + "step": 7648 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027118086915040523, + "loss": 1.6988, + "step": 7649 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027117358444946705, + "loss": 1.7356, + "step": 7650 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002711662989258271, + "loss": 1.6083, + "step": 7651 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027115901257953484, + "loss": 1.6747, + "step": 7652 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002711517254106397, + "loss": 1.6436, + "step": 7653 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027114443741919127, + "loss": 1.6734, + "step": 7654 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027113714860523897, + "loss": 1.6759, + "step": 7655 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002711298589688322, + "loss": 1.6685, + "step": 7656 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027112256851002063, + "loss": 1.6957, + "step": 7657 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002711152772288536, + "loss": 1.6581, + "step": 7658 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027110798512538066, + "loss": 1.6624, + "step": 7659 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027110069219965136, + "loss": 1.6734, + "step": 7660 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002710933984517152, + "loss": 1.6636, + "step": 7661 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002710861038816217, + "loss": 1.657, + "step": 7662 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002710788084894204, + "loss": 1.6635, + "step": 7663 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002710715122751607, + "loss": 1.6743, + "step": 7664 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002710642152388923, + "loss": 1.648, + "step": 7665 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002710569173806647, + "loss": 1.6809, + "step": 7666 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027104961870052743, + "loss": 1.6991, + "step": 7667 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027104231919853006, + "loss": 1.6813, + "step": 7668 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027103501887472213, + "loss": 1.6652, + "step": 7669 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002710277177291532, + "loss": 1.6722, + "step": 7670 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027102041576187286, + "loss": 1.671, + "step": 7671 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002710131129729307, + "loss": 1.6618, + "step": 7672 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027100580936237627, + "loss": 1.7084, + "step": 7673 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027099850493025917, + "loss": 1.6027, + "step": 7674 + }, + { + "epoch": 0.6, + "learning_rate": 0.000270991199676629, + "loss": 1.7443, + "step": 7675 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027098389360153536, + "loss": 1.7147, + "step": 7676 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027097658670502785, + "loss": 1.6694, + "step": 7677 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027096927898715605, + "loss": 1.6139, + "step": 7678 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027096197044796966, + "loss": 1.6711, + "step": 7679 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002709546610875182, + "loss": 1.6158, + "step": 7680 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002709473509058513, + "loss": 1.6948, + "step": 7681 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027094003990301867, + "loss": 1.7084, + "step": 7682 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002709327280790699, + "loss": 1.6321, + "step": 7683 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027092541543405466, + "loss": 1.6759, + "step": 7684 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002709181019680226, + "loss": 1.6781, + "step": 7685 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027091078768102335, + "loss": 1.7327, + "step": 7686 + }, + { + "epoch": 0.6, + "learning_rate": 0.00027090347257310653, + "loss": 1.6678, + "step": 7687 + }, + { + "epoch": 0.6, + "learning_rate": 0.0002708961566443219, + "loss": 1.6637, + "step": 7688 + }, + { + "epoch": 0.6, + "learning_rate": 0.000270888839894719, + "loss": 1.666, + "step": 7689 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027088152232434767, + "loss": 1.6964, + "step": 7690 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002708742039332575, + "loss": 1.6335, + "step": 7691 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027086688472149813, + "loss": 1.7199, + "step": 7692 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002708595646891194, + "loss": 1.7476, + "step": 7693 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027085224383617085, + "loss": 1.6736, + "step": 7694 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002708449221627023, + "loss": 1.6997, + "step": 7695 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027083759966876344, + "loss": 1.7053, + "step": 7696 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002708302763544039, + "loss": 1.6823, + "step": 7697 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027082295221967354, + "loss": 1.6817, + "step": 7698 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027081562726462196, + "loss": 1.6933, + "step": 7699 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002708083014892989, + "loss": 1.7048, + "step": 7700 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002708009748937542, + "loss": 1.6492, + "step": 7701 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002707936474780375, + "loss": 1.683, + "step": 7702 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027078631924219867, + "loss": 1.7572, + "step": 7703 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002707789901862873, + "loss": 1.6935, + "step": 7704 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027077166031035327, + "loss": 1.6798, + "step": 7705 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002707643296144463, + "loss": 1.6856, + "step": 7706 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002707569980986162, + "loss": 1.7108, + "step": 7707 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002707496657629127, + "loss": 1.6775, + "step": 7708 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002707423326073856, + "loss": 1.6686, + "step": 7709 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002707349986320848, + "loss": 1.713, + "step": 7710 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002707276638370599, + "loss": 1.7308, + "step": 7711 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027072032822236076, + "loss": 1.645, + "step": 7712 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027071299178803727, + "loss": 1.5611, + "step": 7713 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002707056545341391, + "loss": 1.6941, + "step": 7714 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027069831646071624, + "loss": 1.7899, + "step": 7715 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002706909775678184, + "loss": 1.6771, + "step": 7716 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027068363785549533, + "loss": 1.7044, + "step": 7717 + }, + { + "epoch": 0.61, + "learning_rate": 0.000270676297323797, + "loss": 1.7449, + "step": 7718 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002706689559727733, + "loss": 1.689, + "step": 7719 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027066161380247386, + "loss": 1.6919, + "step": 7720 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027065427081294873, + "loss": 1.6797, + "step": 7721 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002706469270042476, + "loss": 1.6803, + "step": 7722 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002706395823764205, + "loss": 1.7253, + "step": 7723 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027063223692951716, + "loss": 1.6653, + "step": 7724 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027062489066358755, + "loss": 1.7012, + "step": 7725 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002706175435786815, + "loss": 1.7188, + "step": 7726 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002706101956748488, + "loss": 1.7028, + "step": 7727 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002706028469521395, + "loss": 1.7062, + "step": 7728 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002705954974106034, + "loss": 1.6785, + "step": 7729 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027058814705029045, + "loss": 1.6871, + "step": 7730 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002705807958712505, + "loss": 1.6439, + "step": 7731 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002705734438735335, + "loss": 1.689, + "step": 7732 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002705660910571894, + "loss": 1.6852, + "step": 7733 + }, + { + "epoch": 0.61, + "learning_rate": 0.000270558737422268, + "loss": 1.5901, + "step": 7734 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002705513829688193, + "loss": 1.7427, + "step": 7735 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002705440276968933, + "loss": 1.7023, + "step": 7736 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027053667160653984, + "loss": 1.6657, + "step": 7737 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002705293146978089, + "loss": 1.7394, + "step": 7738 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002705219569707504, + "loss": 1.6606, + "step": 7739 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002705145984254144, + "loss": 1.6896, + "step": 7740 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027050723906185074, + "loss": 1.7368, + "step": 7741 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027049987888010937, + "loss": 1.7081, + "step": 7742 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002704925178802404, + "loss": 1.7303, + "step": 7743 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027048515606229367, + "loss": 1.6666, + "step": 7744 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027047779342631925, + "loss": 1.7523, + "step": 7745 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002704704299723671, + "loss": 1.696, + "step": 7746 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002704630657004872, + "loss": 1.6861, + "step": 7747 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027045570061072955, + "loss": 1.6846, + "step": 7748 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027044833470314417, + "loss": 1.6473, + "step": 7749 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002704409679777811, + "loss": 1.6845, + "step": 7750 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002704336004346903, + "loss": 1.7137, + "step": 7751 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002704262320739218, + "loss": 1.7047, + "step": 7752 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002704188628955257, + "loss": 1.6997, + "step": 7753 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027041149289955187, + "loss": 1.7023, + "step": 7754 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027040412208605055, + "loss": 1.73, + "step": 7755 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002703967504550716, + "loss": 1.6937, + "step": 7756 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002703893780066652, + "loss": 1.6907, + "step": 7757 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027038200474088135, + "loss": 1.7197, + "step": 7758 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027037463065777013, + "loss": 1.6411, + "step": 7759 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002703672557573816, + "loss": 1.6598, + "step": 7760 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027035988003976585, + "loss": 1.7087, + "step": 7761 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002703525035049729, + "loss": 1.6556, + "step": 7762 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027034512615305286, + "loss": 1.5966, + "step": 7763 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002703377479840559, + "loss": 1.6523, + "step": 7764 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002703303689980319, + "loss": 1.6382, + "step": 7765 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002703229891950312, + "loss": 1.6864, + "step": 7766 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002703156085751038, + "loss": 1.6932, + "step": 7767 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002703082271382998, + "loss": 1.7289, + "step": 7768 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002703008448846693, + "loss": 1.6609, + "step": 7769 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027029346181426246, + "loss": 1.6464, + "step": 7770 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027028607792712944, + "loss": 1.658, + "step": 7771 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027027869322332026, + "loss": 1.7308, + "step": 7772 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002702713077028852, + "loss": 1.687, + "step": 7773 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027026392136587425, + "loss": 1.6734, + "step": 7774 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027025653421233775, + "loss": 1.6608, + "step": 7775 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002702491462423257, + "loss": 1.7244, + "step": 7776 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027024175745588827, + "loss": 1.6772, + "step": 7777 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002702343678530757, + "loss": 1.7196, + "step": 7778 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002702269774339381, + "loss": 1.6846, + "step": 7779 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002702195861985257, + "loss": 1.6852, + "step": 7780 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002702121941468886, + "loss": 1.662, + "step": 7781 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027020480127907707, + "loss": 1.6846, + "step": 7782 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002701974075951413, + "loss": 1.682, + "step": 7783 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002701900130951314, + "loss": 1.7145, + "step": 7784 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002701826177790977, + "loss": 1.6503, + "step": 7785 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002701752216470903, + "loss": 1.6752, + "step": 7786 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002701678246991595, + "loss": 1.6866, + "step": 7787 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002701604269353555, + "loss": 1.6393, + "step": 7788 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027015302835572844, + "loss": 1.7086, + "step": 7789 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027014562896032865, + "loss": 1.7065, + "step": 7790 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002701382287492064, + "loss": 1.6913, + "step": 7791 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002701308277224118, + "loss": 1.7747, + "step": 7792 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002701234258799952, + "loss": 1.6597, + "step": 7793 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002701160232220068, + "loss": 1.699, + "step": 7794 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027010861974849696, + "loss": 1.683, + "step": 7795 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027010121545951586, + "loss": 1.7259, + "step": 7796 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027009381035511374, + "loss": 1.6702, + "step": 7797 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002700864044353409, + "loss": 1.7118, + "step": 7798 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027007899770024776, + "loss": 1.6849, + "step": 7799 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002700715901498844, + "loss": 1.6357, + "step": 7800 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002700641817843012, + "loss": 1.6534, + "step": 7801 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027005677260354843, + "loss": 1.6837, + "step": 7802 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027004936260767654, + "loss": 1.6363, + "step": 7803 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027004195179673566, + "loss": 1.6498, + "step": 7804 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027003454017077616, + "loss": 1.7204, + "step": 7805 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027002712772984834, + "loss": 1.6746, + "step": 7806 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002700197144740026, + "loss": 1.673, + "step": 7807 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002700123004032893, + "loss": 1.6588, + "step": 7808 + }, + { + "epoch": 0.61, + "learning_rate": 0.00027000488551775863, + "loss": 1.6707, + "step": 7809 + }, + { + "epoch": 0.61, + "learning_rate": 0.00026999746981746104, + "loss": 1.6246, + "step": 7810 + }, + { + "epoch": 0.61, + "learning_rate": 0.00026999005330244683, + "loss": 1.6991, + "step": 7811 + }, + { + "epoch": 0.61, + "learning_rate": 0.00026998263597276636, + "loss": 1.6535, + "step": 7812 + }, + { + "epoch": 0.61, + "learning_rate": 0.00026997521782847004, + "loss": 1.6328, + "step": 7813 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002699677988696082, + "loss": 1.672, + "step": 7814 + }, + { + "epoch": 0.61, + "learning_rate": 0.00026996037909623116, + "loss": 1.6721, + "step": 7815 + }, + { + "epoch": 0.61, + "learning_rate": 0.0002699529585083894, + "loss": 1.6931, + "step": 7816 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026994553710613323, + "loss": 1.6709, + "step": 7817 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026993811488951305, + "loss": 1.7594, + "step": 7818 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026993069185857926, + "loss": 1.6703, + "step": 7819 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026992326801338225, + "loss": 1.659, + "step": 7820 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002699158433539724, + "loss": 1.6641, + "step": 7821 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002699084178804002, + "loss": 1.7007, + "step": 7822 + }, + { + "epoch": 0.62, + "learning_rate": 0.000269900991592716, + "loss": 1.6525, + "step": 7823 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002698935644909702, + "loss": 1.6699, + "step": 7824 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002698861365752133, + "loss": 1.715, + "step": 7825 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002698787078454957, + "loss": 1.6312, + "step": 7826 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002698712783018678, + "loss": 1.705, + "step": 7827 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002698638479443801, + "loss": 1.6992, + "step": 7828 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026985641677308296, + "loss": 1.6437, + "step": 7829 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026984898478802695, + "loss": 1.6819, + "step": 7830 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026984155198926245, + "loss": 1.6611, + "step": 7831 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026983411837683995, + "loss": 1.6746, + "step": 7832 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002698266839508099, + "loss": 1.7234, + "step": 7833 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026981924871122287, + "loss": 1.7195, + "step": 7834 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026981181265812917, + "loss": 1.6817, + "step": 7835 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002698043757915794, + "loss": 1.6272, + "step": 7836 + }, + { + "epoch": 0.62, + "learning_rate": 0.000269796938111624, + "loss": 1.692, + "step": 7837 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026978949961831356, + "loss": 1.6702, + "step": 7838 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002697820603116985, + "loss": 1.6806, + "step": 7839 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026977462019182934, + "loss": 1.6646, + "step": 7840 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002697671792587567, + "loss": 1.655, + "step": 7841 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026975973751253087, + "loss": 1.7019, + "step": 7842 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002697522949532026, + "loss": 1.6034, + "step": 7843 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002697448515808223, + "loss": 1.6622, + "step": 7844 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002697374073954405, + "loss": 1.7003, + "step": 7845 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002697299623971078, + "loss": 1.7274, + "step": 7846 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002697225165858748, + "loss": 1.6939, + "step": 7847 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002697150699617919, + "loss": 1.6633, + "step": 7848 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026970762252490977, + "loss": 1.6455, + "step": 7849 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026970017427527894, + "loss": 1.7162, + "step": 7850 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026969272521294995, + "loss": 1.7257, + "step": 7851 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002696852753379734, + "loss": 1.7001, + "step": 7852 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026967782465039995, + "loss": 1.6862, + "step": 7853 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002696703731502801, + "loss": 1.6244, + "step": 7854 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026966292083766447, + "loss": 1.652, + "step": 7855 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002696554677126036, + "loss": 1.6518, + "step": 7856 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002696480137751481, + "loss": 1.6362, + "step": 7857 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026964055902534866, + "loss": 1.688, + "step": 7858 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002696331034632559, + "loss": 1.6737, + "step": 7859 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002696256470889203, + "loss": 1.6757, + "step": 7860 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026961818990239265, + "loss": 1.7131, + "step": 7861 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026961073190372343, + "loss": 1.6642, + "step": 7862 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002696032730929634, + "loss": 1.6989, + "step": 7863 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026959581347016305, + "loss": 1.6412, + "step": 7864 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026958835303537325, + "loss": 1.6775, + "step": 7865 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026958089178864445, + "loss": 1.658, + "step": 7866 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026957342973002744, + "loss": 1.6525, + "step": 7867 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026956596685957275, + "loss": 1.6795, + "step": 7868 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026955850317733116, + "loss": 1.6942, + "step": 7869 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002695510386833534, + "loss": 1.655, + "step": 7870 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026954357337768996, + "loss": 1.6853, + "step": 7871 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026953610726039167, + "loss": 1.6029, + "step": 7872 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002695286403315091, + "loss": 1.6674, + "step": 7873 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002695211725910931, + "loss": 1.6964, + "step": 7874 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026951370403919433, + "loss": 1.7697, + "step": 7875 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002695062346758634, + "loss": 1.6439, + "step": 7876 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002694987645011511, + "loss": 1.6776, + "step": 7877 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002694912935151081, + "loss": 1.6482, + "step": 7878 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002694838217177852, + "loss": 1.7287, + "step": 7879 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026947634910923305, + "loss": 1.6736, + "step": 7880 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026946887568950244, + "loss": 1.7489, + "step": 7881 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026946140145864413, + "loss": 1.6102, + "step": 7882 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026945392641670876, + "loss": 1.6736, + "step": 7883 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026944645056374724, + "loss": 1.6409, + "step": 7884 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002694389738998102, + "loss": 1.6954, + "step": 7885 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002694314964249484, + "loss": 1.6533, + "step": 7886 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002694240181392126, + "loss": 1.674, + "step": 7887 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026941653904265374, + "loss": 1.6555, + "step": 7888 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002694090591353224, + "loss": 1.6473, + "step": 7889 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002694015784172695, + "loss": 1.6539, + "step": 7890 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026939409688854575, + "loss": 1.6771, + "step": 7891 + }, + { + "epoch": 0.62, + "learning_rate": 0.000269386614549202, + "loss": 1.6686, + "step": 7892 + }, + { + "epoch": 0.62, + "learning_rate": 0.000269379131399289, + "loss": 1.6812, + "step": 7893 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026937164743885754, + "loss": 1.6667, + "step": 7894 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002693641626679585, + "loss": 1.6442, + "step": 7895 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026935667708664267, + "loss": 1.686, + "step": 7896 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026934919069496085, + "loss": 1.7095, + "step": 7897 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002693417034929639, + "loss": 1.6472, + "step": 7898 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026933421548070265, + "loss": 1.6792, + "step": 7899 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002693267266582279, + "loss": 1.7338, + "step": 7900 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002693192370255905, + "loss": 1.8002, + "step": 7901 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002693117465828414, + "loss": 1.6385, + "step": 7902 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026930425533003136, + "loss": 1.6931, + "step": 7903 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026929676326721124, + "loss": 1.6821, + "step": 7904 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026928927039443197, + "loss": 1.6751, + "step": 7905 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026928177671174436, + "loss": 1.6336, + "step": 7906 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002692742822191993, + "loss": 1.6661, + "step": 7907 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002692667869168477, + "loss": 1.6494, + "step": 7908 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026925929080474047, + "loss": 1.6953, + "step": 7909 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002692517938829284, + "loss": 1.6734, + "step": 7910 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002692442961514625, + "loss": 1.7193, + "step": 7911 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002692367976103936, + "loss": 1.6322, + "step": 7912 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002692292982597726, + "loss": 1.5961, + "step": 7913 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002692217980996506, + "loss": 1.6965, + "step": 7914 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002692142971300783, + "loss": 1.6774, + "step": 7915 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002692067953511067, + "loss": 1.6905, + "step": 7916 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002691992927627868, + "loss": 1.7207, + "step": 7917 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002691917893651694, + "loss": 1.7294, + "step": 7918 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026918428515830555, + "loss": 1.7074, + "step": 7919 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002691767801422462, + "loss": 1.7388, + "step": 7920 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002691692743170423, + "loss": 1.7046, + "step": 7921 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002691617676827448, + "loss": 1.6875, + "step": 7922 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002691542602394046, + "loss": 1.705, + "step": 7923 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026914675198707276, + "loss": 1.6737, + "step": 7924 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002691392429258002, + "loss": 1.6599, + "step": 7925 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026913173305563793, + "loss": 1.6479, + "step": 7926 + }, + { + "epoch": 0.62, + "learning_rate": 0.000269124222376637, + "loss": 1.7129, + "step": 7927 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026911671088884824, + "loss": 1.6592, + "step": 7928 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002691091985923228, + "loss": 1.646, + "step": 7929 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026910168548711157, + "loss": 1.6659, + "step": 7930 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026909417157326574, + "loss": 1.6579, + "step": 7931 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002690866568508361, + "loss": 1.6447, + "step": 7932 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026907914131987386, + "loss": 1.6983, + "step": 7933 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026907162498042994, + "loss": 1.674, + "step": 7934 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026906410783255534, + "loss": 1.7435, + "step": 7935 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026905658987630117, + "loss": 1.6837, + "step": 7936 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002690490711117185, + "loss": 1.6758, + "step": 7937 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002690415515388583, + "loss": 1.6396, + "step": 7938 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002690340311577717, + "loss": 1.7036, + "step": 7939 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026902650996850965, + "loss": 1.6679, + "step": 7940 + }, + { + "epoch": 0.62, + "learning_rate": 0.0002690189879711233, + "loss": 1.7178, + "step": 7941 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026901146516566374, + "loss": 1.7402, + "step": 7942 + }, + { + "epoch": 0.62, + "learning_rate": 0.00026900394155218195, + "loss": 1.6485, + "step": 7943 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002689964171307291, + "loss": 1.6952, + "step": 7944 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026898889190135627, + "loss": 1.6555, + "step": 7945 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026898136586411456, + "loss": 1.6018, + "step": 7946 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026897383901905496, + "loss": 1.7018, + "step": 7947 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026896631136622863, + "loss": 1.6841, + "step": 7948 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026895878290568675, + "loss": 1.6678, + "step": 7949 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002689512536374804, + "loss": 1.6184, + "step": 7950 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002689437235616606, + "loss": 1.7013, + "step": 7951 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026893619267827866, + "loss": 1.7164, + "step": 7952 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002689286609873855, + "loss": 1.7282, + "step": 7953 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026892112848903244, + "loss": 1.6961, + "step": 7954 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026891359518327047, + "loss": 1.6069, + "step": 7955 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002689060610701509, + "loss": 1.7091, + "step": 7956 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026889852614972475, + "loss": 1.6868, + "step": 7957 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026889099042204324, + "loss": 1.6756, + "step": 7958 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002688834538871575, + "loss": 1.7184, + "step": 7959 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002688759165451187, + "loss": 1.6596, + "step": 7960 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026886837839597803, + "loss": 1.6758, + "step": 7961 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026886083943978667, + "loss": 1.6293, + "step": 7962 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002688532996765958, + "loss": 1.6653, + "step": 7963 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002688457591064566, + "loss": 1.6791, + "step": 7964 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002688382177294203, + "loss": 1.6436, + "step": 7965 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026883067554553814, + "loss": 1.6405, + "step": 7966 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002688231325548612, + "loss": 1.6868, + "step": 7967 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002688155887574408, + "loss": 1.6961, + "step": 7968 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026880804415332807, + "loss": 1.6919, + "step": 7969 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026880049874257423, + "loss": 1.647, + "step": 7970 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002687929525252307, + "loss": 1.7107, + "step": 7971 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002687854055013485, + "loss": 1.6925, + "step": 7972 + }, + { + "epoch": 0.63, + "learning_rate": 0.000268777857670979, + "loss": 1.6872, + "step": 7973 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026877030903417335, + "loss": 1.7126, + "step": 7974 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026876275959098286, + "loss": 1.6558, + "step": 7975 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026875520934145874, + "loss": 1.7005, + "step": 7976 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026874765828565234, + "loss": 1.6815, + "step": 7977 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002687401064236148, + "loss": 1.6932, + "step": 7978 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002687325537553975, + "loss": 1.6381, + "step": 7979 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002687250002810517, + "loss": 1.6071, + "step": 7980 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026871744600062865, + "loss": 1.6768, + "step": 7981 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002687098909141797, + "loss": 1.6963, + "step": 7982 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026870233502175605, + "loss": 1.6512, + "step": 7983 + }, + { + "epoch": 0.63, + "learning_rate": 0.000268694778323409, + "loss": 1.6491, + "step": 7984 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026868722081919, + "loss": 1.6878, + "step": 7985 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002686796625091502, + "loss": 1.673, + "step": 7986 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026867210339334105, + "loss": 1.6792, + "step": 7987 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002686645434718138, + "loss": 1.6862, + "step": 7988 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026865698274461977, + "loss": 1.6718, + "step": 7989 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026864942121181026, + "loss": 1.661, + "step": 7990 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002686418588734367, + "loss": 1.6575, + "step": 7991 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026863429572955035, + "loss": 1.7183, + "step": 7992 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002686267317802026, + "loss": 1.7032, + "step": 7993 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002686191670254449, + "loss": 1.6925, + "step": 7994 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002686116014653285, + "loss": 1.6807, + "step": 7995 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002686040350999047, + "loss": 1.689, + "step": 7996 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026859646792922495, + "loss": 1.7119, + "step": 7997 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002685888999533407, + "loss": 1.6868, + "step": 7998 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026858133117230317, + "loss": 1.7426, + "step": 7999 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002685737615861639, + "loss": 1.6945, + "step": 8000 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026856619119497427, + "loss": 1.6439, + "step": 8001 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026855861999878556, + "loss": 1.722, + "step": 8002 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026855104799764927, + "loss": 1.7296, + "step": 8003 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002685434751916168, + "loss": 1.6209, + "step": 8004 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002685359015807395, + "loss": 1.6897, + "step": 8005 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002685283271650689, + "loss": 1.7329, + "step": 8006 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026852075194465635, + "loss": 1.6984, + "step": 8007 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002685131759195533, + "loss": 1.6564, + "step": 8008 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026850559908981117, + "loss": 1.7169, + "step": 8009 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002684980214554814, + "loss": 1.6742, + "step": 8010 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002684904430166155, + "loss": 1.6893, + "step": 8011 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002684828637732649, + "loss": 1.6508, + "step": 8012 + }, + { + "epoch": 0.63, + "learning_rate": 0.000268475283725481, + "loss": 1.6691, + "step": 8013 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002684677028733153, + "loss": 1.7192, + "step": 8014 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002684601212168193, + "loss": 1.6655, + "step": 8015 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002684525387560444, + "loss": 1.6709, + "step": 8016 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026844495549104214, + "loss": 1.7078, + "step": 8017 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026843737142186403, + "loss": 1.717, + "step": 8018 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002684297865485615, + "loss": 1.6707, + "step": 8019 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002684222008711861, + "loss": 1.6902, + "step": 8020 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026841461438978934, + "loss": 1.6427, + "step": 8021 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002684070271044226, + "loss": 1.6507, + "step": 8022 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026839943901513756, + "loss": 1.6883, + "step": 8023 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026839185012198565, + "loss": 1.6779, + "step": 8024 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002683842604250184, + "loss": 1.6883, + "step": 8025 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026837666992428734, + "loss": 1.709, + "step": 8026 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026836907861984405, + "loss": 1.6425, + "step": 8027 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026836148651174, + "loss": 1.6228, + "step": 8028 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002683538936000268, + "loss": 1.6381, + "step": 8029 + }, + { + "epoch": 0.63, + "learning_rate": 0.000268346299884756, + "loss": 1.6916, + "step": 8030 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026833870536597913, + "loss": 1.6401, + "step": 8031 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026833111004374773, + "loss": 1.6433, + "step": 8032 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026832351391811336, + "loss": 1.7554, + "step": 8033 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002683159169891277, + "loss": 1.6828, + "step": 8034 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026830831925684224, + "loss": 1.669, + "step": 8035 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002683007207213085, + "loss": 1.6838, + "step": 8036 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002682931213825782, + "loss": 1.6407, + "step": 8037 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002682855212407029, + "loss": 1.6445, + "step": 8038 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002682779202957342, + "loss": 1.7145, + "step": 8039 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026827031854772366, + "loss": 1.6482, + "step": 8040 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002682627159967229, + "loss": 1.6455, + "step": 8041 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002682551126427836, + "loss": 1.6741, + "step": 8042 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002682475084859574, + "loss": 1.7201, + "step": 8043 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002682399035262958, + "loss": 1.688, + "step": 8044 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002682322977638505, + "loss": 1.6639, + "step": 8045 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002682246911986732, + "loss": 1.6863, + "step": 8046 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002682170838308154, + "loss": 1.6544, + "step": 8047 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002682094756603289, + "loss": 1.6814, + "step": 8048 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002682018666872653, + "loss": 1.6869, + "step": 8049 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026819425691167626, + "loss": 1.714, + "step": 8050 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002681866463336134, + "loss": 1.6934, + "step": 8051 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026817903495312845, + "loss": 1.632, + "step": 8052 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026817142277027305, + "loss": 1.6972, + "step": 8053 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002681638097850989, + "loss": 1.6909, + "step": 8054 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026815619599765775, + "loss": 1.6625, + "step": 8055 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002681485814080011, + "loss": 1.5984, + "step": 8056 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026814096601618094, + "loss": 1.6554, + "step": 8057 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026813334982224874, + "loss": 1.6908, + "step": 8058 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002681257328262563, + "loss": 1.6707, + "step": 8059 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026811811502825534, + "loss": 1.7074, + "step": 8060 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002681104964282975, + "loss": 1.6452, + "step": 8061 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026810287702643465, + "loss": 1.7012, + "step": 8062 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002680952568227184, + "loss": 1.6252, + "step": 8063 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002680876358172005, + "loss": 1.6627, + "step": 8064 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002680800140099328, + "loss": 1.6289, + "step": 8065 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026807239140096687, + "loss": 1.6608, + "step": 8066 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026806476799035457, + "loss": 1.7209, + "step": 8067 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002680571437781477, + "loss": 1.6477, + "step": 8068 + }, + { + "epoch": 0.63, + "learning_rate": 0.00026804951876439794, + "loss": 1.7136, + "step": 8069 + }, + { + "epoch": 0.63, + "learning_rate": 0.0002680418929491571, + "loss": 1.6526, + "step": 8070 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026803426633247696, + "loss": 1.6023, + "step": 8071 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026802663891440927, + "loss": 1.6697, + "step": 8072 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026801901069500584, + "loss": 1.6448, + "step": 8073 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026801138167431847, + "loss": 1.6497, + "step": 8074 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026800375185239897, + "loss": 1.7163, + "step": 8075 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026799612122929906, + "loss": 1.6562, + "step": 8076 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002679884898050706, + "loss": 1.6522, + "step": 8077 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026798085757976547, + "loss": 1.6682, + "step": 8078 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002679732245534354, + "loss": 1.7205, + "step": 8079 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026796559072613213, + "loss": 1.6988, + "step": 8080 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026795795609790775, + "loss": 1.6689, + "step": 8081 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026795032066881386, + "loss": 1.7073, + "step": 8082 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026794268443890244, + "loss": 1.6581, + "step": 8083 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002679350474082252, + "loss": 1.6882, + "step": 8084 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002679274095768341, + "loss": 1.6925, + "step": 8085 + }, + { + "epoch": 0.64, + "learning_rate": 0.000267919770944781, + "loss": 1.7519, + "step": 8086 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002679121315121177, + "loss": 1.6465, + "step": 8087 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002679044912788961, + "loss": 1.6788, + "step": 8088 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002678968502451681, + "loss": 1.6597, + "step": 8089 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002678892084109855, + "loss": 1.6476, + "step": 8090 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026788156577640026, + "loss": 1.6792, + "step": 8091 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026787392234146423, + "loss": 1.631, + "step": 8092 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002678662781062293, + "loss": 1.7074, + "step": 8093 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002678586330707474, + "loss": 1.685, + "step": 8094 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002678509872350704, + "loss": 1.6629, + "step": 8095 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002678433405992503, + "loss": 1.644, + "step": 8096 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026783569316333886, + "loss": 1.6092, + "step": 8097 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002678280449273882, + "loss": 1.7022, + "step": 8098 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026782039589145004, + "loss": 1.6751, + "step": 8099 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026781274605557645, + "loss": 1.6853, + "step": 8100 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002678050954198193, + "loss": 1.6191, + "step": 8101 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026779744398423063, + "loss": 1.6612, + "step": 8102 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026778979174886227, + "loss": 1.6861, + "step": 8103 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002677821387137662, + "loss": 1.6706, + "step": 8104 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026777448487899446, + "loss": 1.6572, + "step": 8105 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026776683024459894, + "loss": 1.6829, + "step": 8106 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026775917481063164, + "loss": 1.7045, + "step": 8107 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002677515185771445, + "loss": 1.6156, + "step": 8108 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026774386154418953, + "loss": 1.6785, + "step": 8109 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026773620371181876, + "loss": 1.6452, + "step": 8110 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002677285450800841, + "loss": 1.672, + "step": 8111 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002677208856490376, + "loss": 1.624, + "step": 8112 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026771322541873125, + "loss": 1.6388, + "step": 8113 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002677055643892171, + "loss": 1.616, + "step": 8114 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002676979025605471, + "loss": 1.6454, + "step": 8115 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026769023993277325, + "loss": 1.7039, + "step": 8116 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002676825765059476, + "loss": 1.7104, + "step": 8117 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002676749122801223, + "loss": 1.6562, + "step": 8118 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002676672472553492, + "loss": 1.6751, + "step": 8119 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002676595814316805, + "loss": 1.711, + "step": 8120 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002676519148091681, + "loss": 1.6443, + "step": 8121 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002676442473878641, + "loss": 1.6957, + "step": 8122 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026763657916782066, + "loss": 1.6643, + "step": 8123 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026762891014908973, + "loss": 1.6219, + "step": 8124 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002676212403317234, + "loss": 1.6676, + "step": 8125 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002676135697157738, + "loss": 1.6797, + "step": 8126 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002676058983012929, + "loss": 1.6985, + "step": 8127 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002675982260883329, + "loss": 1.7225, + "step": 8128 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026759055307694585, + "loss": 1.7174, + "step": 8129 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026758287926718384, + "loss": 1.6862, + "step": 8130 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002675752046590989, + "loss": 1.6954, + "step": 8131 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026756752925274327, + "loss": 1.6927, + "step": 8132 + }, + { + "epoch": 0.64, + "learning_rate": 0.000267559853048169, + "loss": 1.6237, + "step": 8133 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026755217604542813, + "loss": 1.6414, + "step": 8134 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002675444982445729, + "loss": 1.6172, + "step": 8135 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002675368196456554, + "loss": 1.7271, + "step": 8136 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002675291402487278, + "loss": 1.6144, + "step": 8137 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026752146005384214, + "loss": 1.666, + "step": 8138 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002675137790610506, + "loss": 1.7447, + "step": 8139 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002675060972704054, + "loss": 1.7418, + "step": 8140 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002674984146819586, + "loss": 1.6182, + "step": 8141 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026749073129576245, + "loss": 1.6027, + "step": 8142 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026748304711186904, + "loss": 1.7185, + "step": 8143 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002674753621303306, + "loss": 1.6619, + "step": 8144 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026746767635119924, + "loss": 1.6, + "step": 8145 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002674599897745272, + "loss": 1.686, + "step": 8146 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002674523024003667, + "loss": 1.6941, + "step": 8147 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026744461422876977, + "loss": 1.668, + "step": 8148 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002674369252597888, + "loss": 1.6378, + "step": 8149 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026742923549347587, + "loss": 1.6949, + "step": 8150 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002674215449298833, + "loss": 1.6727, + "step": 8151 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026741385356906323, + "loss": 1.6903, + "step": 8152 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026740616141106787, + "loss": 1.6657, + "step": 8153 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002673984684559494, + "loss": 1.6796, + "step": 8154 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002673907747037602, + "loss": 1.6957, + "step": 8155 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026738308015455237, + "loss": 1.7172, + "step": 8156 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026737538480837823, + "loss": 1.7152, + "step": 8157 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026736768866529, + "loss": 1.6797, + "step": 8158 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002673599917253399, + "loss": 1.6594, + "step": 8159 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002673522939885803, + "loss": 1.6776, + "step": 8160 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002673445954550633, + "loss": 1.6824, + "step": 8161 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002673368961248413, + "loss": 1.6764, + "step": 8162 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002673291959979665, + "loss": 1.6308, + "step": 8163 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002673214950744912, + "loss": 1.6248, + "step": 8164 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002673137933544677, + "loss": 1.6441, + "step": 8165 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002673060908379483, + "loss": 1.6479, + "step": 8166 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026729838752498526, + "loss": 1.6779, + "step": 8167 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026729068341563094, + "loss": 1.6383, + "step": 8168 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026728297850993755, + "loss": 1.6761, + "step": 8169 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002672752728079575, + "loss": 1.6413, + "step": 8170 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026726756630974304, + "loss": 1.6993, + "step": 8171 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002672598590153466, + "loss": 1.6767, + "step": 8172 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002672521509248203, + "loss": 1.6667, + "step": 8173 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026724444203821666, + "loss": 1.6784, + "step": 8174 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002672367323555879, + "loss": 1.6656, + "step": 8175 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026722902187698656, + "loss": 1.6756, + "step": 8176 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026722131060246475, + "loss": 1.656, + "step": 8177 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026721359853207495, + "loss": 1.6413, + "step": 8178 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002672058856658695, + "loss": 1.7307, + "step": 8179 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026719817200390077, + "loss": 1.6537, + "step": 8180 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002671904575462211, + "loss": 1.6717, + "step": 8181 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026718274229288295, + "loss": 1.6689, + "step": 8182 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002671750262439386, + "loss": 1.6661, + "step": 8183 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002671673093994405, + "loss": 1.6373, + "step": 8184 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026715959175944103, + "loss": 1.6083, + "step": 8185 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002671518733239926, + "loss": 1.6498, + "step": 8186 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026714415409314756, + "loss": 1.6772, + "step": 8187 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026713643406695844, + "loss": 1.6516, + "step": 8188 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002671287132454775, + "loss": 1.6847, + "step": 8189 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002671209916287572, + "loss": 1.6567, + "step": 8190 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026711326921685, + "loss": 1.6398, + "step": 8191 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026710554600980845, + "loss": 1.6094, + "step": 8192 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002670978220076848, + "loss": 1.6579, + "step": 8193 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026709009721053155, + "loss": 1.6467, + "step": 8194 + }, + { + "epoch": 0.64, + "learning_rate": 0.0002670823716184011, + "loss": 1.6801, + "step": 8195 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026707464523134607, + "loss": 1.6925, + "step": 8196 + }, + { + "epoch": 0.64, + "learning_rate": 0.00026706691804941876, + "loss": 1.6015, + "step": 8197 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002670591900726717, + "loss": 1.6707, + "step": 8198 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002670514613011573, + "loss": 1.692, + "step": 8199 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002670437317349281, + "loss": 1.6843, + "step": 8200 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026703600137403653, + "loss": 1.6931, + "step": 8201 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002670282702185351, + "loss": 1.6605, + "step": 8202 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026702053826847626, + "loss": 1.7114, + "step": 8203 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002670128055239126, + "loss": 1.738, + "step": 8204 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026700507198489657, + "loss": 1.6886, + "step": 8205 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002669973376514806, + "loss": 1.6997, + "step": 8206 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002669896025237173, + "loss": 1.682, + "step": 8207 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002669818666016592, + "loss": 1.6452, + "step": 8208 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026697412988535877, + "loss": 1.6342, + "step": 8209 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026696639237486854, + "loss": 1.6999, + "step": 8210 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026695865407024103, + "loss": 1.6683, + "step": 8211 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026695091497152884, + "loss": 1.6839, + "step": 8212 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026694317507878443, + "loss": 1.6508, + "step": 8213 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026693543439206045, + "loss": 1.7201, + "step": 8214 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002669276929114094, + "loss": 1.5918, + "step": 8215 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002669199506368838, + "loss": 1.6578, + "step": 8216 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026691220756853626, + "loss": 1.7081, + "step": 8217 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002669044637064194, + "loss": 1.6516, + "step": 8218 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026689671905058565, + "loss": 1.659, + "step": 8219 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002668889736010878, + "loss": 1.7127, + "step": 8220 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026688122735797826, + "loss": 1.6691, + "step": 8221 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002668734803213097, + "loss": 1.657, + "step": 8222 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026686573249113467, + "loss": 1.6452, + "step": 8223 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002668579838675058, + "loss": 1.6932, + "step": 8224 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002668502344504758, + "loss": 1.6244, + "step": 8225 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002668424842400971, + "loss": 1.6358, + "step": 8226 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026683473323642245, + "loss": 1.7188, + "step": 8227 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026682698143950444, + "loss": 1.6375, + "step": 8228 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002668192288493957, + "loss": 1.6967, + "step": 8229 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002668114754661488, + "loss": 1.619, + "step": 8230 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026680372128981653, + "loss": 1.6935, + "step": 8231 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002667959663204514, + "loss": 1.7059, + "step": 8232 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026678821055810617, + "loss": 1.677, + "step": 8233 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026678045400283336, + "loss": 1.6652, + "step": 8234 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026677269665468573, + "loss": 1.7097, + "step": 8235 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026676493851371597, + "loss": 1.6849, + "step": 8236 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002667571795799767, + "loss": 1.7036, + "step": 8237 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002667494198535206, + "loss": 1.7169, + "step": 8238 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002667416593344004, + "loss": 1.6571, + "step": 8239 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002667338980226687, + "loss": 1.6894, + "step": 8240 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002667261359183783, + "loss": 1.724, + "step": 8241 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026671837302158177, + "loss": 1.6543, + "step": 8242 + }, + { + "epoch": 0.65, + "learning_rate": 0.000266710609332332, + "loss": 1.6437, + "step": 8243 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026670284485068156, + "loss": 1.6967, + "step": 8244 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002666950795766832, + "loss": 1.6781, + "step": 8245 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002666873135103896, + "loss": 1.6893, + "step": 8246 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026667954665185364, + "loss": 1.6667, + "step": 8247 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002666717790011279, + "loss": 1.6942, + "step": 8248 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026666401055826515, + "loss": 1.7053, + "step": 8249 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026665624132331814, + "loss": 1.6618, + "step": 8250 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026664847129633965, + "loss": 1.6438, + "step": 8251 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026664070047738243, + "loss": 1.6746, + "step": 8252 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026663292886649917, + "loss": 1.6481, + "step": 8253 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002666251564637427, + "loss": 1.6858, + "step": 8254 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026661738326916583, + "loss": 1.6369, + "step": 8255 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026660960928282125, + "loss": 1.6336, + "step": 8256 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002666018345047618, + "loss": 1.6357, + "step": 8257 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026659405893504016, + "loss": 1.6644, + "step": 8258 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026658628257370925, + "loss": 1.7026, + "step": 8259 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002665785054208218, + "loss": 1.662, + "step": 8260 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026657072747643065, + "loss": 1.6901, + "step": 8261 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026656294874058856, + "loss": 1.6461, + "step": 8262 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026655516921334844, + "loss": 1.6739, + "step": 8263 + }, + { + "epoch": 0.65, + "learning_rate": 0.000266547388894763, + "loss": 1.6479, + "step": 8264 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002665396077848851, + "loss": 1.6645, + "step": 8265 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002665318258837676, + "loss": 1.6764, + "step": 8266 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002665240431914633, + "loss": 1.6517, + "step": 8267 + }, + { + "epoch": 0.65, + "learning_rate": 0.000266516259708025, + "loss": 1.6346, + "step": 8268 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026650847543350565, + "loss": 1.6931, + "step": 8269 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026650069036795803, + "loss": 1.6566, + "step": 8270 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026649290451143505, + "loss": 1.6929, + "step": 8271 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026648511786398946, + "loss": 1.6607, + "step": 8272 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002664773304256743, + "loss": 1.6984, + "step": 8273 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026646954219654225, + "loss": 1.7191, + "step": 8274 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026646175317664633, + "loss": 1.6542, + "step": 8275 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002664539633660394, + "loss": 1.6725, + "step": 8276 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026644617276477426, + "loss": 1.6721, + "step": 8277 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002664383813729039, + "loss": 1.6389, + "step": 8278 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026643058919048113, + "loss": 1.6802, + "step": 8279 + }, + { + "epoch": 0.65, + "learning_rate": 0.000266422796217559, + "loss": 1.6876, + "step": 8280 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026641500245419027, + "loss": 1.6566, + "step": 8281 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002664072079004279, + "loss": 1.6901, + "step": 8282 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002663994125563249, + "loss": 1.6545, + "step": 8283 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002663916164219341, + "loss": 1.7002, + "step": 8284 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002663838194973085, + "loss": 1.6741, + "step": 8285 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002663760217825009, + "loss": 1.6725, + "step": 8286 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026636822327756436, + "loss": 1.6481, + "step": 8287 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002663604239825518, + "loss": 1.662, + "step": 8288 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002663526238975162, + "loss": 1.6934, + "step": 8289 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026634482302251045, + "loss": 1.707, + "step": 8290 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026633702135758764, + "loss": 1.6548, + "step": 8291 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026632921890280055, + "loss": 1.6764, + "step": 8292 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026632141565820233, + "loss": 1.7329, + "step": 8293 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026631361162384587, + "loss": 1.6493, + "step": 8294 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026630580679978415, + "loss": 1.6163, + "step": 8295 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002662980011860703, + "loss": 1.6172, + "step": 8296 + }, + { + "epoch": 0.65, + "learning_rate": 0.000266290194782757, + "loss": 1.6617, + "step": 8297 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026628238758989763, + "loss": 1.7009, + "step": 8298 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002662745796075449, + "loss": 1.6803, + "step": 8299 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026626677083575203, + "loss": 1.7159, + "step": 8300 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002662589612745719, + "loss": 1.6922, + "step": 8301 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026625115092405755, + "loss": 1.7139, + "step": 8302 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002662433397842621, + "loss": 1.7275, + "step": 8303 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026623552785523844, + "loss": 1.694, + "step": 8304 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002662277151370398, + "loss": 1.6196, + "step": 8305 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026621990162971907, + "loss": 1.6839, + "step": 8306 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002662120873333293, + "loss": 1.634, + "step": 8307 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002662042722479236, + "loss": 1.6394, + "step": 8308 + }, + { + "epoch": 0.65, + "learning_rate": 0.000266196456373555, + "loss": 1.6342, + "step": 8309 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026618863971027666, + "loss": 1.6422, + "step": 8310 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026618082225814154, + "loss": 1.6554, + "step": 8311 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002661730040172028, + "loss": 1.6395, + "step": 8312 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002661651849875134, + "loss": 1.6323, + "step": 8313 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002661573651691265, + "loss": 1.6714, + "step": 8314 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002661495445620952, + "loss": 1.6925, + "step": 8315 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026614172316647257, + "loss": 1.6729, + "step": 8316 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002661339009823118, + "loss": 1.6832, + "step": 8317 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002661260780096659, + "loss": 1.7196, + "step": 8318 + }, + { + "epoch": 0.65, + "learning_rate": 0.000266118254248588, + "loss": 1.6565, + "step": 8319 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002661104296991312, + "loss": 1.6616, + "step": 8320 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026610260436134867, + "loss": 1.6832, + "step": 8321 + }, + { + "epoch": 0.65, + "learning_rate": 0.0002660947782352936, + "loss": 1.704, + "step": 8322 + }, + { + "epoch": 0.65, + "learning_rate": 0.000266086951321019, + "loss": 1.6945, + "step": 8323 + }, + { + "epoch": 0.65, + "learning_rate": 0.00026607912361857806, + "loss": 1.6688, + "step": 8324 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026607129512802396, + "loss": 1.6707, + "step": 8325 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002660634658494098, + "loss": 1.677, + "step": 8326 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026605563578278873, + "loss": 1.6515, + "step": 8327 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002660478049282139, + "loss": 1.7121, + "step": 8328 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026603997328573866, + "loss": 1.6814, + "step": 8329 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026603214085541596, + "loss": 1.6447, + "step": 8330 + }, + { + "epoch": 0.66, + "learning_rate": 0.000266024307637299, + "loss": 1.6488, + "step": 8331 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002660164736314411, + "loss": 1.64, + "step": 8332 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026600863883789527, + "loss": 1.6875, + "step": 8333 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002660008032567149, + "loss": 1.644, + "step": 8334 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026599296688795305, + "loss": 1.6525, + "step": 8335 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026598512973166296, + "loss": 1.6783, + "step": 8336 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026597729178789786, + "loss": 1.6297, + "step": 8337 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002659694530567109, + "loss": 1.611, + "step": 8338 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026596161353815544, + "loss": 1.6489, + "step": 8339 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026595377323228455, + "loss": 1.6518, + "step": 8340 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002659459321391516, + "loss": 1.6658, + "step": 8341 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026593809025880966, + "loss": 1.6804, + "step": 8342 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026593024759131214, + "loss": 1.6402, + "step": 8343 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002659224041367122, + "loss": 1.6935, + "step": 8344 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026591455989506305, + "loss": 1.6597, + "step": 8345 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026590671486641807, + "loss": 1.6823, + "step": 8346 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002658988690508304, + "loss": 1.6248, + "step": 8347 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026589102244835343, + "loss": 1.7245, + "step": 8348 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026588317505904036, + "loss": 1.705, + "step": 8349 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002658753268829445, + "loss": 1.6995, + "step": 8350 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026586747792011904, + "loss": 1.6596, + "step": 8351 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002658596281706174, + "loss": 1.6667, + "step": 8352 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002658517776344928, + "loss": 1.6669, + "step": 8353 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026584392631179857, + "loss": 1.6361, + "step": 8354 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026583607420258806, + "loss": 1.6692, + "step": 8355 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026582822130691443, + "loss": 1.6462, + "step": 8356 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002658203676248312, + "loss": 1.6447, + "step": 8357 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002658125131563915, + "loss": 1.6897, + "step": 8358 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002658046579016488, + "loss": 1.6642, + "step": 8359 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002657968018606563, + "loss": 1.6773, + "step": 8360 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026578894503346753, + "loss": 1.6764, + "step": 8361 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002657810874201357, + "loss": 1.6803, + "step": 8362 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026577322902071414, + "loss": 1.6672, + "step": 8363 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002657653698352562, + "loss": 1.708, + "step": 8364 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002657575098638154, + "loss": 1.601, + "step": 8365 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002657496491064449, + "loss": 1.6324, + "step": 8366 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002657417875631982, + "loss": 1.6419, + "step": 8367 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002657339252341286, + "loss": 1.6322, + "step": 8368 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002657260621192895, + "loss": 1.6176, + "step": 8369 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026571819821873436, + "loss": 1.7038, + "step": 8370 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002657103335325165, + "loss": 1.6628, + "step": 8371 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002657024680606893, + "loss": 1.6557, + "step": 8372 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026569460180330627, + "loss": 1.6243, + "step": 8373 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026568673476042064, + "loss": 1.7109, + "step": 8374 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026567886693208595, + "loss": 1.6681, + "step": 8375 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026567099831835563, + "loss": 1.6751, + "step": 8376 + }, + { + "epoch": 0.66, + "learning_rate": 0.000265663128919283, + "loss": 1.6669, + "step": 8377 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002656552587349216, + "loss": 1.6589, + "step": 8378 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026564738776532477, + "loss": 1.6917, + "step": 8379 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026563951601054606, + "loss": 1.6356, + "step": 8380 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002656316434706388, + "loss": 1.6733, + "step": 8381 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026562377014565655, + "loss": 1.6497, + "step": 8382 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026561589603565266, + "loss": 1.7125, + "step": 8383 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026560802114068065, + "loss": 1.6177, + "step": 8384 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026560014546079397, + "loss": 1.7079, + "step": 8385 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002655922689960461, + "loss": 1.6908, + "step": 8386 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002655843917464905, + "loss": 1.6496, + "step": 8387 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026557651371218066, + "loss": 1.6109, + "step": 8388 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026556863489317014, + "loss": 1.6428, + "step": 8389 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026556075528951233, + "loss": 1.7128, + "step": 8390 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002655528749012607, + "loss": 1.6237, + "step": 8391 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026554499372846886, + "loss": 1.6684, + "step": 8392 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002655371117711903, + "loss": 1.6629, + "step": 8393 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026552922902947846, + "loss": 1.6865, + "step": 8394 + }, + { + "epoch": 0.66, + "learning_rate": 0.000265521345503387, + "loss": 1.7029, + "step": 8395 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002655134611929692, + "loss": 1.7273, + "step": 8396 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002655055760982789, + "loss": 1.6498, + "step": 8397 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002654976902193694, + "loss": 1.6741, + "step": 8398 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026548980355629436, + "loss": 1.648, + "step": 8399 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002654819161091072, + "loss": 1.6668, + "step": 8400 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026547402787786167, + "loss": 1.7155, + "step": 8401 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026546613886261114, + "loss": 1.669, + "step": 8402 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026545824906340927, + "loss": 1.6135, + "step": 8403 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026545035848030965, + "loss": 1.6831, + "step": 8404 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026544246711336574, + "loss": 1.7165, + "step": 8405 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002654345749626312, + "loss": 1.6393, + "step": 8406 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002654266820281596, + "loss": 1.66, + "step": 8407 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002654187883100045, + "loss": 1.7154, + "step": 8408 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026541089380821954, + "loss": 1.6877, + "step": 8409 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026540299852285834, + "loss": 1.6762, + "step": 8410 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002653951024539745, + "loss": 1.6611, + "step": 8411 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002653872056016215, + "loss": 1.6467, + "step": 8412 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026537930796585306, + "loss": 1.614, + "step": 8413 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002653714095467228, + "loss": 1.6536, + "step": 8414 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026536351034428437, + "loss": 1.7031, + "step": 8415 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026535561035859136, + "loss": 1.6674, + "step": 8416 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026534770958969736, + "loss": 1.6948, + "step": 8417 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002653398080376561, + "loss": 1.6325, + "step": 8418 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002653319057025212, + "loss": 1.6826, + "step": 8419 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002653240025843463, + "loss": 1.667, + "step": 8420 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026531609868318514, + "loss": 1.6913, + "step": 8421 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026530819399909117, + "loss": 1.7037, + "step": 8422 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002653002885321183, + "loss": 1.6514, + "step": 8423 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026529238228232004, + "loss": 1.664, + "step": 8424 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026528447524975016, + "loss": 1.5901, + "step": 8425 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002652765674344623, + "loss": 1.6372, + "step": 8426 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002652686588365101, + "loss": 1.6541, + "step": 8427 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026526074945594746, + "loss": 1.7356, + "step": 8428 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026525283929282784, + "loss": 1.6413, + "step": 8429 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002652449283472051, + "loss": 1.6368, + "step": 8430 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002652370166191328, + "loss": 1.6625, + "step": 8431 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026522910410866485, + "loss": 1.665, + "step": 8432 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002652211908158548, + "loss": 1.6958, + "step": 8433 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002652132767407565, + "loss": 1.6588, + "step": 8434 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026520536188342353, + "loss": 1.6354, + "step": 8435 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026519744624390983, + "loss": 1.6634, + "step": 8436 + }, + { + "epoch": 0.66, + "learning_rate": 0.000265189529822269, + "loss": 1.6731, + "step": 8437 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026518161261855486, + "loss": 1.7163, + "step": 8438 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002651736946328211, + "loss": 1.6209, + "step": 8439 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026516577586512154, + "loss": 1.6977, + "step": 8440 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002651578563155099, + "loss": 1.6857, + "step": 8441 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026514993598404, + "loss": 1.6142, + "step": 8442 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026514201487076554, + "loss": 1.6964, + "step": 8443 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002651340929757404, + "loss": 1.6311, + "step": 8444 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002651261702990182, + "loss": 1.6064, + "step": 8445 + }, + { + "epoch": 0.66, + "learning_rate": 0.00026511824684065285, + "loss": 1.6125, + "step": 8446 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002651103226006982, + "loss": 1.6544, + "step": 8447 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002651023975792079, + "loss": 1.6808, + "step": 8448 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002650944717762359, + "loss": 1.6919, + "step": 8449 + }, + { + "epoch": 0.66, + "learning_rate": 0.000265086545191836, + "loss": 1.6304, + "step": 8450 + }, + { + "epoch": 0.66, + "learning_rate": 0.0002650786178260619, + "loss": 1.687, + "step": 8451 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002650706896789675, + "loss": 1.6451, + "step": 8452 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002650627607506066, + "loss": 1.7084, + "step": 8453 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026505483104103305, + "loss": 1.6544, + "step": 8454 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026504690055030074, + "loss": 1.6533, + "step": 8455 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002650389692784634, + "loss": 1.7324, + "step": 8456 + }, + { + "epoch": 0.67, + "learning_rate": 0.000265031037225575, + "loss": 1.6456, + "step": 8457 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026502310439168933, + "loss": 1.6474, + "step": 8458 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002650151707768602, + "loss": 1.6866, + "step": 8459 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002650072363811416, + "loss": 1.6879, + "step": 8460 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002649993012045873, + "loss": 1.6496, + "step": 8461 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026499136524725124, + "loss": 1.6901, + "step": 8462 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026498342850918717, + "loss": 1.653, + "step": 8463 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002649754909904492, + "loss": 1.6671, + "step": 8464 + }, + { + "epoch": 0.67, + "learning_rate": 0.000264967552691091, + "loss": 1.7339, + "step": 8465 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002649596136111666, + "loss": 1.687, + "step": 8466 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002649516737507298, + "loss": 1.6517, + "step": 8467 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002649437331098347, + "loss": 1.6547, + "step": 8468 + }, + { + "epoch": 0.67, + "learning_rate": 0.000264935791688535, + "loss": 1.634, + "step": 8469 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026492784948688473, + "loss": 1.641, + "step": 8470 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026491990650493775, + "loss": 1.6909, + "step": 8471 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026491196274274804, + "loss": 1.671, + "step": 8472 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026490401820036954, + "loss": 1.7071, + "step": 8473 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002648960728778561, + "loss": 1.616, + "step": 8474 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002648881267752618, + "loss": 1.6281, + "step": 8475 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002648801798926405, + "loss": 1.6565, + "step": 8476 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026487223223004615, + "loss": 1.6198, + "step": 8477 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026486428378753277, + "loss": 1.6405, + "step": 8478 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002648563345651543, + "loss": 1.6636, + "step": 8479 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002648483845629646, + "loss": 1.6774, + "step": 8480 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002648404337810179, + "loss": 1.674, + "step": 8481 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002648324822193679, + "loss": 1.6031, + "step": 8482 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026482452987806876, + "loss": 1.7357, + "step": 8483 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026481657675717443, + "loss": 1.7086, + "step": 8484 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026480862285673895, + "loss": 1.638, + "step": 8485 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002648006681768162, + "loss": 1.6472, + "step": 8486 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002647927127174603, + "loss": 1.6448, + "step": 8487 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026478475647872526, + "loss": 1.6778, + "step": 8488 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026477679946066503, + "loss": 1.686, + "step": 8489 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026476884166333367, + "loss": 1.6773, + "step": 8490 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026476088308678524, + "loss": 1.6357, + "step": 8491 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002647529237310737, + "loss": 1.6686, + "step": 8492 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026474496359625316, + "loss": 1.7053, + "step": 8493 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002647370026823776, + "loss": 1.7029, + "step": 8494 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002647290409895012, + "loss": 1.687, + "step": 8495 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026472107851767786, + "loss": 1.6612, + "step": 8496 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026471311526696174, + "loss": 1.6718, + "step": 8497 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026470515123740683, + "loss": 1.6405, + "step": 8498 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002646971864290672, + "loss": 1.6993, + "step": 8499 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026468922084199706, + "loss": 1.6868, + "step": 8500 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026468125447625036, + "loss": 1.6091, + "step": 8501 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026467328733188126, + "loss": 1.6344, + "step": 8502 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002646653194089438, + "loss": 1.6538, + "step": 8503 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002646573507074921, + "loss": 1.7218, + "step": 8504 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026464938122758026, + "loss": 1.6765, + "step": 8505 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002646414109692624, + "loss": 1.6668, + "step": 8506 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002646334399325926, + "loss": 1.6509, + "step": 8507 + }, + { + "epoch": 0.67, + "learning_rate": 0.000264625468117625, + "loss": 1.6812, + "step": 8508 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026461749552441374, + "loss": 1.6961, + "step": 8509 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026460952215301295, + "loss": 1.6497, + "step": 8510 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026460154800347674, + "loss": 1.68, + "step": 8511 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026459357307585926, + "loss": 1.6464, + "step": 8512 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002645855973702146, + "loss": 1.647, + "step": 8513 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026457762088659707, + "loss": 1.6499, + "step": 8514 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026456964362506067, + "loss": 1.6893, + "step": 8515 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026456166558565963, + "loss": 1.6394, + "step": 8516 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002645536867684481, + "loss": 1.6482, + "step": 8517 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026454570717348024, + "loss": 1.6966, + "step": 8518 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026453772680081026, + "loss": 1.6507, + "step": 8519 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002645297456504923, + "loss": 1.6653, + "step": 8520 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026452176372258055, + "loss": 1.6944, + "step": 8521 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002645137810171293, + "loss": 1.6271, + "step": 8522 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002645057975341926, + "loss": 1.6714, + "step": 8523 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026449781327382473, + "loss": 1.6707, + "step": 8524 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026448982823607995, + "loss": 1.6867, + "step": 8525 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026448184242101235, + "loss": 1.6663, + "step": 8526 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026447385582867625, + "loss": 1.6422, + "step": 8527 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002644658684591258, + "loss": 1.7278, + "step": 8528 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002644578803124153, + "loss": 1.6775, + "step": 8529 + }, + { + "epoch": 0.67, + "learning_rate": 0.000264449891388599, + "loss": 1.6381, + "step": 8530 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026444190168773107, + "loss": 1.6752, + "step": 8531 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026443391120986576, + "loss": 1.7161, + "step": 8532 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002644259199550573, + "loss": 1.7003, + "step": 8533 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002644179279233601, + "loss": 1.6784, + "step": 8534 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026440993511482825, + "loss": 1.6909, + "step": 8535 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002644019415295161, + "loss": 1.6109, + "step": 8536 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026439394716747783, + "loss": 1.6494, + "step": 8537 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026438595202876784, + "loss": 1.6344, + "step": 8538 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002643779561134403, + "loss": 1.643, + "step": 8539 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002643699594215496, + "loss": 1.6795, + "step": 8540 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026436196195315007, + "loss": 1.6915, + "step": 8541 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026435396370829583, + "loss": 1.6444, + "step": 8542 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002643459646870413, + "loss": 1.6811, + "step": 8543 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026433796488944077, + "loss": 1.661, + "step": 8544 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002643299643155486, + "loss": 1.6509, + "step": 8545 + }, + { + "epoch": 0.67, + "learning_rate": 0.000264321962965419, + "loss": 1.6098, + "step": 8546 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026431396083910643, + "loss": 1.672, + "step": 8547 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026430595793666505, + "loss": 1.7108, + "step": 8548 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026429795425814937, + "loss": 1.721, + "step": 8549 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026428994980361365, + "loss": 1.6781, + "step": 8550 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026428194457311227, + "loss": 1.6106, + "step": 8551 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002642739385666995, + "loss": 1.6463, + "step": 8552 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026426593178442974, + "loss": 1.6935, + "step": 8553 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002642579242263574, + "loss": 1.6907, + "step": 8554 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026424991589253676, + "loss": 1.6893, + "step": 8555 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002642419067830223, + "loss": 1.6331, + "step": 8556 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002642338968978683, + "loss": 1.6651, + "step": 8557 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002642258862371292, + "loss": 1.6471, + "step": 8558 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002642178748008594, + "loss": 1.6479, + "step": 8559 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026420986258911315, + "loss": 1.633, + "step": 8560 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026420184960194504, + "loss": 1.6699, + "step": 8561 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002641938358394094, + "loss": 1.6401, + "step": 8562 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026418582130156057, + "loss": 1.6835, + "step": 8563 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002641778059884531, + "loss": 1.6368, + "step": 8564 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002641697899001413, + "loss": 1.6757, + "step": 8565 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002641617730366796, + "loss": 1.6136, + "step": 8566 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026415375539812246, + "loss": 1.6893, + "step": 8567 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002641457369845244, + "loss": 1.6831, + "step": 8568 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002641377177959397, + "loss": 1.677, + "step": 8569 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002641296978324229, + "loss": 1.6502, + "step": 8570 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026412167709402844, + "loss": 1.6782, + "step": 8571 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002641136555808108, + "loss": 1.683, + "step": 8572 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026410563329282437, + "loss": 1.5964, + "step": 8573 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002640976102301237, + "loss": 1.6773, + "step": 8574 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026408958639276313, + "loss": 1.71, + "step": 8575 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026408156178079733, + "loss": 1.6183, + "step": 8576 + }, + { + "epoch": 0.67, + "learning_rate": 0.00026407353639428064, + "loss": 1.6826, + "step": 8577 + }, + { + "epoch": 0.67, + "learning_rate": 0.0002640655102332676, + "loss": 1.6655, + "step": 8578 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002640574832978127, + "loss": 1.6226, + "step": 8579 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002640494555879703, + "loss": 1.6785, + "step": 8580 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002640414271037952, + "loss": 1.6507, + "step": 8581 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002640333978453417, + "loss": 1.7058, + "step": 8582 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026402536781266437, + "loss": 1.6429, + "step": 8583 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002640173370058177, + "loss": 1.6398, + "step": 8584 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002640093054248562, + "loss": 1.6859, + "step": 8585 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002640012730698345, + "loss": 1.6709, + "step": 8586 + }, + { + "epoch": 0.68, + "learning_rate": 0.000263993239940807, + "loss": 1.6681, + "step": 8587 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002639852060378283, + "loss": 1.7115, + "step": 8588 + }, + { + "epoch": 0.68, + "learning_rate": 0.000263977171360953, + "loss": 1.6381, + "step": 8589 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002639691359102356, + "loss": 1.6652, + "step": 8590 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026396109968573065, + "loss": 1.6606, + "step": 8591 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002639530626874927, + "loss": 1.6481, + "step": 8592 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002639450249155764, + "loss": 1.6273, + "step": 8593 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002639369863700362, + "loss": 1.6437, + "step": 8594 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026392894705092675, + "loss": 1.6717, + "step": 8595 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026392090695830263, + "loss": 1.7021, + "step": 8596 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026391286609221844, + "loss": 1.6918, + "step": 8597 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002639048244527287, + "loss": 1.6659, + "step": 8598 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002638967820398881, + "loss": 1.6215, + "step": 8599 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002638887388537512, + "loss": 1.6561, + "step": 8600 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002638806948943726, + "loss": 1.6738, + "step": 8601 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026387265016180694, + "loss": 1.7176, + "step": 8602 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002638646046561088, + "loss": 1.6061, + "step": 8603 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002638565583773329, + "loss": 1.6535, + "step": 8604 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026384851132553374, + "loss": 1.6781, + "step": 8605 + }, + { + "epoch": 0.68, + "learning_rate": 0.000263840463500766, + "loss": 1.7042, + "step": 8606 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026383241490308436, + "loss": 1.6322, + "step": 8607 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002638243655325435, + "loss": 1.6831, + "step": 8608 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002638163153891979, + "loss": 1.6606, + "step": 8609 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026380826447310236, + "loss": 1.6275, + "step": 8610 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026380021278431156, + "loss": 1.6614, + "step": 8611 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002637921603228801, + "loss": 1.6566, + "step": 8612 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026378410708886266, + "loss": 1.6713, + "step": 8613 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002637760530823139, + "loss": 1.6528, + "step": 8614 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026376799830328854, + "loss": 1.6974, + "step": 8615 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026375994275184124, + "loss": 1.6293, + "step": 8616 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002637518864280267, + "loss": 1.6755, + "step": 8617 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026374382933189963, + "loss": 1.6758, + "step": 8618 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026373577146351473, + "loss": 1.6582, + "step": 8619 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002637277128229268, + "loss": 1.6893, + "step": 8620 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002637196534101903, + "loss": 1.6503, + "step": 8621 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026371159322536024, + "loss": 1.7044, + "step": 8622 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026370353226849117, + "loss": 1.6636, + "step": 8623 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026369547053963784, + "loss": 1.6077, + "step": 8624 + }, + { + "epoch": 0.68, + "learning_rate": 0.000263687408038855, + "loss": 1.6674, + "step": 8625 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002636793447661974, + "loss": 1.6809, + "step": 8626 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026367128072171984, + "loss": 1.5994, + "step": 8627 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026366321590547695, + "loss": 1.6816, + "step": 8628 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002636551503175236, + "loss": 1.608, + "step": 8629 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026364708395791445, + "loss": 1.6375, + "step": 8630 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026363901682670434, + "loss": 1.6741, + "step": 8631 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026363094892394804, + "loss": 1.643, + "step": 8632 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026362288024970026, + "loss": 1.6062, + "step": 8633 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026361481080401585, + "loss": 1.6397, + "step": 8634 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026360674058694956, + "loss": 1.608, + "step": 8635 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002635986695985562, + "loss": 1.6925, + "step": 8636 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002635905978388906, + "loss": 1.6409, + "step": 8637 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002635825253080075, + "loss": 1.6401, + "step": 8638 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026357445200596167, + "loss": 1.6671, + "step": 8639 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026356637793280806, + "loss": 1.5894, + "step": 8640 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002635583030886014, + "loss": 1.5897, + "step": 8641 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002635502274733965, + "loss": 1.6346, + "step": 8642 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026354215108724825, + "loss": 1.6903, + "step": 8643 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026353407393021145, + "loss": 1.6523, + "step": 8644 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002635259960023409, + "loss": 1.6415, + "step": 8645 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002635179173036915, + "loss": 1.7182, + "step": 8646 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026350983783431813, + "loss": 1.6995, + "step": 8647 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002635017575942756, + "loss": 1.6414, + "step": 8648 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002634936765836187, + "loss": 1.7108, + "step": 8649 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002634855948024024, + "loss": 1.72, + "step": 8650 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026347751225068157, + "loss": 1.6993, + "step": 8651 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002634694289285111, + "loss": 1.6653, + "step": 8652 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026346134483594576, + "loss": 1.7251, + "step": 8653 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026345325997304046, + "loss": 1.6401, + "step": 8654 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002634451743398502, + "loss": 1.6432, + "step": 8655 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002634370879364298, + "loss": 1.6281, + "step": 8656 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002634290007628341, + "loss": 1.6793, + "step": 8657 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002634209128191182, + "loss": 1.6376, + "step": 8658 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002634128241053368, + "loss": 1.6209, + "step": 8659 + }, + { + "epoch": 0.68, + "learning_rate": 0.000263404734621545, + "loss": 1.6903, + "step": 8660 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002633966443677975, + "loss": 1.7004, + "step": 8661 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026338855334414945, + "loss": 1.7039, + "step": 8662 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026338046155065573, + "loss": 1.6571, + "step": 8663 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026337236898737115, + "loss": 1.6774, + "step": 8664 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026336427565435083, + "loss": 1.6875, + "step": 8665 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026335618155164955, + "loss": 1.6614, + "step": 8666 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026334808667932247, + "loss": 1.6347, + "step": 8667 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026333999103742435, + "loss": 1.65, + "step": 8668 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026333189462601027, + "loss": 1.6786, + "step": 8669 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026332379744513514, + "loss": 1.6837, + "step": 8670 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026331569949485394, + "loss": 1.6444, + "step": 8671 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002633076007752218, + "loss": 1.6394, + "step": 8672 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026329950128629344, + "loss": 1.6727, + "step": 8673 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026329140102812404, + "loss": 1.6672, + "step": 8674 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026328330000076854, + "loss": 1.6838, + "step": 8675 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026327519820428197, + "loss": 1.6208, + "step": 8676 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002632670956387193, + "loss": 1.6347, + "step": 8677 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026325899230413555, + "loss": 1.6809, + "step": 8678 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026325088820058575, + "loss": 1.6192, + "step": 8679 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002632427833281249, + "loss": 1.6772, + "step": 8680 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002632346776868081, + "loss": 1.698, + "step": 8681 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002632265712766902, + "loss": 1.6756, + "step": 8682 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026321846409782653, + "loss": 1.6565, + "step": 8683 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002632103561502718, + "loss": 1.6132, + "step": 8684 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002632022474340814, + "loss": 1.6934, + "step": 8685 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002631941379493101, + "loss": 1.6907, + "step": 8686 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026318602769601307, + "loss": 1.699, + "step": 8687 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026317791667424537, + "loss": 1.7099, + "step": 8688 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002631698048840622, + "loss": 1.6851, + "step": 8689 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026316169232551835, + "loss": 1.6386, + "step": 8690 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002631535789986691, + "loss": 1.6859, + "step": 8691 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026314546490356953, + "loss": 1.6927, + "step": 8692 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026313735004027464, + "loss": 1.6372, + "step": 8693 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026312923440883964, + "loss": 1.6303, + "step": 8694 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002631211180093195, + "loss": 1.662, + "step": 8695 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026311300084176946, + "loss": 1.6187, + "step": 8696 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026310488290624454, + "loss": 1.6637, + "step": 8697 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002630967642027999, + "loss": 1.6895, + "step": 8698 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026308864473149055, + "loss": 1.6791, + "step": 8699 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002630805244923718, + "loss": 1.6612, + "step": 8700 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002630724034854987, + "loss": 1.6512, + "step": 8701 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002630642817109263, + "loss": 1.6444, + "step": 8702 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026305615916870985, + "loss": 1.6451, + "step": 8703 + }, + { + "epoch": 0.68, + "learning_rate": 0.0002630480358589045, + "loss": 1.6203, + "step": 8704 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026303991178156536, + "loss": 1.6664, + "step": 8705 + }, + { + "epoch": 0.68, + "learning_rate": 0.00026303178693674764, + "loss": 1.6894, + "step": 8706 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026302366132450637, + "loss": 1.621, + "step": 8707 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002630155349448969, + "loss": 1.6409, + "step": 8708 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002630074077979742, + "loss": 1.7074, + "step": 8709 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002629992798837937, + "loss": 1.7262, + "step": 8710 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026299115120241036, + "loss": 1.6874, + "step": 8711 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002629830217538795, + "loss": 1.6558, + "step": 8712 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002629748915382562, + "loss": 1.6414, + "step": 8713 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002629667605555958, + "loss": 1.6961, + "step": 8714 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026295862880595347, + "loss": 1.6513, + "step": 8715 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026295049628938434, + "loss": 1.6567, + "step": 8716 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026294236300594367, + "loss": 1.6563, + "step": 8717 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002629342289556867, + "loss": 1.6486, + "step": 8718 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002629260941386686, + "loss": 1.6909, + "step": 8719 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026291795855494466, + "loss": 1.6562, + "step": 8720 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002629098222045701, + "loss": 1.6452, + "step": 8721 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026290168508760016, + "loss": 1.7005, + "step": 8722 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002628935472040901, + "loss": 1.652, + "step": 8723 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002628854085540951, + "loss": 1.6648, + "step": 8724 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026287726913767044, + "loss": 1.706, + "step": 8725 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002628691289548715, + "loss": 1.6627, + "step": 8726 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026286098800575345, + "loss": 1.6738, + "step": 8727 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026285284629037155, + "loss": 1.6403, + "step": 8728 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026284470380878115, + "loss": 1.7123, + "step": 8729 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002628365605610374, + "loss": 1.691, + "step": 8730 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002628284165471957, + "loss": 1.6401, + "step": 8731 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002628202717673113, + "loss": 1.6364, + "step": 8732 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026281212622143957, + "loss": 1.6665, + "step": 8733 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026280397990963573, + "loss": 1.7127, + "step": 8734 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002627958328319551, + "loss": 1.6302, + "step": 8735 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026278768498845306, + "loss": 1.7086, + "step": 8736 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026277953637918487, + "loss": 1.6277, + "step": 8737 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026277138700420583, + "loss": 1.6057, + "step": 8738 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026276323686357135, + "loss": 1.6379, + "step": 8739 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002627550859573366, + "loss": 1.6342, + "step": 8740 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002627469342855572, + "loss": 1.6334, + "step": 8741 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026273878184828825, + "loss": 1.6526, + "step": 8742 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002627306286455852, + "loss": 1.6416, + "step": 8743 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026272247467750337, + "loss": 1.5685, + "step": 8744 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026271431994409817, + "loss": 1.6743, + "step": 8745 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002627061644454249, + "loss": 1.6429, + "step": 8746 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026269800818153906, + "loss": 1.6921, + "step": 8747 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026268985115249585, + "loss": 1.7483, + "step": 8748 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002626816933583508, + "loss": 1.639, + "step": 8749 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026267353479915916, + "loss": 1.6756, + "step": 8750 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026266537547497645, + "loss": 1.6295, + "step": 8751 + }, + { + "epoch": 0.69, + "learning_rate": 0.000262657215385858, + "loss": 1.6294, + "step": 8752 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002626490545318592, + "loss": 1.6263, + "step": 8753 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002626408929130355, + "loss": 1.6534, + "step": 8754 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026263273052944233, + "loss": 1.6365, + "step": 8755 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026262456738113506, + "loss": 1.6568, + "step": 8756 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026261640346816916, + "loss": 1.6515, + "step": 8757 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002626082387906, + "loss": 1.6525, + "step": 8758 + }, + { + "epoch": 0.69, + "learning_rate": 0.000262600073348483, + "loss": 1.6226, + "step": 8759 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026259190714187367, + "loss": 1.6437, + "step": 8760 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002625837401708274, + "loss": 1.6137, + "step": 8761 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002625755724353997, + "loss": 1.6618, + "step": 8762 + }, + { + "epoch": 0.69, + "learning_rate": 0.000262567403935646, + "loss": 1.6705, + "step": 8763 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002625592346716217, + "loss": 1.634, + "step": 8764 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026255106464338236, + "loss": 1.6698, + "step": 8765 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026254289385098335, + "loss": 1.6321, + "step": 8766 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002625347222944803, + "loss": 1.652, + "step": 8767 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002625265499739285, + "loss": 1.6549, + "step": 8768 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026251837688938347, + "loss": 1.6767, + "step": 8769 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026251020304090086, + "loss": 1.6521, + "step": 8770 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026250202842853596, + "loss": 1.5983, + "step": 8771 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002624938530523445, + "loss": 1.6327, + "step": 8772 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026248567691238174, + "loss": 1.7048, + "step": 8773 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002624775000087034, + "loss": 1.681, + "step": 8774 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026246932234136485, + "loss": 1.7397, + "step": 8775 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026246114391042163, + "loss": 1.708, + "step": 8776 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002624529647159294, + "loss": 1.6257, + "step": 8777 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026244478475794355, + "loss": 1.6826, + "step": 8778 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026243660403651965, + "loss": 1.6339, + "step": 8779 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002624284225517133, + "loss": 1.6081, + "step": 8780 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002624202403035799, + "loss": 1.6687, + "step": 8781 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002624120572921752, + "loss": 1.7141, + "step": 8782 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026240387351755465, + "loss": 1.6584, + "step": 8783 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002623956889797738, + "loss": 1.6685, + "step": 8784 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002623875036788883, + "loss": 1.6172, + "step": 8785 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026237931761495363, + "loss": 1.6042, + "step": 8786 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002623711307880254, + "loss": 1.6878, + "step": 8787 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026236294319815926, + "loss": 1.699, + "step": 8788 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026235475484541064, + "loss": 1.6354, + "step": 8789 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026234656572983537, + "loss": 1.6744, + "step": 8790 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026233837585148886, + "loss": 1.669, + "step": 8791 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002623301852104267, + "loss": 1.6822, + "step": 8792 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026232199380670467, + "loss": 1.6185, + "step": 8793 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026231380164037823, + "loss": 1.7071, + "step": 8794 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002623056087115031, + "loss": 1.6689, + "step": 8795 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026229741502013484, + "loss": 1.6542, + "step": 8796 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026228922056632906, + "loss": 1.5947, + "step": 8797 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002622810253501415, + "loss": 1.659, + "step": 8798 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002622728293716277, + "loss": 1.7103, + "step": 8799 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002622646326308434, + "loss": 1.653, + "step": 8800 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002622564351278441, + "loss": 1.6607, + "step": 8801 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026224823686268563, + "loss": 1.7031, + "step": 8802 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026224003783542355, + "loss": 1.6192, + "step": 8803 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002622318380461136, + "loss": 1.6708, + "step": 8804 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026222363749481135, + "loss": 1.6208, + "step": 8805 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002622154361815726, + "loss": 1.6806, + "step": 8806 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002622072341064529, + "loss": 1.605, + "step": 8807 + }, + { + "epoch": 0.69, + "learning_rate": 0.000262199031269508, + "loss": 1.6771, + "step": 8808 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002621908276707936, + "loss": 1.633, + "step": 8809 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002621826233103654, + "loss": 1.5956, + "step": 8810 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002621744181882791, + "loss": 1.6823, + "step": 8811 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002621662123045904, + "loss": 1.6577, + "step": 8812 + }, + { + "epoch": 0.69, + "learning_rate": 0.000262158005659355, + "loss": 1.7249, + "step": 8813 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002621497982526287, + "loss": 1.6074, + "step": 8814 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026214159008446704, + "loss": 1.6679, + "step": 8815 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026213338115492593, + "loss": 1.6363, + "step": 8816 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002621251714640611, + "loss": 1.6787, + "step": 8817 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026211696101192814, + "loss": 1.6321, + "step": 8818 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026210874979858297, + "loss": 1.7233, + "step": 8819 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002621005378240812, + "loss": 1.6847, + "step": 8820 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026209232508847866, + "loss": 1.6527, + "step": 8821 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002620841115918311, + "loss": 1.6794, + "step": 8822 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002620758973341942, + "loss": 1.6254, + "step": 8823 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002620676823156239, + "loss": 1.6423, + "step": 8824 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026205946653617583, + "loss": 1.6624, + "step": 8825 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002620512499959059, + "loss": 1.7093, + "step": 8826 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002620430326948697, + "loss": 1.6684, + "step": 8827 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026203481463312324, + "loss": 1.6841, + "step": 8828 + }, + { + "epoch": 0.69, + "learning_rate": 0.00026202659581072216, + "loss": 1.6046, + "step": 8829 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002620183762277223, + "loss": 1.6457, + "step": 8830 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002620101558841795, + "loss": 1.7032, + "step": 8831 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002620019347801496, + "loss": 1.6418, + "step": 8832 + }, + { + "epoch": 0.69, + "learning_rate": 0.0002619937129156883, + "loss": 1.6511, + "step": 8833 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026198549029085154, + "loss": 1.6541, + "step": 8834 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026197726690569507, + "loss": 1.642, + "step": 8835 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026196904276027473, + "loss": 1.6489, + "step": 8836 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026196081785464647, + "loss": 1.6572, + "step": 8837 + }, + { + "epoch": 0.7, + "learning_rate": 0.000261952592188866, + "loss": 1.7017, + "step": 8838 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026194436576298914, + "loss": 1.6042, + "step": 8839 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002619361385770719, + "loss": 1.6689, + "step": 8840 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026192791063117004, + "loss": 1.6472, + "step": 8841 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002619196819253394, + "loss": 1.6515, + "step": 8842 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026191145245963587, + "loss": 1.7106, + "step": 8843 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026190322223411535, + "loss": 1.6475, + "step": 8844 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026189499124883376, + "loss": 1.6444, + "step": 8845 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002618867595038469, + "loss": 1.6468, + "step": 8846 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026187852699921066, + "loss": 1.6189, + "step": 8847 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026187029373498093, + "loss": 1.6704, + "step": 8848 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002618620597112137, + "loss": 1.6431, + "step": 8849 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002618538249279648, + "loss": 1.6163, + "step": 8850 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002618455893852901, + "loss": 1.6895, + "step": 8851 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026183735308324565, + "loss": 1.6458, + "step": 8852 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002618291160218873, + "loss": 1.6668, + "step": 8853 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002618208782012709, + "loss": 1.6292, + "step": 8854 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002618126396214525, + "loss": 1.7078, + "step": 8855 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026180440028248796, + "loss": 1.628, + "step": 8856 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002617961601844332, + "loss": 1.6727, + "step": 8857 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002617879193273442, + "loss": 1.6696, + "step": 8858 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026177967771127703, + "loss": 1.706, + "step": 8859 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002617714353362874, + "loss": 1.6659, + "step": 8860 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002617631922024315, + "loss": 1.5907, + "step": 8861 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026175494830976513, + "loss": 1.6477, + "step": 8862 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002617467036583444, + "loss": 1.6526, + "step": 8863 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002617384582482252, + "loss": 1.6614, + "step": 8864 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026173021207946353, + "loss": 1.6608, + "step": 8865 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002617219651521153, + "loss": 1.6157, + "step": 8866 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026171371746623666, + "loss": 1.6491, + "step": 8867 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026170546902188355, + "loss": 1.751, + "step": 8868 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002616972198191119, + "loss": 1.6584, + "step": 8869 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002616889698579778, + "loss": 1.6008, + "step": 8870 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026168071913853716, + "loss": 1.5715, + "step": 8871 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026167246766084615, + "loss": 1.622, + "step": 8872 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002616642154249607, + "loss": 1.628, + "step": 8873 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002616559624309368, + "loss": 1.6638, + "step": 8874 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002616477086788305, + "loss": 1.6578, + "step": 8875 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026163945416869796, + "loss": 1.6256, + "step": 8876 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002616311989005951, + "loss": 1.6469, + "step": 8877 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026162294287457804, + "loss": 1.6976, + "step": 8878 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026161468609070277, + "loss": 1.7056, + "step": 8879 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026160642854902537, + "loss": 1.6637, + "step": 8880 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002615981702496019, + "loss": 1.6656, + "step": 8881 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002615899111924884, + "loss": 1.6816, + "step": 8882 + }, + { + "epoch": 0.7, + "learning_rate": 0.000261581651377741, + "loss": 1.6265, + "step": 8883 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002615733908054159, + "loss": 1.6813, + "step": 8884 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002615651294755689, + "loss": 1.6401, + "step": 8885 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002615568673882563, + "loss": 1.6281, + "step": 8886 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026154860454353406, + "loss": 1.693, + "step": 8887 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026154034094145844, + "loss": 1.6396, + "step": 8888 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026153207658208543, + "loss": 1.7, + "step": 8889 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026152381146547115, + "loss": 1.6635, + "step": 8890 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002615155455916717, + "loss": 1.6973, + "step": 8891 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002615072789607433, + "loss": 1.6575, + "step": 8892 + }, + { + "epoch": 0.7, + "learning_rate": 0.000261499011572742, + "loss": 1.6669, + "step": 8893 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002614907434277239, + "loss": 1.6565, + "step": 8894 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002614824745257452, + "loss": 1.7059, + "step": 8895 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026147420486686207, + "loss": 1.666, + "step": 8896 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002614659344511305, + "loss": 1.6792, + "step": 8897 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026145766327860683, + "loss": 1.6696, + "step": 8898 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026144939134934716, + "loss": 1.6722, + "step": 8899 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026144111866340756, + "loss": 1.6576, + "step": 8900 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002614328452208443, + "loss": 1.6609, + "step": 8901 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002614245710217135, + "loss": 1.6514, + "step": 8902 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026141629606607134, + "loss": 1.6917, + "step": 8903 + }, + { + "epoch": 0.7, + "learning_rate": 0.000261408020353974, + "loss": 1.695, + "step": 8904 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026139974388547773, + "loss": 1.6117, + "step": 8905 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026139146666063866, + "loss": 1.6455, + "step": 8906 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026138318867951295, + "loss": 1.6652, + "step": 8907 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026137490994215687, + "loss": 1.6562, + "step": 8908 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026136663044862664, + "loss": 1.6286, + "step": 8909 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002613583501989785, + "loss": 1.6391, + "step": 8910 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026135006919326856, + "loss": 1.6757, + "step": 8911 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026134178743155307, + "loss": 1.6743, + "step": 8912 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002613335049138883, + "loss": 1.6758, + "step": 8913 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002613252216403305, + "loss": 1.6471, + "step": 8914 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002613169376109359, + "loss": 1.6035, + "step": 8915 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026130865282576065, + "loss": 1.6493, + "step": 8916 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002613003672848611, + "loss": 1.6333, + "step": 8917 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026129208098829354, + "loss": 1.6818, + "step": 8918 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002612837939361141, + "loss": 1.6977, + "step": 8919 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002612755061283791, + "loss": 1.7199, + "step": 8920 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026126721756514486, + "loss": 1.6949, + "step": 8921 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002612589282464676, + "loss": 1.6815, + "step": 8922 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026125063817240363, + "loss": 1.6224, + "step": 8923 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026124234734300924, + "loss": 1.5872, + "step": 8924 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002612340557583406, + "loss": 1.6515, + "step": 8925 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002612257634184542, + "loss": 1.6311, + "step": 8926 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002612174703234062, + "loss": 1.6006, + "step": 8927 + }, + { + "epoch": 0.7, + "learning_rate": 0.000261209176473253, + "loss": 1.6888, + "step": 8928 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002612008818680508, + "loss": 1.631, + "step": 8929 + }, + { + "epoch": 0.7, + "learning_rate": 0.000261192586507856, + "loss": 1.6433, + "step": 8930 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002611842903927249, + "loss": 1.6595, + "step": 8931 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026117599352271385, + "loss": 1.7044, + "step": 8932 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002611676958978791, + "loss": 1.6102, + "step": 8933 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002611593975182771, + "loss": 1.6546, + "step": 8934 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002611510983839641, + "loss": 1.7387, + "step": 8935 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026114279849499654, + "loss": 1.6446, + "step": 8936 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026113449785143065, + "loss": 1.6597, + "step": 8937 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026112619645332283, + "loss": 1.6834, + "step": 8938 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002611178943007295, + "loss": 1.6538, + "step": 8939 + }, + { + "epoch": 0.7, + "learning_rate": 0.000261109591393707, + "loss": 1.7417, + "step": 8940 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002611012877323117, + "loss": 1.6459, + "step": 8941 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002610929833165999, + "loss": 1.6095, + "step": 8942 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002610846781466281, + "loss": 1.6754, + "step": 8943 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026107637222245263, + "loss": 1.6623, + "step": 8944 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002610680655441299, + "loss": 1.6512, + "step": 8945 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026105975811171626, + "loss": 1.6974, + "step": 8946 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002610514499252682, + "loss": 1.6833, + "step": 8947 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026104314098484205, + "loss": 1.6398, + "step": 8948 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002610348312904942, + "loss": 1.6039, + "step": 8949 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026102652084228123, + "loss": 1.67, + "step": 8950 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002610182096402594, + "loss": 1.6378, + "step": 8951 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026100989768448516, + "loss": 1.6719, + "step": 8952 + }, + { + "epoch": 0.7, + "learning_rate": 0.000261001584975015, + "loss": 1.6526, + "step": 8953 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002609932715119053, + "loss": 1.6509, + "step": 8954 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026098495729521263, + "loss": 1.7062, + "step": 8955 + }, + { + "epoch": 0.7, + "learning_rate": 0.0002609766423249933, + "loss": 1.6363, + "step": 8956 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026096832660130377, + "loss": 1.6303, + "step": 8957 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026096001012420055, + "loss": 1.6906, + "step": 8958 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026095169289374015, + "loss": 1.695, + "step": 8959 + }, + { + "epoch": 0.7, + "learning_rate": 0.00026094337490997896, + "loss": 1.6024, + "step": 8960 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026093505617297345, + "loss": 1.6761, + "step": 8961 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026092673668278013, + "loss": 1.6675, + "step": 8962 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002609184164394555, + "loss": 1.6458, + "step": 8963 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026091009544305607, + "loss": 1.7007, + "step": 8964 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002609017736936382, + "loss": 1.6425, + "step": 8965 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026089345119125856, + "loss": 1.6744, + "step": 8966 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002608851279359736, + "loss": 1.7085, + "step": 8967 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002608768039278397, + "loss": 1.6471, + "step": 8968 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026086847916691365, + "loss": 1.6222, + "step": 8969 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026086015365325165, + "loss": 1.6444, + "step": 8970 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002608518273869105, + "loss": 1.6697, + "step": 8971 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026084350036794654, + "loss": 1.6015, + "step": 8972 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026083517259641644, + "loss": 1.6528, + "step": 8973 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026082684407237664, + "loss": 1.6863, + "step": 8974 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002608185147958838, + "loss": 1.6691, + "step": 8975 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002608101847669943, + "loss": 1.6282, + "step": 8976 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002608018539857648, + "loss": 1.6683, + "step": 8977 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002607935224522519, + "loss": 1.6365, + "step": 8978 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002607851901665122, + "loss": 1.6099, + "step": 8979 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002607768571286021, + "loss": 1.678, + "step": 8980 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026076852333857824, + "loss": 1.6629, + "step": 8981 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002607601887964973, + "loss": 1.656, + "step": 8982 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002607518535024158, + "loss": 1.667, + "step": 8983 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002607435174563903, + "loss": 1.6252, + "step": 8984 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026073518065847744, + "loss": 1.6009, + "step": 8985 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026072684310873384, + "loss": 1.6241, + "step": 8986 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026071850480721605, + "loss": 1.7118, + "step": 8987 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026071016575398073, + "loss": 1.5982, + "step": 8988 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002607018259490844, + "loss": 1.6285, + "step": 8989 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026069348539258387, + "loss": 1.6529, + "step": 8990 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026068514408453567, + "loss": 1.626, + "step": 8991 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002606768020249963, + "loss": 1.684, + "step": 8992 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002606684592140226, + "loss": 1.7219, + "step": 8993 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026066011565167114, + "loss": 1.6288, + "step": 8994 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002606517713379985, + "loss": 1.6826, + "step": 8995 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026064342627306146, + "loss": 1.6557, + "step": 8996 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026063508045691663, + "loss": 1.654, + "step": 8997 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026062673388962065, + "loss": 1.6171, + "step": 8998 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002606183865712301, + "loss": 1.6659, + "step": 8999 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002606100385018019, + "loss": 1.6526, + "step": 9000 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026060168968139246, + "loss": 1.6561, + "step": 9001 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026059334011005865, + "loss": 1.6565, + "step": 9002 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026058498978785705, + "loss": 1.6448, + "step": 9003 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026057663871484435, + "loss": 1.6793, + "step": 9004 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002605682868910774, + "loss": 1.6565, + "step": 9005 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026055993431661274, + "loss": 1.6452, + "step": 9006 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026055158099150716, + "loss": 1.6375, + "step": 9007 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002605432269158173, + "loss": 1.6418, + "step": 9008 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002605348720896, + "loss": 1.6654, + "step": 9009 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002605265165129119, + "loss": 1.6605, + "step": 9010 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002605181601858097, + "loss": 1.6509, + "step": 9011 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002605098031083502, + "loss": 1.6323, + "step": 9012 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002605014452805902, + "loss": 1.6409, + "step": 9013 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002604930867025863, + "loss": 1.6394, + "step": 9014 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026048472737439526, + "loss": 1.6625, + "step": 9015 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026047636729607397, + "loss": 1.6863, + "step": 9016 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002604680064676791, + "loss": 1.6719, + "step": 9017 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026045964488926747, + "loss": 1.674, + "step": 9018 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002604512825608957, + "loss": 1.7074, + "step": 9019 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026044291948262074, + "loss": 1.6664, + "step": 9020 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026043455565449933, + "loss": 1.6716, + "step": 9021 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026042619107658816, + "loss": 1.6631, + "step": 9022 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026041782574894414, + "loss": 1.6812, + "step": 9023 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026040945967162397, + "loss": 1.6625, + "step": 9024 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002604010928446846, + "loss": 1.6647, + "step": 9025 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002603927252681826, + "loss": 1.6525, + "step": 9026 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026038435694217504, + "loss": 1.6624, + "step": 9027 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002603759878667185, + "loss": 1.6841, + "step": 9028 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026036761804187, + "loss": 1.6574, + "step": 9029 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002603592474676862, + "loss": 1.6895, + "step": 9030 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002603508761442241, + "loss": 1.6614, + "step": 9031 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002603425040715404, + "loss": 1.6147, + "step": 9032 + }, + { + "epoch": 0.71, + "learning_rate": 0.000260334131249692, + "loss": 1.6085, + "step": 9033 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002603257576787357, + "loss": 1.6495, + "step": 9034 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002603173833587284, + "loss": 1.6233, + "step": 9035 + }, + { + "epoch": 0.71, + "learning_rate": 0.000260309008289727, + "loss": 1.655, + "step": 9036 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026030063247178825, + "loss": 1.6711, + "step": 9037 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002602922559049691, + "loss": 1.6406, + "step": 9038 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002602838785893264, + "loss": 1.7259, + "step": 9039 + }, + { + "epoch": 0.71, + "learning_rate": 0.000260275500524917, + "loss": 1.6481, + "step": 9040 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002602671217117978, + "loss": 1.6929, + "step": 9041 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026025874215002576, + "loss": 1.6257, + "step": 9042 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026025036183965764, + "loss": 1.6238, + "step": 9043 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026024198078075043, + "loss": 1.6537, + "step": 9044 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026023359897336105, + "loss": 1.6811, + "step": 9045 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026022521641754626, + "loss": 1.6417, + "step": 9046 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026021683311336314, + "loss": 1.6288, + "step": 9047 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026020844906086857, + "loss": 1.6027, + "step": 9048 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002602000642601194, + "loss": 1.7163, + "step": 9049 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026019167871117266, + "loss": 1.6344, + "step": 9050 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026018329241408517, + "loss": 1.7175, + "step": 9051 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026017490536891396, + "loss": 1.6731, + "step": 9052 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026016651757571594, + "loss": 1.6528, + "step": 9053 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026015812903454805, + "loss": 1.6435, + "step": 9054 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002601497397454673, + "loss": 1.6665, + "step": 9055 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002601413497085305, + "loss": 1.6225, + "step": 9056 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002601329589237948, + "loss": 1.6733, + "step": 9057 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002601245673913171, + "loss": 1.6247, + "step": 9058 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002601161751111543, + "loss": 1.6537, + "step": 9059 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002601077820833635, + "loss": 1.6612, + "step": 9060 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002600993883080016, + "loss": 1.6521, + "step": 9061 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002600909937851256, + "loss": 1.6815, + "step": 9062 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026008259851479244, + "loss": 1.6345, + "step": 9063 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026007420249705927, + "loss": 1.7539, + "step": 9064 + }, + { + "epoch": 0.71, + "learning_rate": 0.000260065805731983, + "loss": 1.6421, + "step": 9065 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026005740821962066, + "loss": 1.6663, + "step": 9066 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026004900996002916, + "loss": 1.623, + "step": 9067 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026004061095326575, + "loss": 1.6163, + "step": 9068 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026003221119938724, + "loss": 1.7078, + "step": 9069 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026002381069845077, + "loss": 1.6343, + "step": 9070 + }, + { + "epoch": 0.71, + "learning_rate": 0.00026001540945051326, + "loss": 1.6888, + "step": 9071 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002600070074556319, + "loss": 1.5844, + "step": 9072 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002599986047138637, + "loss": 1.6556, + "step": 9073 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002599902012252656, + "loss": 1.6567, + "step": 9074 + }, + { + "epoch": 0.71, + "learning_rate": 0.00025998179698989476, + "loss": 1.6649, + "step": 9075 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002599733920078082, + "loss": 1.6216, + "step": 9076 + }, + { + "epoch": 0.71, + "learning_rate": 0.00025996498627906304, + "loss": 1.6772, + "step": 9077 + }, + { + "epoch": 0.71, + "learning_rate": 0.00025995657980371626, + "loss": 1.6312, + "step": 9078 + }, + { + "epoch": 0.71, + "learning_rate": 0.000259948172581825, + "loss": 1.6783, + "step": 9079 + }, + { + "epoch": 0.71, + "learning_rate": 0.00025993976461344634, + "loss": 1.6155, + "step": 9080 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002599313558986373, + "loss": 1.6538, + "step": 9081 + }, + { + "epoch": 0.71, + "learning_rate": 0.00025992294643745504, + "loss": 1.6371, + "step": 9082 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002599145362299567, + "loss": 1.6404, + "step": 9083 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002599061252761992, + "loss": 1.6661, + "step": 9084 + }, + { + "epoch": 0.71, + "learning_rate": 0.00025989771357623985, + "loss": 1.6511, + "step": 9085 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002598893011301356, + "loss": 1.6207, + "step": 9086 + }, + { + "epoch": 0.71, + "learning_rate": 0.0002598808879379437, + "loss": 1.6139, + "step": 9087 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025987247399972117, + "loss": 1.6654, + "step": 9088 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002598640593155252, + "loss": 1.7312, + "step": 9089 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002598556438854129, + "loss": 1.658, + "step": 9090 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025984722770944137, + "loss": 1.6194, + "step": 9091 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002598388107876678, + "loss": 1.6055, + "step": 9092 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002598303931201493, + "loss": 1.6807, + "step": 9093 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025982197470694307, + "loss": 1.697, + "step": 9094 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025981355554810623, + "loss": 1.6156, + "step": 9095 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002598051356436959, + "loss": 1.6719, + "step": 9096 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002597967149937694, + "loss": 1.6373, + "step": 9097 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002597882935983837, + "loss": 1.564, + "step": 9098 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002597798714575961, + "loss": 1.6688, + "step": 9099 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002597714485714638, + "loss": 1.71, + "step": 9100 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002597630249400439, + "loss": 1.6507, + "step": 9101 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025975460056339356, + "loss": 1.6694, + "step": 9102 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025974617544157017, + "loss": 1.5786, + "step": 9103 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002597377495746308, + "loss": 1.6727, + "step": 9104 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002597293229626326, + "loss": 1.6504, + "step": 9105 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025972089560563286, + "loss": 1.6621, + "step": 9106 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002597124675036888, + "loss": 1.6422, + "step": 9107 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002597040386568577, + "loss": 1.6938, + "step": 9108 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025969560906519666, + "loss": 1.6691, + "step": 9109 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025968717872876295, + "loss": 1.6524, + "step": 9110 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025967874764761385, + "loss": 1.6284, + "step": 9111 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025967031582180657, + "loss": 1.6297, + "step": 9112 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002596618832513984, + "loss": 1.6665, + "step": 9113 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002596534499364465, + "loss": 1.677, + "step": 9114 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025964501587700823, + "loss": 1.7019, + "step": 9115 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002596365810731408, + "loss": 1.6344, + "step": 9116 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025962814552490146, + "loss": 1.6889, + "step": 9117 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025961970923234754, + "loss": 1.631, + "step": 9118 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025961127219553627, + "loss": 1.7323, + "step": 9119 + }, + { + "epoch": 0.72, + "learning_rate": 0.000259602834414525, + "loss": 1.6511, + "step": 9120 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002595943958893709, + "loss": 1.649, + "step": 9121 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025958595662013136, + "loss": 1.6245, + "step": 9122 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002595775166068636, + "loss": 1.6179, + "step": 9123 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025956907584962505, + "loss": 1.6475, + "step": 9124 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025956063434847294, + "loss": 1.6281, + "step": 9125 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025955219210346456, + "loss": 1.6681, + "step": 9126 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025954374911465723, + "loss": 1.6144, + "step": 9127 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002595353053821083, + "loss": 1.6572, + "step": 9128 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002595268609058751, + "loss": 1.6698, + "step": 9129 + }, + { + "epoch": 0.72, + "learning_rate": 0.000259518415686015, + "loss": 1.699, + "step": 9130 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002595099697225852, + "loss": 1.6393, + "step": 9131 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025950152301564325, + "loss": 1.6871, + "step": 9132 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002594930755652463, + "loss": 1.5913, + "step": 9133 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002594846273714518, + "loss": 1.6742, + "step": 9134 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025947617843431715, + "loss": 1.6972, + "step": 9135 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025946772875389966, + "loss": 1.632, + "step": 9136 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002594592783302566, + "loss": 1.5851, + "step": 9137 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025945082716344553, + "loss": 1.643, + "step": 9138 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025944237525352376, + "loss": 1.6444, + "step": 9139 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025943392260054863, + "loss": 1.6631, + "step": 9140 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025942546920457757, + "loss": 1.6615, + "step": 9141 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025941701506566796, + "loss": 1.6073, + "step": 9142 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025940856018387713, + "loss": 1.6571, + "step": 9143 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025940010455926263, + "loss": 1.6594, + "step": 9144 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025939164819188177, + "loss": 1.6599, + "step": 9145 + }, + { + "epoch": 0.72, + "learning_rate": 0.000259383191081792, + "loss": 1.6361, + "step": 9146 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002593747332290507, + "loss": 1.6895, + "step": 9147 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002593662746337153, + "loss": 1.5995, + "step": 9148 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025935781529584325, + "loss": 1.6775, + "step": 9149 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002593493552154921, + "loss": 1.666, + "step": 9150 + }, + { + "epoch": 0.72, + "learning_rate": 0.000259340894392719, + "loss": 1.6416, + "step": 9151 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002593324328275817, + "loss": 1.6383, + "step": 9152 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025932397052013745, + "loss": 1.6417, + "step": 9153 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025931550747044374, + "loss": 1.6781, + "step": 9154 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025930704367855813, + "loss": 1.655, + "step": 9155 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025929857914453803, + "loss": 1.6359, + "step": 9156 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002592901138684408, + "loss": 1.6645, + "step": 9157 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002592816478503241, + "loss": 1.684, + "step": 9158 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002592731810902453, + "loss": 1.6773, + "step": 9159 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002592647135882618, + "loss": 1.6639, + "step": 9160 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002592562453444313, + "loss": 1.6035, + "step": 9161 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025924777635881116, + "loss": 1.6634, + "step": 9162 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002592393066314589, + "loss": 1.5993, + "step": 9163 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025923083616243204, + "loss": 1.6668, + "step": 9164 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025922236495178806, + "loss": 1.6529, + "step": 9165 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002592138929995846, + "loss": 1.6765, + "step": 9166 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025920542030587895, + "loss": 1.6577, + "step": 9167 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002591969468707288, + "loss": 1.6266, + "step": 9168 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002591884726941916, + "loss": 1.612, + "step": 9169 + }, + { + "epoch": 0.72, + "learning_rate": 0.000259179997776325, + "loss": 1.6009, + "step": 9170 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025917152211718644, + "loss": 1.6722, + "step": 9171 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002591630457168335, + "loss": 1.6299, + "step": 9172 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025915456857532364, + "loss": 1.6612, + "step": 9173 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002591460906927146, + "loss": 1.635, + "step": 9174 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002591376120690638, + "loss": 1.5988, + "step": 9175 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002591291327044288, + "loss": 1.5817, + "step": 9176 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025912065259886725, + "loss": 1.6906, + "step": 9177 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002591121717524367, + "loss": 1.6217, + "step": 9178 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002591036901651947, + "loss": 1.6797, + "step": 9179 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002590952078371988, + "loss": 1.6872, + "step": 9180 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002590867247685067, + "loss": 1.6424, + "step": 9181 + }, + { + "epoch": 0.72, + "learning_rate": 0.000259078240959176, + "loss": 1.6439, + "step": 9182 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025906975640926417, + "loss": 1.6675, + "step": 9183 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002590612711188289, + "loss": 1.6409, + "step": 9184 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025905278508792773, + "loss": 1.6512, + "step": 9185 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002590442983166184, + "loss": 1.6547, + "step": 9186 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002590358108049584, + "loss": 1.5999, + "step": 9187 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025902732255300546, + "loss": 1.7109, + "step": 9188 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002590188335608171, + "loss": 1.6413, + "step": 9189 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002590103438284511, + "loss": 1.6561, + "step": 9190 + }, + { + "epoch": 0.72, + "learning_rate": 0.000259001853355965, + "loss": 1.6222, + "step": 9191 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025899336214341644, + "loss": 1.6511, + "step": 9192 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025898487019086313, + "loss": 1.6193, + "step": 9193 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002589763774983627, + "loss": 1.6628, + "step": 9194 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002589678840659728, + "loss": 1.5718, + "step": 9195 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002589593898937511, + "loss": 1.5932, + "step": 9196 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025895089498175524, + "loss": 1.6387, + "step": 9197 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025894239933004295, + "loss": 1.6281, + "step": 9198 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002589339029386719, + "loss": 1.6678, + "step": 9199 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025892540580769975, + "loss": 1.6482, + "step": 9200 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002589169079371842, + "loss": 1.6333, + "step": 9201 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025890840932718296, + "loss": 1.6474, + "step": 9202 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025889990997775373, + "loss": 1.6992, + "step": 9203 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002588914098889542, + "loss": 1.6659, + "step": 9204 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025888290906084206, + "loss": 1.6143, + "step": 9205 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002588744074934751, + "loss": 1.6828, + "step": 9206 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025886590518691094, + "loss": 1.6334, + "step": 9207 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002588574021412074, + "loss": 1.6734, + "step": 9208 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025884889835642213, + "loss": 1.7054, + "step": 9209 + }, + { + "epoch": 0.72, + "learning_rate": 0.000258840393832613, + "loss": 1.6287, + "step": 9210 + }, + { + "epoch": 0.72, + "learning_rate": 0.00025883188856983756, + "loss": 1.7165, + "step": 9211 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002588233825681537, + "loss": 1.66, + "step": 9212 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002588148758276191, + "loss": 1.682, + "step": 9213 + }, + { + "epoch": 0.72, + "learning_rate": 0.0002588063683482916, + "loss": 1.6147, + "step": 9214 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002587978601302289, + "loss": 1.6795, + "step": 9215 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002587893511734887, + "loss": 1.6526, + "step": 9216 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002587808414781289, + "loss": 1.6429, + "step": 9217 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002587723310442072, + "loss": 1.7356, + "step": 9218 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002587638198717814, + "loss": 1.6353, + "step": 9219 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002587553079609092, + "loss": 1.6218, + "step": 9220 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002587467953116486, + "loss": 1.6696, + "step": 9221 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025873828192405723, + "loss": 1.72, + "step": 9222 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025872976779819294, + "loss": 1.667, + "step": 9223 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002587212529341135, + "loss": 1.6619, + "step": 9224 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002587127373318768, + "loss": 1.648, + "step": 9225 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002587042209915405, + "loss": 1.6519, + "step": 9226 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002586957039131626, + "loss": 1.5704, + "step": 9227 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002586871860968009, + "loss": 1.6081, + "step": 9228 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002586786675425131, + "loss": 1.6455, + "step": 9229 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025867014825035716, + "loss": 1.6406, + "step": 9230 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002586616282203909, + "loss": 1.716, + "step": 9231 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002586531074526721, + "loss": 1.6415, + "step": 9232 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002586445859472587, + "loss": 1.677, + "step": 9233 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002586360637042085, + "loss": 1.6245, + "step": 9234 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025862754072357934, + "loss": 1.5997, + "step": 9235 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002586190170054292, + "loss": 1.637, + "step": 9236 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002586104925498158, + "loss": 1.6535, + "step": 9237 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025860196735679716, + "loss": 1.6935, + "step": 9238 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002585934414264311, + "loss": 1.6729, + "step": 9239 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025858491475877547, + "loss": 1.6334, + "step": 9240 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025857638735388817, + "loss": 1.6563, + "step": 9241 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025856785921182714, + "loss": 1.6769, + "step": 9242 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025855933033265023, + "loss": 1.6312, + "step": 9243 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002585508007164154, + "loss": 1.6332, + "step": 9244 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002585422703631805, + "loss": 1.6723, + "step": 9245 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025853373927300357, + "loss": 1.6511, + "step": 9246 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025852520744594243, + "loss": 1.6398, + "step": 9247 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025851667488205495, + "loss": 1.6532, + "step": 9248 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002585081415813991, + "loss": 1.6469, + "step": 9249 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025849960754403297, + "loss": 1.6706, + "step": 9250 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002584910727700143, + "loss": 1.6256, + "step": 9251 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002584825372594012, + "loss": 1.7208, + "step": 9252 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025847400101225145, + "loss": 1.5874, + "step": 9253 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025846546402862313, + "loss": 1.6697, + "step": 9254 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002584569263085741, + "loss": 1.6665, + "step": 9255 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002584483878521625, + "loss": 1.6479, + "step": 9256 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002584398486594461, + "loss": 1.6772, + "step": 9257 + }, + { + "epoch": 0.73, + "learning_rate": 0.000258431308730483, + "loss": 1.6175, + "step": 9258 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002584227680653312, + "loss": 1.6519, + "step": 9259 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002584142266640486, + "loss": 1.6939, + "step": 9260 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002584056845266932, + "loss": 1.6035, + "step": 9261 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002583971416533231, + "loss": 1.6902, + "step": 9262 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025838859804399613, + "loss": 1.6106, + "step": 9263 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002583800536987705, + "loss": 1.6893, + "step": 9264 + }, + { + "epoch": 0.73, + "learning_rate": 0.000258371508617704, + "loss": 1.6014, + "step": 9265 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002583629628008549, + "loss": 1.6627, + "step": 9266 + }, + { + "epoch": 0.73, + "learning_rate": 0.000258354416248281, + "loss": 1.6264, + "step": 9267 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025834586896004036, + "loss": 1.5965, + "step": 9268 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002583373209361911, + "loss": 1.6227, + "step": 9269 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025832877217679126, + "loss": 1.6105, + "step": 9270 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002583202226818988, + "loss": 1.631, + "step": 9271 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002583116724515718, + "loss": 1.6306, + "step": 9272 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002583031214858683, + "loss": 1.6907, + "step": 9273 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025829456978484637, + "loss": 1.6549, + "step": 9274 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025828601734856414, + "loss": 1.5458, + "step": 9275 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025827746417707954, + "loss": 1.6112, + "step": 9276 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025826891027045073, + "loss": 1.588, + "step": 9277 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002582603556287358, + "loss": 1.667, + "step": 9278 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002582518002519928, + "loss": 1.601, + "step": 9279 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002582432441402798, + "loss": 1.651, + "step": 9280 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025823468729365486, + "loss": 1.6055, + "step": 9281 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025822612971217613, + "loss": 1.6333, + "step": 9282 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025821757139590177, + "loss": 1.6726, + "step": 9283 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002582090123448898, + "loss": 1.6319, + "step": 9284 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002582004525591983, + "loss": 1.6412, + "step": 9285 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002581918920388855, + "loss": 1.6766, + "step": 9286 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025818333078400933, + "loss": 1.6411, + "step": 9287 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002581747687946282, + "loss": 1.6096, + "step": 9288 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002581662060708, + "loss": 1.6663, + "step": 9289 + }, + { + "epoch": 0.73, + "learning_rate": 0.000258157642612583, + "loss": 1.6404, + "step": 9290 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002581490784200353, + "loss": 1.6826, + "step": 9291 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002581405134932149, + "loss": 1.7079, + "step": 9292 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002581319478321803, + "loss": 1.6571, + "step": 9293 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025812338143698933, + "loss": 1.6506, + "step": 9294 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025811481430770025, + "loss": 1.6592, + "step": 9295 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002581062464443713, + "loss": 1.6538, + "step": 9296 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025809767784706054, + "loss": 1.594, + "step": 9297 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025808910851582624, + "loss": 1.6945, + "step": 9298 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025808053845072655, + "loss": 1.6327, + "step": 9299 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025807196765181964, + "loss": 1.6707, + "step": 9300 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002580633961191637, + "loss": 1.6326, + "step": 9301 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025805482385281693, + "loss": 1.6356, + "step": 9302 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025804625085283753, + "loss": 1.6218, + "step": 9303 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002580376771192837, + "loss": 1.6191, + "step": 9304 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025802910265221367, + "loss": 1.643, + "step": 9305 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025802052745168565, + "loss": 1.6114, + "step": 9306 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002580119515177579, + "loss": 1.5628, + "step": 9307 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002580033748504886, + "loss": 1.6635, + "step": 9308 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025799479744993594, + "loss": 1.6761, + "step": 9309 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002579862193161582, + "loss": 1.6429, + "step": 9310 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025797764044921363, + "loss": 1.6333, + "step": 9311 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002579690608491605, + "loss": 1.6239, + "step": 9312 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025796048051605707, + "loss": 1.6541, + "step": 9313 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002579518994499615, + "loss": 1.619, + "step": 9314 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025794331765093204, + "loss": 1.6147, + "step": 9315 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025793473511902715, + "loss": 1.6362, + "step": 9316 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002579261518543049, + "loss": 1.678, + "step": 9317 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002579175678568236, + "loss": 1.5954, + "step": 9318 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002579089831266416, + "loss": 1.6534, + "step": 9319 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025790039766381717, + "loss": 1.6095, + "step": 9320 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025789181146840864, + "loss": 1.6002, + "step": 9321 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025788322454047414, + "loss": 1.7147, + "step": 9322 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002578746368800722, + "loss": 1.662, + "step": 9323 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002578660484872609, + "loss": 1.6388, + "step": 9324 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002578574593620987, + "loss": 1.6497, + "step": 9325 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002578488695046438, + "loss": 1.6855, + "step": 9326 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002578402789149547, + "loss": 1.613, + "step": 9327 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025783168759308954, + "loss": 1.6493, + "step": 9328 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002578230955391068, + "loss": 1.6298, + "step": 9329 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002578145027530647, + "loss": 1.6142, + "step": 9330 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025780590923502164, + "loss": 1.7036, + "step": 9331 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002577973149850359, + "loss": 1.6235, + "step": 9332 + }, + { + "epoch": 0.73, + "learning_rate": 0.000257788720003166, + "loss": 1.6238, + "step": 9333 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025778012428947003, + "loss": 1.6397, + "step": 9334 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002577715278440065, + "loss": 1.6434, + "step": 9335 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002577629306668339, + "loss": 1.6767, + "step": 9336 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002577543327580104, + "loss": 1.6495, + "step": 9337 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002577457341175944, + "loss": 1.6751, + "step": 9338 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002577371347456444, + "loss": 1.6886, + "step": 9339 + }, + { + "epoch": 0.73, + "learning_rate": 0.00025772853464221866, + "loss": 1.6487, + "step": 9340 + }, + { + "epoch": 0.73, + "learning_rate": 0.0002577199338073756, + "loss": 1.6072, + "step": 9341 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002577113322411737, + "loss": 1.6424, + "step": 9342 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002577027299436712, + "loss": 1.7073, + "step": 9343 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002576941269149267, + "loss": 1.6375, + "step": 9344 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025768552315499844, + "loss": 1.6525, + "step": 9345 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002576769186639449, + "loss": 1.6632, + "step": 9346 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002576683134418246, + "loss": 1.6034, + "step": 9347 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025765970748869576, + "loss": 1.6727, + "step": 9348 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025765110080461695, + "loss": 1.6676, + "step": 9349 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002576424933896466, + "loss": 1.6025, + "step": 9350 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002576338852438431, + "loss": 1.6342, + "step": 9351 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025762527636726494, + "loss": 1.6012, + "step": 9352 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002576166667599705, + "loss": 1.6663, + "step": 9353 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002576080564220183, + "loss": 1.6901, + "step": 9354 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002575994453534668, + "loss": 1.6622, + "step": 9355 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025759083355437443, + "loss": 1.6178, + "step": 9356 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025758222102479966, + "loss": 1.624, + "step": 9357 + }, + { + "epoch": 0.74, + "learning_rate": 0.000257573607764801, + "loss": 1.6266, + "step": 9358 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002575649937744369, + "loss": 1.6231, + "step": 9359 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025755637905376585, + "loss": 1.6476, + "step": 9360 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002575477636028463, + "loss": 1.6596, + "step": 9361 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025753914742173686, + "loss": 1.644, + "step": 9362 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025753053051049595, + "loss": 1.6581, + "step": 9363 + }, + { + "epoch": 0.74, + "learning_rate": 0.000257521912869182, + "loss": 1.7045, + "step": 9364 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025751329449785363, + "loss": 1.6992, + "step": 9365 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002575046753965694, + "loss": 1.7043, + "step": 9366 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025749605556538765, + "loss": 1.6134, + "step": 9367 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025748743500436704, + "loss": 1.6249, + "step": 9368 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025747881371356604, + "loss": 1.6291, + "step": 9369 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025747019169304326, + "loss": 1.6428, + "step": 9370 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025746156894285713, + "loss": 1.6166, + "step": 9371 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025745294546306626, + "loss": 1.6357, + "step": 9372 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002574443212537292, + "loss": 1.6442, + "step": 9373 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025743569631490453, + "loss": 1.6947, + "step": 9374 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002574270706466507, + "loss": 1.6768, + "step": 9375 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002574184442490264, + "loss": 1.6101, + "step": 9376 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002574098171220901, + "loss": 1.662, + "step": 9377 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002574011892659004, + "loss": 1.5979, + "step": 9378 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025739256068051596, + "loss": 1.6701, + "step": 9379 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002573839313659953, + "loss": 1.6393, + "step": 9380 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025737530132239695, + "loss": 1.6494, + "step": 9381 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002573666705497796, + "loss": 1.6254, + "step": 9382 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025735803904820175, + "loss": 1.5853, + "step": 9383 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002573494068177221, + "loss": 1.5814, + "step": 9384 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002573407738583992, + "loss": 1.6095, + "step": 9385 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025733214017029175, + "loss": 1.6405, + "step": 9386 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002573235057534582, + "loss": 1.6024, + "step": 9387 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002573148706079573, + "loss": 1.637, + "step": 9388 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002573062347338477, + "loss": 1.6071, + "step": 9389 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002572975981311879, + "loss": 1.6468, + "step": 9390 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002572889608000367, + "loss": 1.6522, + "step": 9391 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025728032274045267, + "loss": 1.6509, + "step": 9392 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025727168395249436, + "loss": 1.6017, + "step": 9393 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002572630444362205, + "loss": 1.6609, + "step": 9394 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002572544041916899, + "loss": 1.6176, + "step": 9395 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025724576321896103, + "loss": 1.6375, + "step": 9396 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002572371215180926, + "loss": 1.6279, + "step": 9397 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002572284790891432, + "loss": 1.6346, + "step": 9398 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025721983593217173, + "loss": 1.6364, + "step": 9399 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002572111920472367, + "loss": 1.6754, + "step": 9400 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025720254743439685, + "loss": 1.6645, + "step": 9401 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025719390209371084, + "loss": 1.6954, + "step": 9402 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002571852560252374, + "loss": 1.6239, + "step": 9403 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025717660922903524, + "loss": 1.6634, + "step": 9404 + }, + { + "epoch": 0.74, + "learning_rate": 0.000257167961705163, + "loss": 1.5995, + "step": 9405 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002571593134536795, + "loss": 1.5917, + "step": 9406 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002571506644746433, + "loss": 1.6333, + "step": 9407 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002571420147681133, + "loss": 1.6679, + "step": 9408 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002571333643341482, + "loss": 1.6279, + "step": 9409 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002571247131728065, + "loss": 1.6714, + "step": 9410 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025711606128414724, + "loss": 1.6613, + "step": 9411 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025710740866822905, + "loss": 1.6571, + "step": 9412 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002570987553251106, + "loss": 1.6772, + "step": 9413 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025709010125485077, + "loss": 1.7034, + "step": 9414 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002570814464575082, + "loss": 1.6535, + "step": 9415 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002570727909331417, + "loss": 1.642, + "step": 9416 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025706413468181, + "loss": 1.6637, + "step": 9417 + }, + { + "epoch": 0.74, + "learning_rate": 0.000257055477703572, + "loss": 1.627, + "step": 9418 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025704681999848635, + "loss": 1.635, + "step": 9419 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025703816156661183, + "loss": 1.583, + "step": 9420 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002570295024080073, + "loss": 1.6586, + "step": 9421 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025702084252273154, + "loss": 1.6425, + "step": 9422 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025701218191084325, + "loss": 1.6309, + "step": 9423 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002570035205724013, + "loss": 1.6165, + "step": 9424 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002569948585074646, + "loss": 1.6181, + "step": 9425 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002569861957160918, + "loss": 1.6797, + "step": 9426 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002569775321983417, + "loss": 1.652, + "step": 9427 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025696886795427323, + "loss": 1.6208, + "step": 9428 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025696020298394517, + "loss": 1.6162, + "step": 9429 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025695153728741644, + "loss": 1.6784, + "step": 9430 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025694287086474573, + "loss": 1.6748, + "step": 9431 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002569342037159919, + "loss": 1.6339, + "step": 9432 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025692553584121387, + "loss": 1.6266, + "step": 9433 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025691686724047045, + "loss": 1.66, + "step": 9434 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025690819791382056, + "loss": 1.7077, + "step": 9435 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025689952786132295, + "loss": 1.6514, + "step": 9436 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025689085708303656, + "loss": 1.6615, + "step": 9437 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025688218557902025, + "loss": 1.6472, + "step": 9438 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025687351334933284, + "loss": 1.6222, + "step": 9439 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025686484039403327, + "loss": 1.6696, + "step": 9440 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002568561667131804, + "loss": 1.6974, + "step": 9441 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025684749230683315, + "loss": 1.6765, + "step": 9442 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025683881717505035, + "loss": 1.6058, + "step": 9443 + }, + { + "epoch": 0.74, + "learning_rate": 0.000256830141317891, + "loss": 1.665, + "step": 9444 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002568214647354139, + "loss": 1.6209, + "step": 9445 + }, + { + "epoch": 0.74, + "learning_rate": 0.000256812787427678, + "loss": 1.7226, + "step": 9446 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025680410939474225, + "loss": 1.714, + "step": 9447 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002567954306366655, + "loss": 1.6508, + "step": 9448 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002567867511535067, + "loss": 1.649, + "step": 9449 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025677807094532485, + "loss": 1.6203, + "step": 9450 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002567693900121788, + "loss": 1.6089, + "step": 9451 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002567607083541275, + "loss": 1.6443, + "step": 9452 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002567520259712299, + "loss": 1.7145, + "step": 9453 + }, + { + "epoch": 0.74, + "learning_rate": 0.000256743342863545, + "loss": 1.6294, + "step": 9454 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025673465903113164, + "loss": 1.6134, + "step": 9455 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025672597447404884, + "loss": 1.67, + "step": 9456 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002567172891923556, + "loss": 1.6105, + "step": 9457 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002567086031861109, + "loss": 1.6071, + "step": 9458 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025669991645537366, + "loss": 1.6357, + "step": 9459 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025669122900020283, + "loss": 1.6547, + "step": 9460 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002566825408206574, + "loss": 1.624, + "step": 9461 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002566738519167965, + "loss": 1.6285, + "step": 9462 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002566651622886789, + "loss": 1.613, + "step": 9463 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025665647193636376, + "loss": 1.6308, + "step": 9464 + }, + { + "epoch": 0.74, + "learning_rate": 0.0002566477808599101, + "loss": 1.6337, + "step": 9465 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025663908905937676, + "loss": 1.6759, + "step": 9466 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025663039653482287, + "loss": 1.6724, + "step": 9467 + }, + { + "epoch": 0.74, + "learning_rate": 0.00025662170328630745, + "loss": 1.653, + "step": 9468 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002566130093138895, + "loss": 1.6451, + "step": 9469 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002566043146176281, + "loss": 1.6252, + "step": 9470 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025659561919758213, + "loss": 1.6451, + "step": 9471 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002565869230538108, + "loss": 1.6036, + "step": 9472 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025657822618637305, + "loss": 1.6617, + "step": 9473 + }, + { + "epoch": 0.75, + "learning_rate": 0.000256569528595328, + "loss": 1.6595, + "step": 9474 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025656083028073465, + "loss": 1.6857, + "step": 9475 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025655213124265206, + "loss": 1.5927, + "step": 9476 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025654343148113926, + "loss": 1.6721, + "step": 9477 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002565347309962554, + "loss": 1.627, + "step": 9478 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002565260297880595, + "loss": 1.6703, + "step": 9479 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002565173278566106, + "loss": 1.5977, + "step": 9480 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002565086252019679, + "loss": 1.6515, + "step": 9481 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002564999218241904, + "loss": 1.6059, + "step": 9482 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025649121772333716, + "loss": 1.5629, + "step": 9483 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025648251289946735, + "loss": 1.6215, + "step": 9484 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025647380735264005, + "loss": 1.6362, + "step": 9485 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025646510108291433, + "loss": 1.6645, + "step": 9486 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002564563940903493, + "loss": 1.6572, + "step": 9487 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002564476863750041, + "loss": 1.6768, + "step": 9488 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002564389779369379, + "loss": 1.7057, + "step": 9489 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002564302687762098, + "loss": 1.6803, + "step": 9490 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002564215588928788, + "loss": 1.6749, + "step": 9491 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025641284828700425, + "loss": 1.6229, + "step": 9492 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025640413695864517, + "loss": 1.6393, + "step": 9493 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025639542490786066, + "loss": 1.5823, + "step": 9494 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025638671213471, + "loss": 1.6195, + "step": 9495 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002563779986392522, + "loss": 1.6502, + "step": 9496 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002563692844215466, + "loss": 1.6771, + "step": 9497 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002563605694816522, + "loss": 1.6691, + "step": 9498 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025635185381962816, + "loss": 1.6629, + "step": 9499 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002563431374355338, + "loss": 1.6426, + "step": 9500 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002563344203294282, + "loss": 1.6461, + "step": 9501 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025632570250137056, + "loss": 1.6834, + "step": 9502 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002563169839514201, + "loss": 1.6385, + "step": 9503 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002563082646796359, + "loss": 1.6594, + "step": 9504 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025629954468607736, + "loss": 1.584, + "step": 9505 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025629082397080353, + "loss": 1.6648, + "step": 9506 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002562821025338737, + "loss": 1.6392, + "step": 9507 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025627338037534695, + "loss": 1.6983, + "step": 9508 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002562646574952827, + "loss": 1.5595, + "step": 9509 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025625593389374, + "loss": 1.689, + "step": 9510 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002562472095707782, + "loss": 1.6213, + "step": 9511 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002562384845264564, + "loss": 1.6277, + "step": 9512 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025622975876083396, + "loss": 1.711, + "step": 9513 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002562210322739701, + "loss": 1.6344, + "step": 9514 + }, + { + "epoch": 0.75, + "learning_rate": 0.000256212305065924, + "loss": 1.6043, + "step": 9515 + }, + { + "epoch": 0.75, + "learning_rate": 0.000256203577136755, + "loss": 1.6551, + "step": 9516 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002561948484865223, + "loss": 1.6325, + "step": 9517 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002561861191152852, + "loss": 1.6426, + "step": 9518 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025617738902310297, + "loss": 1.6386, + "step": 9519 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025616865821003485, + "loss": 1.628, + "step": 9520 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002561599266761401, + "loss": 1.6573, + "step": 9521 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002561511944214781, + "loss": 1.6564, + "step": 9522 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025614246144610794, + "loss": 1.661, + "step": 9523 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025613372775008916, + "loss": 1.6444, + "step": 9524 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002561249933334809, + "loss": 1.62, + "step": 9525 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002561162581963425, + "loss": 1.7062, + "step": 9526 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025610752233873324, + "loss": 1.5972, + "step": 9527 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002560987857607125, + "loss": 1.6606, + "step": 9528 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002560900484623395, + "loss": 1.6608, + "step": 9529 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025608131044367366, + "loss": 1.6243, + "step": 9530 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002560725717047742, + "loss": 1.6919, + "step": 9531 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002560638322457006, + "loss": 1.6706, + "step": 9532 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025605509206651206, + "loss": 1.6167, + "step": 9533 + }, + { + "epoch": 0.75, + "learning_rate": 0.000256046351167268, + "loss": 1.6491, + "step": 9534 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025603760954802775, + "loss": 1.6767, + "step": 9535 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002560288672088506, + "loss": 1.7025, + "step": 9536 + }, + { + "epoch": 0.75, + "learning_rate": 0.000256020124149796, + "loss": 1.629, + "step": 9537 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025601138037092323, + "loss": 1.6343, + "step": 9538 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002560026358722917, + "loss": 1.5996, + "step": 9539 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002559938906539608, + "loss": 1.6066, + "step": 9540 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002559851447159898, + "loss": 1.598, + "step": 9541 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002559763980584382, + "loss": 1.654, + "step": 9542 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025596765068136535, + "loss": 1.644, + "step": 9543 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002559589025848306, + "loss": 1.6181, + "step": 9544 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025595015376889336, + "loss": 1.6445, + "step": 9545 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002559414042336131, + "loss": 1.6641, + "step": 9546 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025593265397904914, + "loss": 1.6509, + "step": 9547 + }, + { + "epoch": 0.75, + "learning_rate": 0.000255923903005261, + "loss": 1.5853, + "step": 9548 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002559151513123079, + "loss": 1.6062, + "step": 9549 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002559063989002494, + "loss": 1.6664, + "step": 9550 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002558976457691449, + "loss": 1.6467, + "step": 9551 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025588889191905376, + "loss": 1.588, + "step": 9552 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002558801373500356, + "loss": 1.6682, + "step": 9553 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002558713820621497, + "loss": 1.7259, + "step": 9554 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002558626260554555, + "loss": 1.6362, + "step": 9555 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002558538693300125, + "loss": 1.5731, + "step": 9556 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025584511188588016, + "loss": 1.6404, + "step": 9557 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002558363537231179, + "loss": 1.6105, + "step": 9558 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025582759484178523, + "loss": 1.6522, + "step": 9559 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002558188352419416, + "loss": 1.5901, + "step": 9560 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002558100749236464, + "loss": 1.6351, + "step": 9561 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025580131388695923, + "loss": 1.6793, + "step": 9562 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002557925521319396, + "loss": 1.7318, + "step": 9563 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025578378965864684, + "loss": 1.6722, + "step": 9564 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002557750264671405, + "loss": 1.6551, + "step": 9565 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025576626255748014, + "loss": 1.6481, + "step": 9566 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025575749792972524, + "loss": 1.6268, + "step": 9567 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002557487325839352, + "loss": 1.6126, + "step": 9568 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002557399665201697, + "loss": 1.6057, + "step": 9569 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002557311997384882, + "loss": 1.5909, + "step": 9570 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025572243223895015, + "loss": 1.675, + "step": 9571 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002557136640216152, + "loss": 1.5954, + "step": 9572 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002557048950865428, + "loss": 1.6247, + "step": 9573 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002556961254337924, + "loss": 1.6738, + "step": 9574 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002556873550634237, + "loss": 1.6445, + "step": 9575 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002556785839754962, + "loss": 1.6575, + "step": 9576 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002556698121700694, + "loss": 1.6498, + "step": 9577 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002556610396472029, + "loss": 1.6673, + "step": 9578 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025565226640695627, + "loss": 1.6275, + "step": 9579 + }, + { + "epoch": 0.75, + "learning_rate": 0.000255643492449389, + "loss": 1.6272, + "step": 9580 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025563471777456073, + "loss": 1.6504, + "step": 9581 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025562594238253105, + "loss": 1.5866, + "step": 9582 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002556171662733595, + "loss": 1.6618, + "step": 9583 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025560838944710564, + "loss": 1.6393, + "step": 9584 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025559961190382916, + "loss": 1.632, + "step": 9585 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002555908336435896, + "loss": 1.6841, + "step": 9586 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025558205466644647, + "loss": 1.6379, + "step": 9587 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002555732749724595, + "loss": 1.628, + "step": 9588 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002555644945616882, + "loss": 1.682, + "step": 9589 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002555557134341923, + "loss": 1.5826, + "step": 9590 + }, + { + "epoch": 0.75, + "learning_rate": 0.00025554693159003135, + "loss": 1.6276, + "step": 9591 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002555381490292649, + "loss": 1.6212, + "step": 9592 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002555293657519528, + "loss": 1.6263, + "step": 9593 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002555205817581545, + "loss": 1.6143, + "step": 9594 + }, + { + "epoch": 0.75, + "learning_rate": 0.0002555117970479296, + "loss": 1.7097, + "step": 9595 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025550301162133787, + "loss": 1.637, + "step": 9596 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002554942254784389, + "loss": 1.679, + "step": 9597 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025548543861929243, + "loss": 1.6444, + "step": 9598 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002554766510439579, + "loss": 1.6785, + "step": 9599 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025546786275249526, + "loss": 1.6596, + "step": 9600 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025545907374496395, + "loss": 1.6154, + "step": 9601 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002554502840214238, + "loss": 1.6279, + "step": 9602 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025544149358193435, + "loss": 1.5644, + "step": 9603 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025543270242655533, + "loss": 1.6215, + "step": 9604 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002554239105553465, + "loss": 1.6363, + "step": 9605 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002554151179683675, + "loss": 1.641, + "step": 9606 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025540632466567793, + "loss": 1.6561, + "step": 9607 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002553975306473377, + "loss": 1.6628, + "step": 9608 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002553887359134063, + "loss": 1.6631, + "step": 9609 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002553799404639436, + "loss": 1.6133, + "step": 9610 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025537114429900927, + "loss": 1.6597, + "step": 9611 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025536234741866293, + "loss": 1.6245, + "step": 9612 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002553535498229645, + "loss": 1.6156, + "step": 9613 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002553447515119736, + "loss": 1.6079, + "step": 9614 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025533595248574987, + "loss": 1.6254, + "step": 9615 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025532715274435326, + "loss": 1.6248, + "step": 9616 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025531835228784336, + "loss": 1.6734, + "step": 9617 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025530955111627995, + "loss": 1.5941, + "step": 9618 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025530074922972283, + "loss": 1.6318, + "step": 9619 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025529194662823174, + "loss": 1.6748, + "step": 9620 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002552831433118664, + "loss": 1.6341, + "step": 9621 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025527433928068666, + "loss": 1.619, + "step": 9622 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002552655345347522, + "loss": 1.6899, + "step": 9623 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002552567290741229, + "loss": 1.6555, + "step": 9624 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025524792289885847, + "loss": 1.6555, + "step": 9625 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002552391160090188, + "loss": 1.6343, + "step": 9626 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002552303084046635, + "loss": 1.6542, + "step": 9627 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025522150008585253, + "loss": 1.6352, + "step": 9628 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002552126910526456, + "loss": 1.6423, + "step": 9629 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002552038813051026, + "loss": 1.7127, + "step": 9630 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002551950708432833, + "loss": 1.6042, + "step": 9631 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025518625966724747, + "loss": 1.5996, + "step": 9632 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025517744777705506, + "loss": 1.6575, + "step": 9633 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025516863517276574, + "loss": 1.6607, + "step": 9634 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025515982185443946, + "loss": 1.7121, + "step": 9635 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025515100782213607, + "loss": 1.6651, + "step": 9636 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002551421930759153, + "loss": 1.6351, + "step": 9637 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002551333776158371, + "loss": 1.666, + "step": 9638 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025512456144196125, + "loss": 1.6706, + "step": 9639 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002551157445543477, + "loss": 1.629, + "step": 9640 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002551069269530562, + "loss": 1.6601, + "step": 9641 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025509810863814664, + "loss": 1.6217, + "step": 9642 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025508928960967897, + "loss": 1.6161, + "step": 9643 + }, + { + "epoch": 0.76, + "learning_rate": 0.000255080469867713, + "loss": 1.6374, + "step": 9644 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025507164941230865, + "loss": 1.6543, + "step": 9645 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025506282824352576, + "loss": 1.5965, + "step": 9646 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002550540063614243, + "loss": 1.6635, + "step": 9647 + }, + { + "epoch": 0.76, + "learning_rate": 0.000255045183766064, + "loss": 1.5928, + "step": 9648 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002550363604575049, + "loss": 1.5873, + "step": 9649 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025502753643580697, + "loss": 1.6661, + "step": 9650 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025501871170102995, + "loss": 1.6655, + "step": 9651 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002550098862532339, + "loss": 1.6379, + "step": 9652 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002550010600924786, + "loss": 1.6657, + "step": 9653 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002549922332188241, + "loss": 1.6863, + "step": 9654 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002549834056323302, + "loss": 1.6679, + "step": 9655 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025497457733305695, + "loss": 1.6642, + "step": 9656 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025496574832106425, + "loss": 1.5723, + "step": 9657 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002549569185964121, + "loss": 1.6933, + "step": 9658 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002549480881591603, + "loss": 1.6433, + "step": 9659 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002549392570093689, + "loss": 1.6258, + "step": 9660 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002549304251470979, + "loss": 1.6024, + "step": 9661 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025492159257240723, + "loss": 1.6621, + "step": 9662 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002549127592853568, + "loss": 1.6083, + "step": 9663 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002549039252860066, + "loss": 1.6221, + "step": 9664 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002548950905744168, + "loss": 1.6719, + "step": 9665 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002548862551506471, + "loss": 1.6607, + "step": 9666 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002548774190147576, + "loss": 1.6223, + "step": 9667 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025486858216680836, + "loss": 1.6071, + "step": 9668 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025485974460685926, + "loss": 1.6483, + "step": 9669 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002548509063349704, + "loss": 1.6689, + "step": 9670 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025484206735120173, + "loss": 1.6371, + "step": 9671 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025483322765561326, + "loss": 1.6573, + "step": 9672 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025482438724826504, + "loss": 1.637, + "step": 9673 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025481554612921713, + "loss": 1.6956, + "step": 9674 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025480670429852944, + "loss": 1.642, + "step": 9675 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002547978617562621, + "loss": 1.5925, + "step": 9676 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025478901850247505, + "loss": 1.6282, + "step": 9677 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025478017453722844, + "loss": 1.6162, + "step": 9678 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002547713298605823, + "loss": 1.6518, + "step": 9679 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002547624844725966, + "loss": 1.6392, + "step": 9680 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025475363837333144, + "loss": 1.6447, + "step": 9681 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002547447915628469, + "loss": 1.6759, + "step": 9682 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025473594404120303, + "loss": 1.6511, + "step": 9683 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002547270958084599, + "loss": 1.6472, + "step": 9684 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025471824686467754, + "loss": 1.669, + "step": 9685 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002547093972099161, + "loss": 1.5841, + "step": 9686 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025470054684423565, + "loss": 1.6598, + "step": 9687 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002546916957676963, + "loss": 1.6581, + "step": 9688 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025468284398035804, + "loss": 1.6306, + "step": 9689 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025467399148228106, + "loss": 1.6237, + "step": 9690 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025466513827352544, + "loss": 1.6269, + "step": 9691 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025465628435415136, + "loss": 1.5991, + "step": 9692 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025464742972421876, + "loss": 1.6411, + "step": 9693 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002546385743837879, + "loss": 1.5873, + "step": 9694 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002546297183329189, + "loss": 1.6348, + "step": 9695 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002546208615716718, + "loss": 1.6981, + "step": 9696 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002546120041001068, + "loss": 1.6029, + "step": 9697 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002546031459182841, + "loss": 1.5729, + "step": 9698 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002545942870262636, + "loss": 1.672, + "step": 9699 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002545854274241057, + "loss": 1.6119, + "step": 9700 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002545765671118705, + "loss": 1.6961, + "step": 9701 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025456770608961807, + "loss": 1.6354, + "step": 9702 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025455884435740864, + "loss": 1.6242, + "step": 9703 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025454998191530234, + "loss": 1.6182, + "step": 9704 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002545411187633594, + "loss": 1.6413, + "step": 9705 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002545322549016399, + "loss": 1.633, + "step": 9706 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025452339033020413, + "loss": 1.6686, + "step": 9707 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025451452504911216, + "loss": 1.6491, + "step": 9708 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025450565905842424, + "loss": 1.5971, + "step": 9709 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025449679235820064, + "loss": 1.6227, + "step": 9710 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025448792494850144, + "loss": 1.6747, + "step": 9711 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002544790568293869, + "loss": 1.6427, + "step": 9712 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002544701880009172, + "loss": 1.6548, + "step": 9713 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002544613184631526, + "loss": 1.6909, + "step": 9714 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002544524482161533, + "loss": 1.6594, + "step": 9715 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002544435772599795, + "loss": 1.7044, + "step": 9716 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025443470559469145, + "loss": 1.6197, + "step": 9717 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025442583322034934, + "loss": 1.6892, + "step": 9718 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002544169601370135, + "loss": 1.5759, + "step": 9719 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002544080863447441, + "loss": 1.6388, + "step": 9720 + }, + { + "epoch": 0.76, + "learning_rate": 0.00025439921184360146, + "loss": 1.5918, + "step": 9721 + }, + { + "epoch": 0.76, + "learning_rate": 0.0002543903366336457, + "loss": 1.6443, + "step": 9722 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025438146071493726, + "loss": 1.7043, + "step": 9723 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002543725840875362, + "loss": 1.6361, + "step": 9724 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025436370675150293, + "loss": 1.6582, + "step": 9725 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025435482870689774, + "loss": 1.6169, + "step": 9726 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002543459499537808, + "loss": 1.6677, + "step": 9727 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002543370704922125, + "loss": 1.5837, + "step": 9728 + }, + { + "epoch": 0.77, + "learning_rate": 0.000254328190322253, + "loss": 1.6246, + "step": 9729 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025431930944396267, + "loss": 1.6578, + "step": 9730 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002543104278574018, + "loss": 1.6404, + "step": 9731 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002543015455626307, + "loss": 1.6684, + "step": 9732 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025429266255970966, + "loss": 1.5891, + "step": 9733 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025428377884869897, + "loss": 1.6174, + "step": 9734 + }, + { + "epoch": 0.77, + "learning_rate": 0.000254274894429659, + "loss": 1.6629, + "step": 9735 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025426600930265, + "loss": 1.6106, + "step": 9736 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002542571234677324, + "loss": 1.7018, + "step": 9737 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025424823692496646, + "loss": 1.66, + "step": 9738 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002542393496744125, + "loss": 1.587, + "step": 9739 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025423046171613086, + "loss": 1.6167, + "step": 9740 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025422157305018196, + "loss": 1.6314, + "step": 9741 + }, + { + "epoch": 0.77, + "learning_rate": 0.000254212683676626, + "loss": 1.5735, + "step": 9742 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002542037935955235, + "loss": 1.644, + "step": 9743 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025419490280693475, + "loss": 1.6274, + "step": 9744 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002541860113109201, + "loss": 1.6451, + "step": 9745 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002541771191075399, + "loss": 1.6827, + "step": 9746 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002541682261968545, + "loss": 1.6851, + "step": 9747 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002541593325789244, + "loss": 1.6555, + "step": 9748 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025415043825380995, + "loss": 1.6241, + "step": 9749 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025414154322157145, + "loss": 1.6426, + "step": 9750 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002541326474822693, + "loss": 1.6054, + "step": 9751 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025412375103596403, + "loss": 1.5867, + "step": 9752 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002541148538827159, + "loss": 1.6157, + "step": 9753 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002541059560225854, + "loss": 1.6574, + "step": 9754 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025409705745563287, + "loss": 1.6497, + "step": 9755 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002540881581819187, + "loss": 1.6385, + "step": 9756 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002540792582015035, + "loss": 1.6697, + "step": 9757 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025407035751444753, + "loss": 1.6583, + "step": 9758 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025406145612081124, + "loss": 1.6391, + "step": 9759 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025405255402065514, + "loss": 1.6065, + "step": 9760 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002540436512140396, + "loss": 1.7021, + "step": 9761 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025403474770102505, + "loss": 1.6498, + "step": 9762 + }, + { + "epoch": 0.77, + "learning_rate": 0.000254025843481672, + "loss": 1.6466, + "step": 9763 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025401693855604086, + "loss": 1.6077, + "step": 9764 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025400803292419214, + "loss": 1.681, + "step": 9765 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025399912658618623, + "loss": 1.6487, + "step": 9766 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002539902195420837, + "loss": 1.7237, + "step": 9767 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025398131179194493, + "loss": 1.6566, + "step": 9768 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025397240333583043, + "loss": 1.6331, + "step": 9769 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002539634941738007, + "loss": 1.6513, + "step": 9770 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002539545843059162, + "loss": 1.6744, + "step": 9771 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002539456737322375, + "loss": 1.6496, + "step": 9772 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025393676245282496, + "loss": 1.6309, + "step": 9773 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002539278504677392, + "loss": 1.6008, + "step": 9774 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025391893777704065, + "loss": 1.6719, + "step": 9775 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002539100243807899, + "loss": 1.6404, + "step": 9776 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002539011102790474, + "loss": 1.6289, + "step": 9777 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025389219547187374, + "loss": 1.6535, + "step": 9778 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002538832799593294, + "loss": 1.6366, + "step": 9779 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025387436374147484, + "loss": 1.6491, + "step": 9780 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025386544681837075, + "loss": 1.6007, + "step": 9781 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025385652919007756, + "loss": 1.6356, + "step": 9782 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025384761085665586, + "loss": 1.6392, + "step": 9783 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002538386918181662, + "loss": 1.6005, + "step": 9784 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025382977207466913, + "loss": 1.6328, + "step": 9785 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002538208516262252, + "loss": 1.678, + "step": 9786 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025381193047289497, + "loss": 1.6879, + "step": 9787 + }, + { + "epoch": 0.77, + "learning_rate": 0.000253803008614739, + "loss": 1.5845, + "step": 9788 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002537940860518179, + "loss": 1.6472, + "step": 9789 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025378516278419224, + "loss": 1.6726, + "step": 9790 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002537762388119226, + "loss": 1.6118, + "step": 9791 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002537673141350696, + "loss": 1.6442, + "step": 9792 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025375838875369377, + "loss": 1.6566, + "step": 9793 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002537494626678557, + "loss": 1.6641, + "step": 9794 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025374053587761606, + "loss": 1.6335, + "step": 9795 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025373160838303545, + "loss": 1.6321, + "step": 9796 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025372268018417445, + "loss": 1.698, + "step": 9797 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002537137512810937, + "loss": 1.5871, + "step": 9798 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002537048216738538, + "loss": 1.6422, + "step": 9799 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002536958913625154, + "loss": 1.6444, + "step": 9800 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025368696034713914, + "loss": 1.639, + "step": 9801 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002536780286277856, + "loss": 1.613, + "step": 9802 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002536690962045154, + "loss": 1.6757, + "step": 9803 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002536601630773894, + "loss": 1.5951, + "step": 9804 + }, + { + "epoch": 0.77, + "learning_rate": 0.000253651229246468, + "loss": 1.6058, + "step": 9805 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025364229471181197, + "loss": 1.5853, + "step": 9806 + }, + { + "epoch": 0.77, + "learning_rate": 0.000253633359473482, + "loss": 1.5803, + "step": 9807 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002536244235315386, + "loss": 1.5994, + "step": 9808 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002536154868860426, + "loss": 1.6554, + "step": 9809 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025360654953705467, + "loss": 1.6389, + "step": 9810 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002535976114846354, + "loss": 1.6269, + "step": 9811 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002535886727288455, + "loss": 1.627, + "step": 9812 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025357973326974574, + "loss": 1.6624, + "step": 9813 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002535707931073967, + "loss": 1.6222, + "step": 9814 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025356185224185914, + "loss": 1.6306, + "step": 9815 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025355291067319374, + "loss": 1.6162, + "step": 9816 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002535439684014613, + "loss": 1.6218, + "step": 9817 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002535350254267224, + "loss": 1.6344, + "step": 9818 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002535260817490377, + "loss": 1.6543, + "step": 9819 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002535171373684682, + "loss": 1.656, + "step": 9820 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002535081922850744, + "loss": 1.6397, + "step": 9821 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002534992464989171, + "loss": 1.6015, + "step": 9822 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025349030001005704, + "loss": 1.5913, + "step": 9823 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002534813528185549, + "loss": 1.6197, + "step": 9824 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002534724049244716, + "loss": 1.6501, + "step": 9825 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002534634563278677, + "loss": 1.6027, + "step": 9826 + }, + { + "epoch": 0.77, + "learning_rate": 0.000253454507028804, + "loss": 1.6394, + "step": 9827 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025344555702734134, + "loss": 1.625, + "step": 9828 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025343660632354037, + "loss": 1.6405, + "step": 9829 + }, + { + "epoch": 0.77, + "learning_rate": 0.000253427654917462, + "loss": 1.6031, + "step": 9830 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025341870280916687, + "loss": 1.6182, + "step": 9831 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002534097499987158, + "loss": 1.6727, + "step": 9832 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025340079648616964, + "loss": 1.6344, + "step": 9833 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025339184227158917, + "loss": 1.6037, + "step": 9834 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025338288735503507, + "loss": 1.6178, + "step": 9835 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025337393173656826, + "loss": 1.6172, + "step": 9836 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002533649754162495, + "loss": 1.6257, + "step": 9837 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025335601839413956, + "loss": 1.6197, + "step": 9838 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025334706067029936, + "loss": 1.6611, + "step": 9839 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002533381022447896, + "loss": 1.6142, + "step": 9840 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025332914311767114, + "loss": 1.644, + "step": 9841 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025332018328900487, + "loss": 1.6601, + "step": 9842 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025331122275885155, + "loss": 1.6393, + "step": 9843 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025330226152727196, + "loss": 1.6447, + "step": 9844 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025329329959432713, + "loss": 1.6414, + "step": 9845 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002532843369600778, + "loss": 1.6585, + "step": 9846 + }, + { + "epoch": 0.77, + "learning_rate": 0.00025327537362458474, + "loss": 1.6589, + "step": 9847 + }, + { + "epoch": 0.77, + "learning_rate": 0.000253266409587909, + "loss": 1.645, + "step": 9848 + }, + { + "epoch": 0.77, + "learning_rate": 0.0002532574448501112, + "loss": 1.6615, + "step": 9849 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025324847941125237, + "loss": 1.6608, + "step": 9850 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025323951327139337, + "loss": 1.6374, + "step": 9851 + }, + { + "epoch": 0.78, + "learning_rate": 0.000253230546430595, + "loss": 1.5417, + "step": 9852 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002532215788889183, + "loss": 1.6529, + "step": 9853 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002532126106464239, + "loss": 1.6876, + "step": 9854 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002532036417031729, + "loss": 1.6503, + "step": 9855 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025319467205922613, + "loss": 1.6668, + "step": 9856 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002531857017146445, + "loss": 1.6805, + "step": 9857 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002531767306694888, + "loss": 1.6033, + "step": 9858 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025316775892382016, + "loss": 1.6172, + "step": 9859 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002531587864776993, + "loss": 1.6401, + "step": 9860 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002531498133311872, + "loss": 1.5894, + "step": 9861 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025314083948434484, + "loss": 1.5757, + "step": 9862 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025313186493723303, + "loss": 1.5893, + "step": 9863 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002531228896899129, + "loss": 1.6112, + "step": 9864 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025311391374244517, + "loss": 1.6891, + "step": 9865 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002531049370948908, + "loss": 1.6286, + "step": 9866 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025309595974731087, + "loss": 1.5937, + "step": 9867 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025308698169976626, + "loss": 1.654, + "step": 9868 + }, + { + "epoch": 0.78, + "learning_rate": 0.000253078002952318, + "loss": 1.6459, + "step": 9869 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002530690235050269, + "loss": 1.6533, + "step": 9870 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025306004335795405, + "loss": 1.6334, + "step": 9871 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002530510625111603, + "loss": 1.6456, + "step": 9872 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002530420809647068, + "loss": 1.6829, + "step": 9873 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002530330987186544, + "loss": 1.6514, + "step": 9874 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002530241157730641, + "loss": 1.6087, + "step": 9875 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025301513212799695, + "loss": 1.6606, + "step": 9876 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002530061477835139, + "loss": 1.6232, + "step": 9877 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025299716273967593, + "loss": 1.6669, + "step": 9878 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025298817699654405, + "loss": 1.6416, + "step": 9879 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002529791905541793, + "loss": 1.6208, + "step": 9880 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002529702034126426, + "loss": 1.6346, + "step": 9881 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025296121557199516, + "loss": 1.6296, + "step": 9882 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025295222703229783, + "loss": 1.6466, + "step": 9883 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025294323779361167, + "loss": 1.6257, + "step": 9884 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002529342478559978, + "loss": 1.6281, + "step": 9885 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025292525721951715, + "loss": 1.6077, + "step": 9886 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025291626588423076, + "loss": 1.6291, + "step": 9887 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002529072738501998, + "loss": 1.6721, + "step": 9888 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002528982811174852, + "loss": 1.6356, + "step": 9889 + }, + { + "epoch": 0.78, + "learning_rate": 0.000252889287686148, + "loss": 1.6524, + "step": 9890 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025288029355624944, + "loss": 1.63, + "step": 9891 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025287129872785034, + "loss": 1.5954, + "step": 9892 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025286230320101195, + "loss": 1.646, + "step": 9893 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002528533069757953, + "loss": 1.6826, + "step": 9894 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025284431005226143, + "loss": 1.6308, + "step": 9895 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025283531243047144, + "loss": 1.638, + "step": 9896 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002528263141104865, + "loss": 1.5817, + "step": 9897 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002528173150923675, + "loss": 1.6102, + "step": 9898 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002528083153761758, + "loss": 1.6224, + "step": 9899 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025279931496197225, + "loss": 1.6339, + "step": 9900 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002527903138498182, + "loss": 1.642, + "step": 9901 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002527813120397746, + "loss": 1.669, + "step": 9902 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025277230953190256, + "loss": 1.6684, + "step": 9903 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025276330632626327, + "loss": 1.6488, + "step": 9904 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002527543024229179, + "loss": 1.6556, + "step": 9905 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025274529782192746, + "loss": 1.6682, + "step": 9906 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002527362925233532, + "loss": 1.6943, + "step": 9907 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025272728652725614, + "loss": 1.6391, + "step": 9908 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025271827983369753, + "loss": 1.6611, + "step": 9909 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002527092724427385, + "loss": 1.6065, + "step": 9910 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002527002643544402, + "loss": 1.5877, + "step": 9911 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025269125556886374, + "loss": 1.6806, + "step": 9912 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002526822460860703, + "loss": 1.6543, + "step": 9913 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025267323590612116, + "loss": 1.6563, + "step": 9914 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025266422502907734, + "loss": 1.6231, + "step": 9915 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002526552134550001, + "loss": 1.5978, + "step": 9916 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025264620118395066, + "loss": 1.6202, + "step": 9917 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002526371882159901, + "loss": 1.6703, + "step": 9918 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002526281745511797, + "loss": 1.6678, + "step": 9919 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002526191601895806, + "loss": 1.6353, + "step": 9920 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002526101451312541, + "loss": 1.6215, + "step": 9921 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025260112937626125, + "loss": 1.5686, + "step": 9922 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002525921129246634, + "loss": 1.6025, + "step": 9923 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002525830957765217, + "loss": 1.5978, + "step": 9924 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002525740779318974, + "loss": 1.576, + "step": 9925 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002525650593908517, + "loss": 1.6686, + "step": 9926 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025255604015344586, + "loss": 1.6339, + "step": 9927 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025254702021974113, + "loss": 1.5895, + "step": 9928 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025253799958979874, + "loss": 1.6514, + "step": 9929 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002525289782636799, + "loss": 1.6111, + "step": 9930 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002525199562414458, + "loss": 1.6311, + "step": 9931 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025251093352315787, + "loss": 1.6423, + "step": 9932 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025250191010887723, + "loss": 1.5924, + "step": 9933 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025249288599866516, + "loss": 1.6353, + "step": 9934 + }, + { + "epoch": 0.78, + "learning_rate": 0.000252483861192583, + "loss": 1.6059, + "step": 9935 + }, + { + "epoch": 0.78, + "learning_rate": 0.000252474835690692, + "loss": 1.6467, + "step": 9936 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002524658094930533, + "loss": 1.6218, + "step": 9937 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025245678259972837, + "loss": 1.6273, + "step": 9938 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025244775501077844, + "loss": 1.7123, + "step": 9939 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002524387267262648, + "loss": 1.6276, + "step": 9940 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025242969774624867, + "loss": 1.5701, + "step": 9941 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002524206680707915, + "loss": 1.633, + "step": 9942 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002524116376999545, + "loss": 1.6244, + "step": 9943 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025240260663379895, + "loss": 1.6001, + "step": 9944 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002523935748723862, + "loss": 1.6827, + "step": 9945 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025238454241577763, + "loss": 1.6135, + "step": 9946 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002523755092640345, + "loss": 1.6474, + "step": 9947 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025236647541721814, + "loss": 1.6361, + "step": 9948 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025235744087538994, + "loss": 1.5966, + "step": 9949 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002523484056386112, + "loss": 1.6746, + "step": 9950 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002523393697069432, + "loss": 1.6676, + "step": 9951 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025233033308044744, + "loss": 1.663, + "step": 9952 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002523212957591851, + "loss": 1.619, + "step": 9953 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002523122577432177, + "loss": 1.5789, + "step": 9954 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025230321903260656, + "loss": 1.6237, + "step": 9955 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025229417962741295, + "loss": 1.6701, + "step": 9956 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025228513952769836, + "loss": 1.631, + "step": 9957 + }, + { + "epoch": 0.78, + "learning_rate": 0.000252276098733524, + "loss": 1.6207, + "step": 9958 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025226705724495154, + "loss": 1.7025, + "step": 9959 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002522580150620421, + "loss": 1.6403, + "step": 9960 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002522489721848572, + "loss": 1.5593, + "step": 9961 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002522399286134582, + "loss": 1.631, + "step": 9962 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025223088434790647, + "loss": 1.7165, + "step": 9963 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002522218393882635, + "loss": 1.591, + "step": 9964 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025221279373459056, + "loss": 1.6474, + "step": 9965 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025220374738694926, + "loss": 1.6229, + "step": 9966 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002521947003454009, + "loss": 1.6252, + "step": 9967 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025218565261000687, + "loss": 1.6168, + "step": 9968 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025217660418082864, + "loss": 1.604, + "step": 9969 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002521675550579277, + "loss": 1.6043, + "step": 9970 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025215850524136545, + "loss": 1.6321, + "step": 9971 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002521494547312033, + "loss": 1.6393, + "step": 9972 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025214040352750273, + "loss": 1.6368, + "step": 9973 + }, + { + "epoch": 0.78, + "learning_rate": 0.00025213135163032523, + "loss": 1.6984, + "step": 9974 + }, + { + "epoch": 0.78, + "learning_rate": 0.0002521222990397322, + "loss": 1.6534, + "step": 9975 + }, + { + "epoch": 0.78, + "learning_rate": 0.000252113245755785, + "loss": 1.6166, + "step": 9976 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002521041917785453, + "loss": 1.6103, + "step": 9977 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002520951371080745, + "loss": 1.6582, + "step": 9978 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025208608174443403, + "loss": 1.6321, + "step": 9979 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002520770256876854, + "loss": 1.6216, + "step": 9980 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002520679689378902, + "loss": 1.6158, + "step": 9981 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002520589114951097, + "loss": 1.6443, + "step": 9982 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002520498533594055, + "loss": 1.6112, + "step": 9983 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025204079453083916, + "loss": 1.6406, + "step": 9984 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025203173500947207, + "loss": 1.6527, + "step": 9985 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002520226747953659, + "loss": 1.6293, + "step": 9986 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025201361388858205, + "loss": 1.6078, + "step": 9987 + }, + { + "epoch": 0.79, + "learning_rate": 0.000252004552289182, + "loss": 1.6494, + "step": 9988 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002519954899972274, + "loss": 1.6354, + "step": 9989 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002519864270127796, + "loss": 1.6767, + "step": 9990 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002519773633359004, + "loss": 1.6468, + "step": 9991 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025196829896665106, + "loss": 1.6471, + "step": 9992 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025195923390509327, + "loss": 1.6442, + "step": 9993 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025195016815128855, + "loss": 1.6649, + "step": 9994 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025194110170529847, + "loss": 1.6648, + "step": 9995 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002519320345671845, + "loss": 1.6528, + "step": 9996 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002519229667370084, + "loss": 1.6444, + "step": 9997 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002519138982148315, + "loss": 1.599, + "step": 9998 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025190482900071547, + "loss": 1.5904, + "step": 9999 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025189575909472195, + "loss": 1.654, + "step": 10000 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025188668849691236, + "loss": 1.6002, + "step": 10001 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025187761720734845, + "loss": 1.6263, + "step": 10002 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002518685452260917, + "loss": 1.5878, + "step": 10003 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025185947255320376, + "loss": 1.6261, + "step": 10004 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025185039918874626, + "loss": 1.603, + "step": 10005 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002518413251327807, + "loss": 1.5935, + "step": 10006 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025183225038536875, + "loss": 1.6658, + "step": 10007 + }, + { + "epoch": 0.79, + "learning_rate": 0.000251823174946572, + "loss": 1.6301, + "step": 10008 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002518140988164521, + "loss": 1.6646, + "step": 10009 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002518050219950707, + "loss": 1.6806, + "step": 10010 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002517959444824893, + "loss": 1.6207, + "step": 10011 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025178686627876963, + "loss": 1.5972, + "step": 10012 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025177778738397336, + "loss": 1.6324, + "step": 10013 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002517687077981621, + "loss": 1.6589, + "step": 10014 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002517596275213974, + "loss": 1.6607, + "step": 10015 + }, + { + "epoch": 0.79, + "learning_rate": 0.000251750546553741, + "loss": 1.6457, + "step": 10016 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025174146489525455, + "loss": 1.5953, + "step": 10017 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025173238254599966, + "loss": 1.695, + "step": 10018 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002517232995060381, + "loss": 1.6151, + "step": 10019 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002517142157754314, + "loss": 1.6627, + "step": 10020 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002517051313542414, + "loss": 1.6726, + "step": 10021 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002516960462425296, + "loss": 1.6536, + "step": 10022 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025168696044035777, + "loss": 1.6269, + "step": 10023 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025167787394778763, + "loss": 1.6275, + "step": 10024 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025166878676488087, + "loss": 1.6424, + "step": 10025 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002516596988916991, + "loss": 1.6627, + "step": 10026 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002516506103283041, + "loss": 1.6303, + "step": 10027 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025164152107475755, + "loss": 1.6747, + "step": 10028 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025163243113112115, + "loss": 1.588, + "step": 10029 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025162334049745665, + "loss": 1.6829, + "step": 10030 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025161424917382566, + "loss": 1.6407, + "step": 10031 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002516051571602901, + "loss": 1.648, + "step": 10032 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002515960644569116, + "loss": 1.6028, + "step": 10033 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002515869710637518, + "loss": 1.6749, + "step": 10034 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025157787698087253, + "loss": 1.6478, + "step": 10035 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002515687822083356, + "loss": 1.6423, + "step": 10036 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002515596867462027, + "loss": 1.6349, + "step": 10037 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002515505905945355, + "loss": 1.6696, + "step": 10038 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025154149375339584, + "loss": 1.6285, + "step": 10039 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002515323962228455, + "loss": 1.5725, + "step": 10040 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002515232980029462, + "loss": 1.6946, + "step": 10041 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025151419909375975, + "loss": 1.586, + "step": 10042 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002515050994953479, + "loss": 1.6994, + "step": 10043 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002514959992077725, + "loss": 1.6336, + "step": 10044 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002514868982310952, + "loss": 1.605, + "step": 10045 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025147779656537785, + "loss": 1.579, + "step": 10046 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002514686942106823, + "loss": 1.6186, + "step": 10047 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025145959116707026, + "loss": 1.6482, + "step": 10048 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025145048743460365, + "loss": 1.6443, + "step": 10049 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002514413830133442, + "loss": 1.6166, + "step": 10050 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025143227790335376, + "loss": 1.6514, + "step": 10051 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002514231721046941, + "loss": 1.589, + "step": 10052 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002514140656174271, + "loss": 1.6676, + "step": 10053 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002514049584416146, + "loss": 1.6502, + "step": 10054 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025139585057731823, + "loss": 1.6539, + "step": 10055 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025138674202460017, + "loss": 1.6495, + "step": 10056 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002513776327835219, + "loss": 1.6763, + "step": 10057 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002513685228541456, + "loss": 1.5691, + "step": 10058 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025135941223653293, + "loss": 1.6192, + "step": 10059 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002513503009307458, + "loss": 1.6168, + "step": 10060 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025134118893684596, + "loss": 1.5989, + "step": 10061 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025133207625489546, + "loss": 1.6539, + "step": 10062 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025132296288495607, + "loss": 1.6331, + "step": 10063 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025131384882708964, + "loss": 1.6229, + "step": 10064 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025130473408135814, + "loss": 1.6618, + "step": 10065 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025129561864782336, + "loss": 1.6681, + "step": 10066 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002512865025265473, + "loss": 1.6782, + "step": 10067 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002512773857175917, + "loss": 1.6112, + "step": 10068 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025126826822101855, + "loss": 1.6413, + "step": 10069 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002512591500368898, + "loss": 1.6467, + "step": 10070 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002512500311652672, + "loss": 1.6493, + "step": 10071 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002512409116062129, + "loss": 1.6486, + "step": 10072 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025123179135978855, + "loss": 1.5876, + "step": 10073 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025122267042605625, + "loss": 1.626, + "step": 10074 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002512135488050779, + "loss": 1.6247, + "step": 10075 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002512044264969154, + "loss": 1.6778, + "step": 10076 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002511953035016307, + "loss": 1.6138, + "step": 10077 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002511861798192857, + "loss": 1.6636, + "step": 10078 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002511770554499424, + "loss": 1.6899, + "step": 10079 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002511679303936627, + "loss": 1.6298, + "step": 10080 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025115880465050863, + "loss": 1.6691, + "step": 10081 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025114967822054206, + "loss": 1.6169, + "step": 10082 + }, + { + "epoch": 0.79, + "learning_rate": 0.000251140551103825, + "loss": 1.5936, + "step": 10083 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025113142330041943, + "loss": 1.6064, + "step": 10084 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025112229481038726, + "loss": 1.6599, + "step": 10085 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025111316563379056, + "loss": 1.6275, + "step": 10086 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025110403577069125, + "loss": 1.6195, + "step": 10087 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002510949052211514, + "loss": 1.6368, + "step": 10088 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002510857739852328, + "loss": 1.58, + "step": 10089 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025107664206299764, + "loss": 1.6505, + "step": 10090 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002510675094545079, + "loss": 1.6389, + "step": 10091 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025105837615982553, + "loss": 1.5669, + "step": 10092 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025104924217901245, + "loss": 1.6718, + "step": 10093 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002510401075121309, + "loss": 1.6295, + "step": 10094 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025103097215924277, + "loss": 1.6544, + "step": 10095 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025102183612041003, + "loss": 1.6742, + "step": 10096 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002510126993956948, + "loss": 1.603, + "step": 10097 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025100356198515906, + "loss": 1.6313, + "step": 10098 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025099442388886497, + "loss": 1.5884, + "step": 10099 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025098528510687437, + "loss": 1.6543, + "step": 10100 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025097614563924944, + "loss": 1.6313, + "step": 10101 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002509670054860522, + "loss": 1.6464, + "step": 10102 + }, + { + "epoch": 0.79, + "learning_rate": 0.0002509578646473447, + "loss": 1.606, + "step": 10103 + }, + { + "epoch": 0.79, + "learning_rate": 0.00025094872312318906, + "loss": 1.6089, + "step": 10104 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002509395809136473, + "loss": 1.6314, + "step": 10105 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002509304380187814, + "loss": 1.6213, + "step": 10106 + }, + { + "epoch": 0.8, + "learning_rate": 0.00025092129443865367, + "loss": 1.6265, + "step": 10107 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002509121501733259, + "loss": 1.6282, + "step": 10108 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002509030052228604, + "loss": 1.6688, + "step": 10109 + }, + { + "epoch": 0.8, + "learning_rate": 0.00025089385958731916, + "loss": 1.6208, + "step": 10110 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002508847132667643, + "loss": 1.6259, + "step": 10111 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002508755662612579, + "loss": 1.67, + "step": 10112 + }, + { + "epoch": 0.8, + "learning_rate": 0.00025086641857086203, + "loss": 1.6712, + "step": 10113 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002508572701956389, + "loss": 1.6967, + "step": 10114 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002508481211356506, + "loss": 1.6542, + "step": 10115 + }, + { + "epoch": 0.8, + "learning_rate": 0.00025083897139095907, + "loss": 1.6085, + "step": 10116 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002508298209616267, + "loss": 1.6193, + "step": 10117 + }, + { + "epoch": 0.8, + "learning_rate": 0.00025082066984771545, + "loss": 1.5484, + "step": 10118 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002508115180492874, + "loss": 1.6168, + "step": 10119 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002508023655664049, + "loss": 1.6547, + "step": 10120 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002507932123991299, + "loss": 1.5679, + "step": 10121 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002507840585475247, + "loss": 1.5841, + "step": 10122 + }, + { + "epoch": 0.8, + "learning_rate": 0.00025077490401165123, + "loss": 1.6318, + "step": 10123 + }, + { + "epoch": 0.8, + "learning_rate": 0.00025076574879157184, + "loss": 1.656, + "step": 10124 + }, + { + "epoch": 0.8, + "learning_rate": 0.00025075659288734863, + "loss": 1.6334, + "step": 10125 + }, + { + "epoch": 0.8, + "learning_rate": 0.00025074743629904377, + "loss": 1.5925, + "step": 10126 + }, + { + "epoch": 0.8, + "learning_rate": 0.00025073827902671934, + "loss": 1.689, + "step": 10127 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002507291210704377, + "loss": 1.6409, + "step": 10128 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002507199624302608, + "loss": 1.6264, + "step": 10129 + }, + { + "epoch": 0.8, + "learning_rate": 0.00025071080310625095, + "loss": 1.6052, + "step": 10130 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002507016430984704, + "loss": 1.6008, + "step": 10131 + }, + { + "epoch": 0.8, + "learning_rate": 0.00025069248240698123, + "loss": 1.5993, + "step": 10132 + }, + { + "epoch": 0.8, + "learning_rate": 0.00025068332103184566, + "loss": 1.6479, + "step": 10133 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002506741589731259, + "loss": 1.6592, + "step": 10134 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002506649962308842, + "loss": 1.6674, + "step": 10135 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002506558328051827, + "loss": 1.6219, + "step": 10136 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002506466686960836, + "loss": 1.5928, + "step": 10137 + }, + { + "epoch": 0.8, + "learning_rate": 0.00025063750390364923, + "loss": 1.6456, + "step": 10138 + }, + { + "epoch": 0.8, + "learning_rate": 0.00025062833842794173, + "loss": 1.6035, + "step": 10139 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002506191722690233, + "loss": 1.6215, + "step": 10140 + }, + { + "epoch": 0.8, + "learning_rate": 0.00025061000542695626, + "loss": 1.6035, + "step": 10141 + }, + { + "epoch": 0.8, + "learning_rate": 0.00025060083790180276, + "loss": 1.6415, + "step": 10142 + }, + { + "epoch": 0.8, + "learning_rate": 0.00025059166969362514, + "loss": 1.6273, + "step": 10143 + }, + { + "epoch": 0.8, + "learning_rate": 0.00025058250080248553, + "loss": 1.6016, + "step": 10144 + }, + { + "epoch": 0.8, + "learning_rate": 0.00025057333122844634, + "loss": 1.6676, + "step": 10145 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002505641609715696, + "loss": 1.6379, + "step": 10146 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002505549900319178, + "loss": 1.6112, + "step": 10147 + }, + { + "epoch": 0.8, + "learning_rate": 0.00025054581840955315, + "loss": 1.6722, + "step": 10148 + }, + { + "epoch": 0.8, + "learning_rate": 0.00025053664610453775, + "loss": 1.6416, + "step": 10149 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002505274731169341, + "loss": 1.6447, + "step": 10150 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002505182994468043, + "loss": 1.5935, + "step": 10151 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002505091250942108, + "loss": 1.6231, + "step": 10152 + }, + { + "epoch": 0.8, + "learning_rate": 0.00025049995005921576, + "loss": 1.6422, + "step": 10153 + }, + { + "epoch": 0.8, + "learning_rate": 0.00025049077434188155, + "loss": 1.6101, + "step": 10154 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002504815979422704, + "loss": 1.6412, + "step": 10155 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002504724208604447, + "loss": 1.6513, + "step": 10156 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002504632430964667, + "loss": 1.653, + "step": 10157 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002504540646503987, + "loss": 1.6498, + "step": 10158 + }, + { + "epoch": 0.8, + "learning_rate": 0.000250444885522303, + "loss": 1.5949, + "step": 10159 + }, + { + "epoch": 0.8, + "learning_rate": 0.000250435705712242, + "loss": 1.6507, + "step": 10160 + }, + { + "epoch": 0.8, + "learning_rate": 0.00025042652522027796, + "loss": 1.6116, + "step": 10161 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002504173440464733, + "loss": 1.6095, + "step": 10162 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002504081621908902, + "loss": 1.609, + "step": 10163 + }, + { + "epoch": 0.8, + "learning_rate": 0.00025039897965359114, + "loss": 1.601, + "step": 10164 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002503897964346384, + "loss": 1.5861, + "step": 10165 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002503806125340943, + "loss": 1.5656, + "step": 10166 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002503714279520213, + "loss": 1.6471, + "step": 10167 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002503622426884817, + "loss": 1.6659, + "step": 10168 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002503530567435378, + "loss": 1.6197, + "step": 10169 + }, + { + "epoch": 0.8, + "learning_rate": 0.00025034387011725205, + "loss": 1.6274, + "step": 10170 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002503346828096868, + "loss": 1.6228, + "step": 10171 + }, + { + "epoch": 0.8, + "learning_rate": 0.00025032549482090444, + "loss": 1.6337, + "step": 10172 + }, + { + "epoch": 0.8, + "learning_rate": 0.00025031630615096726, + "loss": 1.6254, + "step": 10173 + }, + { + "epoch": 0.8, + "learning_rate": 0.00025030711679993785, + "loss": 1.6521, + "step": 10174 + }, + { + "epoch": 0.8, + "learning_rate": 0.00025029792676787833, + "loss": 1.6457, + "step": 10175 + }, + { + "epoch": 0.8, + "learning_rate": 0.00025028873605485133, + "loss": 1.6417, + "step": 10176 + }, + { + "epoch": 0.8, + "learning_rate": 0.00025027954466091913, + "loss": 1.5928, + "step": 10177 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002502703525861442, + "loss": 1.613, + "step": 10178 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002502611598305888, + "loss": 1.6554, + "step": 10179 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002502519663943156, + "loss": 1.6299, + "step": 10180 + }, + { + "epoch": 0.8, + "learning_rate": 0.00025024277227738676, + "loss": 1.6315, + "step": 10181 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002502335774798648, + "loss": 1.6219, + "step": 10182 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002502243820018123, + "loss": 1.6696, + "step": 10183 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002502151858432914, + "loss": 1.6736, + "step": 10184 + }, + { + "epoch": 0.8, + "learning_rate": 0.00025020598900436477, + "loss": 1.602, + "step": 10185 + }, + { + "epoch": 0.8, + "learning_rate": 0.00025019679148509475, + "loss": 1.6459, + "step": 10186 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002501875932855438, + "loss": 1.6394, + "step": 10187 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002501783944057744, + "loss": 1.6569, + "step": 10188 + }, + { + "epoch": 0.8, + "learning_rate": 0.000250169194845849, + "loss": 1.6204, + "step": 10189 + }, + { + "epoch": 0.8, + "learning_rate": 0.00025015999460583, + "loss": 1.6379, + "step": 10190 + }, + { + "epoch": 0.8, + "learning_rate": 0.00025015079368577995, + "loss": 1.7212, + "step": 10191 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002501415920857613, + "loss": 1.6307, + "step": 10192 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002501323898058365, + "loss": 1.6606, + "step": 10193 + }, + { + "epoch": 0.8, + "learning_rate": 0.00025012318684606796, + "loss": 1.6279, + "step": 10194 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002501139832065183, + "loss": 1.6407, + "step": 10195 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002501047788872499, + "loss": 1.6133, + "step": 10196 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002500955738883253, + "loss": 1.5868, + "step": 10197 + }, + { + "epoch": 0.8, + "learning_rate": 0.00025008636820980705, + "loss": 1.6254, + "step": 10198 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002500771618517575, + "loss": 1.6394, + "step": 10199 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002500679548142393, + "loss": 1.6037, + "step": 10200 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002500587470973149, + "loss": 1.6315, + "step": 10201 + }, + { + "epoch": 0.8, + "learning_rate": 0.00025004953870104684, + "loss": 1.6575, + "step": 10202 + }, + { + "epoch": 0.8, + "learning_rate": 0.00025004032962549756, + "loss": 1.6316, + "step": 10203 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002500311198707297, + "loss": 1.6834, + "step": 10204 + }, + { + "epoch": 0.8, + "learning_rate": 0.00025002190943680577, + "loss": 1.6102, + "step": 10205 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002500126983237882, + "loss": 1.6391, + "step": 10206 + }, + { + "epoch": 0.8, + "learning_rate": 0.00025000348653173964, + "loss": 1.6632, + "step": 10207 + }, + { + "epoch": 0.8, + "learning_rate": 0.00024999427406072265, + "loss": 1.644, + "step": 10208 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002499850609107996, + "loss": 1.5916, + "step": 10209 + }, + { + "epoch": 0.8, + "learning_rate": 0.00024997584708203325, + "loss": 1.613, + "step": 10210 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002499666325744861, + "loss": 1.6362, + "step": 10211 + }, + { + "epoch": 0.8, + "learning_rate": 0.00024995741738822054, + "loss": 1.602, + "step": 10212 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002499482015232994, + "loss": 1.6242, + "step": 10213 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002499389849797851, + "loss": 1.6291, + "step": 10214 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002499297677577402, + "loss": 1.6223, + "step": 10215 + }, + { + "epoch": 0.8, + "learning_rate": 0.00024992054985722734, + "loss": 1.6419, + "step": 10216 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002499113312783091, + "loss": 1.5666, + "step": 10217 + }, + { + "epoch": 0.8, + "learning_rate": 0.00024990211202104807, + "loss": 1.6546, + "step": 10218 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002498928920855068, + "loss": 1.5836, + "step": 10219 + }, + { + "epoch": 0.8, + "learning_rate": 0.00024988367147174795, + "loss": 1.6507, + "step": 10220 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002498744501798341, + "loss": 1.6941, + "step": 10221 + }, + { + "epoch": 0.8, + "learning_rate": 0.00024986522820982776, + "loss": 1.645, + "step": 10222 + }, + { + "epoch": 0.8, + "learning_rate": 0.00024985600556179176, + "loss": 1.6526, + "step": 10223 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002498467822357885, + "loss": 1.6633, + "step": 10224 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002498375582318807, + "loss": 1.6638, + "step": 10225 + }, + { + "epoch": 0.8, + "learning_rate": 0.000249828333550131, + "loss": 1.6014, + "step": 10226 + }, + { + "epoch": 0.8, + "learning_rate": 0.00024981910819060196, + "loss": 1.6581, + "step": 10227 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002498098821533563, + "loss": 1.6274, + "step": 10228 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002498006554384566, + "loss": 1.6462, + "step": 10229 + }, + { + "epoch": 0.8, + "learning_rate": 0.00024979142804596556, + "loss": 1.6353, + "step": 10230 + }, + { + "epoch": 0.8, + "learning_rate": 0.0002497821999759458, + "loss": 1.6946, + "step": 10231 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002497729712284599, + "loss": 1.5386, + "step": 10232 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002497637418035706, + "loss": 1.621, + "step": 10233 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024975451170134057, + "loss": 1.6191, + "step": 10234 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024974528092183246, + "loss": 1.6295, + "step": 10235 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002497360494651089, + "loss": 1.6314, + "step": 10236 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024972681733123267, + "loss": 1.6444, + "step": 10237 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024971758452026633, + "loss": 1.634, + "step": 10238 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002497083510322726, + "loss": 1.6913, + "step": 10239 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024969911686731426, + "loss": 1.6672, + "step": 10240 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002496898820254539, + "loss": 1.6124, + "step": 10241 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002496806465067543, + "loss": 1.6211, + "step": 10242 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024967141031127804, + "loss": 1.6096, + "step": 10243 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002496621734390879, + "loss": 1.6653, + "step": 10244 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024965293589024665, + "loss": 1.6133, + "step": 10245 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024964369766481694, + "loss": 1.5657, + "step": 10246 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002496344587628615, + "loss": 1.6451, + "step": 10247 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002496252191844431, + "loss": 1.6769, + "step": 10248 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024961597892962444, + "loss": 1.5898, + "step": 10249 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024960673799846825, + "loss": 1.6459, + "step": 10250 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024959749639103727, + "loss": 1.6452, + "step": 10251 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002495882541073942, + "loss": 1.6829, + "step": 10252 + }, + { + "epoch": 0.81, + "learning_rate": 0.000249579011147602, + "loss": 1.623, + "step": 10253 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002495697675117231, + "loss": 1.65, + "step": 10254 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024956052319982045, + "loss": 1.6303, + "step": 10255 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002495512782119569, + "loss": 1.6017, + "step": 10256 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024954203254819505, + "loss": 1.5902, + "step": 10257 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024953278620859764, + "loss": 1.6055, + "step": 10258 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024952353919322764, + "loss": 1.6643, + "step": 10259 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024951429150214767, + "loss": 1.6386, + "step": 10260 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002495050431354206, + "loss": 1.6394, + "step": 10261 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024949579409310927, + "loss": 1.6698, + "step": 10262 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002494865443752763, + "loss": 1.6076, + "step": 10263 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024947729398198465, + "loss": 1.6299, + "step": 10264 + }, + { + "epoch": 0.81, + "learning_rate": 0.000249468042913297, + "loss": 1.6926, + "step": 10265 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024945879116927634, + "loss": 1.5842, + "step": 10266 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002494495387499853, + "loss": 1.5986, + "step": 10267 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002494402856554868, + "loss": 1.6211, + "step": 10268 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002494310318858437, + "loss": 1.6445, + "step": 10269 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024942177744111864, + "loss": 1.6264, + "step": 10270 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024941252232137465, + "loss": 1.5929, + "step": 10271 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002494032665266744, + "loss": 1.5775, + "step": 10272 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024939401005708093, + "loss": 1.5879, + "step": 10273 + }, + { + "epoch": 0.81, + "learning_rate": 0.000249384752912657, + "loss": 1.6206, + "step": 10274 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024937549509346533, + "loss": 1.5847, + "step": 10275 + }, + { + "epoch": 0.81, + "learning_rate": 0.000249366236599569, + "loss": 1.6303, + "step": 10276 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002493569774310307, + "loss": 1.591, + "step": 10277 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002493477175879134, + "loss": 1.6504, + "step": 10278 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024933845707027984, + "loss": 1.653, + "step": 10279 + }, + { + "epoch": 0.81, + "learning_rate": 0.000249329195878193, + "loss": 1.5981, + "step": 10280 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002493199340117158, + "loss": 1.6321, + "step": 10281 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024931067147091103, + "loss": 1.5791, + "step": 10282 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002493014082558415, + "loss": 1.6164, + "step": 10283 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024929214436657037, + "loss": 1.6462, + "step": 10284 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024928287980316026, + "loss": 1.6594, + "step": 10285 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002492736145656742, + "loss": 1.5804, + "step": 10286 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002492643486541751, + "loss": 1.7146, + "step": 10287 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002492550820687259, + "loss": 1.6673, + "step": 10288 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024924581480938944, + "loss": 1.5741, + "step": 10289 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024923654687622867, + "loss": 1.5524, + "step": 10290 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002492272782693064, + "loss": 1.6475, + "step": 10291 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002492180089886858, + "loss": 1.5954, + "step": 10292 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024920873903442963, + "loss": 1.6295, + "step": 10293 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024919946840660086, + "loss": 1.5909, + "step": 10294 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024919019710526244, + "loss": 1.6308, + "step": 10295 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002491809251304773, + "loss": 1.59, + "step": 10296 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002491716524823085, + "loss": 1.6316, + "step": 10297 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024916237916081883, + "loss": 1.6635, + "step": 10298 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024915310516607133, + "loss": 1.5833, + "step": 10299 + }, + { + "epoch": 0.81, + "learning_rate": 0.000249143830498129, + "loss": 1.6275, + "step": 10300 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024913455515705474, + "loss": 1.6459, + "step": 10301 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002491252791429116, + "loss": 1.6657, + "step": 10302 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002491160024557625, + "loss": 1.651, + "step": 10303 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002491067250956704, + "loss": 1.6584, + "step": 10304 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002490974470626984, + "loss": 1.5902, + "step": 10305 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002490881683569093, + "loss": 1.5894, + "step": 10306 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002490788889783663, + "loss": 1.6923, + "step": 10307 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024906960892713233, + "loss": 1.6321, + "step": 10308 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024906032820327034, + "loss": 1.6504, + "step": 10309 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002490510468068435, + "loss": 1.6041, + "step": 10310 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024904176473791457, + "loss": 1.5962, + "step": 10311 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002490324819965468, + "loss": 1.633, + "step": 10312 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002490231985828031, + "loss": 1.684, + "step": 10313 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002490139144967465, + "loss": 1.6404, + "step": 10314 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002490046297384401, + "loss": 1.5674, + "step": 10315 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002489953443079469, + "loss": 1.6638, + "step": 10316 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002489860582053299, + "loss": 1.6151, + "step": 10317 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024897677143065225, + "loss": 1.5942, + "step": 10318 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002489674839839769, + "loss": 1.6343, + "step": 10319 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024895819586536697, + "loss": 1.6573, + "step": 10320 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002489489070748855, + "loss": 1.6239, + "step": 10321 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024893961761259556, + "loss": 1.6005, + "step": 10322 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002489303274785602, + "loss": 1.5907, + "step": 10323 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024892103667284254, + "loss": 1.6033, + "step": 10324 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024891174519550555, + "loss": 1.5833, + "step": 10325 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024890245304661244, + "loss": 1.5881, + "step": 10326 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024889316022622625, + "loss": 1.6523, + "step": 10327 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002488838667344101, + "loss": 1.6488, + "step": 10328 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002488745725712271, + "loss": 1.6693, + "step": 10329 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002488652777367402, + "loss": 1.6297, + "step": 10330 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002488559822310127, + "loss": 1.61, + "step": 10331 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024884668605410767, + "loss": 1.609, + "step": 10332 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002488373892060881, + "loss": 1.5955, + "step": 10333 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024882809168701723, + "loss": 1.5537, + "step": 10334 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024881879349695823, + "loss": 1.6213, + "step": 10335 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024880949463597406, + "loss": 1.5846, + "step": 10336 + }, + { + "epoch": 0.81, + "learning_rate": 0.000248800195104128, + "loss": 1.6184, + "step": 10337 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002487908949014831, + "loss": 1.6538, + "step": 10338 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024878159402810253, + "loss": 1.5953, + "step": 10339 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002487722924840495, + "loss": 1.6489, + "step": 10340 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002487629902693871, + "loss": 1.6203, + "step": 10341 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002487536873841785, + "loss": 1.6155, + "step": 10342 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002487443838284868, + "loss": 1.6888, + "step": 10343 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002487350796023753, + "loss": 1.6329, + "step": 10344 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002487257747059071, + "loss": 1.6105, + "step": 10345 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002487164691391453, + "loss": 1.6389, + "step": 10346 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024870716290215317, + "loss": 1.6382, + "step": 10347 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002486978559949939, + "loss": 1.6708, + "step": 10348 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024868854841773066, + "loss": 1.6504, + "step": 10349 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024867924017042665, + "loss": 1.6178, + "step": 10350 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024866993125314505, + "loss": 1.6635, + "step": 10351 + }, + { + "epoch": 0.81, + "learning_rate": 0.000248660621665949, + "loss": 1.6435, + "step": 10352 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024865131140890183, + "loss": 1.6513, + "step": 10353 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002486420004820667, + "loss": 1.6711, + "step": 10354 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024863268888550684, + "loss": 1.6316, + "step": 10355 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024862337661928535, + "loss": 1.5965, + "step": 10356 + }, + { + "epoch": 0.81, + "learning_rate": 0.00024861406368346565, + "loss": 1.5897, + "step": 10357 + }, + { + "epoch": 0.81, + "learning_rate": 0.0002486047500781109, + "loss": 1.6115, + "step": 10358 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024859543580328425, + "loss": 1.6249, + "step": 10359 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024858612085904903, + "loss": 1.6275, + "step": 10360 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002485768052454684, + "loss": 1.6167, + "step": 10361 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002485674889626057, + "loss": 1.6526, + "step": 10362 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024855817201052417, + "loss": 1.6357, + "step": 10363 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024854885438928704, + "loss": 1.6354, + "step": 10364 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024853953609895753, + "loss": 1.6685, + "step": 10365 + }, + { + "epoch": 0.82, + "learning_rate": 0.000248530217139599, + "loss": 1.5874, + "step": 10366 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002485208975112746, + "loss": 1.6174, + "step": 10367 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024851157721404775, + "loss": 1.6466, + "step": 10368 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002485022562479816, + "loss": 1.6589, + "step": 10369 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002484929346131395, + "loss": 1.6488, + "step": 10370 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024848361230958473, + "loss": 1.6246, + "step": 10371 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002484742893373806, + "loss": 1.6233, + "step": 10372 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002484649656965904, + "loss": 1.6057, + "step": 10373 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002484556413872774, + "loss": 1.6329, + "step": 10374 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002484463164095049, + "loss": 1.6548, + "step": 10375 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002484369907633362, + "loss": 1.561, + "step": 10376 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002484276644488347, + "loss": 1.6881, + "step": 10377 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024841833746606375, + "loss": 1.6296, + "step": 10378 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002484090098150865, + "loss": 1.6959, + "step": 10379 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024839968149596643, + "loss": 1.5989, + "step": 10380 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024839035250876683, + "loss": 1.6362, + "step": 10381 + }, + { + "epoch": 0.82, + "learning_rate": 0.000248381022853551, + "loss": 1.5572, + "step": 10382 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002483716925303824, + "loss": 1.6238, + "step": 10383 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024836236153932416, + "loss": 1.6682, + "step": 10384 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002483530298804398, + "loss": 1.6107, + "step": 10385 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002483436975537927, + "loss": 1.6678, + "step": 10386 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002483343645594461, + "loss": 1.6359, + "step": 10387 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002483250308974635, + "loss": 1.6547, + "step": 10388 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002483156965679082, + "loss": 1.6564, + "step": 10389 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024830636157084353, + "loss": 1.6306, + "step": 10390 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024829702590633293, + "loss": 1.5826, + "step": 10391 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002482876895744398, + "loss": 1.6388, + "step": 10392 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002482783525752274, + "loss": 1.6416, + "step": 10393 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002482690149087593, + "loss": 1.5643, + "step": 10394 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002482596765750988, + "loss": 1.621, + "step": 10395 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002482503375743093, + "loss": 1.6226, + "step": 10396 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002482409979064543, + "loss": 1.6402, + "step": 10397 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024823165757159707, + "loss": 1.6264, + "step": 10398 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002482223165698011, + "loss": 1.6129, + "step": 10399 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024821297490112986, + "loss": 1.6707, + "step": 10400 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024820363256564663, + "loss": 1.5628, + "step": 10401 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024819428956341494, + "loss": 1.6365, + "step": 10402 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002481849458944983, + "loss": 1.6021, + "step": 10403 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024817560155896, + "loss": 1.6001, + "step": 10404 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024816625655686356, + "loss": 1.5812, + "step": 10405 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002481569108882724, + "loss": 1.6191, + "step": 10406 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024814756455324995, + "loss": 1.62, + "step": 10407 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024813821755185973, + "loss": 1.6198, + "step": 10408 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002481288698841652, + "loss": 1.6742, + "step": 10409 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024811952155022975, + "loss": 1.5715, + "step": 10410 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024811017255011694, + "loss": 1.6134, + "step": 10411 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002481008228838901, + "loss": 1.6122, + "step": 10412 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024809147255161295, + "loss": 1.6376, + "step": 10413 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024808212155334877, + "loss": 1.6379, + "step": 10414 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024807276988916106, + "loss": 1.6737, + "step": 10415 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002480634175591134, + "loss": 1.604, + "step": 10416 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002480540645632693, + "loss": 1.666, + "step": 10417 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024804471090169217, + "loss": 1.6892, + "step": 10418 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024803535657444555, + "loss": 1.6135, + "step": 10419 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024802600158159297, + "loss": 1.6464, + "step": 10420 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024801664592319795, + "loss": 1.5874, + "step": 10421 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002480072895993239, + "loss": 1.632, + "step": 10422 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024799793261003457, + "loss": 1.5667, + "step": 10423 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002479885749553933, + "loss": 1.6417, + "step": 10424 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002479792166354637, + "loss": 1.704, + "step": 10425 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002479698576503093, + "loss": 1.6589, + "step": 10426 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024796049799999354, + "loss": 1.6197, + "step": 10427 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024795113768458015, + "loss": 1.6582, + "step": 10428 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024794177670413255, + "loss": 1.5955, + "step": 10429 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024793241505871436, + "loss": 1.656, + "step": 10430 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002479230527483891, + "loss": 1.602, + "step": 10431 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024791368977322036, + "loss": 1.6424, + "step": 10432 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024790432613327166, + "loss": 1.6084, + "step": 10433 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024789496182860664, + "loss": 1.6183, + "step": 10434 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024788559685928887, + "loss": 1.6459, + "step": 10435 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002478762312253819, + "loss": 1.5827, + "step": 10436 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024786686492694936, + "loss": 1.6309, + "step": 10437 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024785749796405474, + "loss": 1.6323, + "step": 10438 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002478481303367618, + "loss": 1.6207, + "step": 10439 + }, + { + "epoch": 0.82, + "learning_rate": 0.000247838762045134, + "loss": 1.6147, + "step": 10440 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024782939308923497, + "loss": 1.5662, + "step": 10441 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024782002346912844, + "loss": 1.6108, + "step": 10442 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002478106531848778, + "loss": 1.5805, + "step": 10443 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002478012822365469, + "loss": 1.6186, + "step": 10444 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002477919106241993, + "loss": 1.626, + "step": 10445 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024778253834789853, + "loss": 1.6657, + "step": 10446 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024777316540770827, + "loss": 1.6604, + "step": 10447 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002477637918036922, + "loss": 1.6212, + "step": 10448 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002477544175359139, + "loss": 1.6588, + "step": 10449 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024774504260443713, + "loss": 1.599, + "step": 10450 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002477356670093254, + "loss": 1.6432, + "step": 10451 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002477262907506424, + "loss": 1.5343, + "step": 10452 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002477169138284519, + "loss": 1.6062, + "step": 10453 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002477075362428174, + "loss": 1.6556, + "step": 10454 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002476981579938027, + "loss": 1.5922, + "step": 10455 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002476887790814714, + "loss": 1.6326, + "step": 10456 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002476793995058872, + "loss": 1.623, + "step": 10457 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002476700192671138, + "loss": 1.6714, + "step": 10458 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002476606383652148, + "loss": 1.6145, + "step": 10459 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024765125680025407, + "loss": 1.6241, + "step": 10460 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002476418745722951, + "loss": 1.6531, + "step": 10461 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002476324916814017, + "loss": 1.5746, + "step": 10462 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002476231081276376, + "loss": 1.7025, + "step": 10463 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024761372391106644, + "loss": 1.5585, + "step": 10464 + }, + { + "epoch": 0.82, + "learning_rate": 0.000247604339031752, + "loss": 1.6161, + "step": 10465 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002475949534897579, + "loss": 1.6408, + "step": 10466 + }, + { + "epoch": 0.82, + "learning_rate": 0.000247585567285148, + "loss": 1.6947, + "step": 10467 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002475761804179859, + "loss": 1.6043, + "step": 10468 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024756679288833535, + "loss": 1.6242, + "step": 10469 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002475574046962602, + "loss": 1.6444, + "step": 10470 + }, + { + "epoch": 0.82, + "learning_rate": 0.000247548015841824, + "loss": 1.6158, + "step": 10471 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002475386263250907, + "loss": 1.6472, + "step": 10472 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002475292361461239, + "loss": 1.6665, + "step": 10473 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024751984530498744, + "loss": 1.6441, + "step": 10474 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024751045380174504, + "loss": 1.5899, + "step": 10475 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024750106163646044, + "loss": 1.5887, + "step": 10476 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024749166880919744, + "loss": 1.6362, + "step": 10477 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024748227532001986, + "loss": 1.5889, + "step": 10478 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002474728811689914, + "loss": 1.586, + "step": 10479 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024746348635617583, + "loss": 1.615, + "step": 10480 + }, + { + "epoch": 0.82, + "learning_rate": 0.000247454090881637, + "loss": 1.6085, + "step": 10481 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024744469474543873, + "loss": 1.6911, + "step": 10482 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002474352979476447, + "loss": 1.6556, + "step": 10483 + }, + { + "epoch": 0.82, + "learning_rate": 0.00024742590048831874, + "loss": 1.6309, + "step": 10484 + }, + { + "epoch": 0.82, + "learning_rate": 0.0002474165023675247, + "loss": 1.696, + "step": 10485 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002474071035853264, + "loss": 1.6186, + "step": 10486 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002473977041417876, + "loss": 1.6554, + "step": 10487 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002473883040369721, + "loss": 1.571, + "step": 10488 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002473789032709438, + "loss": 1.6298, + "step": 10489 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002473695018437665, + "loss": 1.5881, + "step": 10490 + }, + { + "epoch": 0.83, + "learning_rate": 0.000247360099755504, + "loss": 1.6179, + "step": 10491 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002473506970062202, + "loss": 1.6041, + "step": 10492 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002473412935959788, + "loss": 1.641, + "step": 10493 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024733188952484375, + "loss": 1.6003, + "step": 10494 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002473224847928789, + "loss": 1.6533, + "step": 10495 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024731307940014806, + "loss": 1.6206, + "step": 10496 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002473036733467152, + "loss": 1.6211, + "step": 10497 + }, + { + "epoch": 0.83, + "learning_rate": 0.000247294266632644, + "loss": 1.6474, + "step": 10498 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002472848592579985, + "loss": 1.6377, + "step": 10499 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024727545122284244, + "loss": 1.6255, + "step": 10500 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002472660425272397, + "loss": 1.5508, + "step": 10501 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002472566331712543, + "loss": 1.6346, + "step": 10502 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024724722315494995, + "loss": 1.5986, + "step": 10503 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002472378124783907, + "loss": 1.5762, + "step": 10504 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002472284011416403, + "loss": 1.5907, + "step": 10505 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024721898914476274, + "loss": 1.5958, + "step": 10506 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002472095764878219, + "loss": 1.6476, + "step": 10507 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002472001631708817, + "loss": 1.6862, + "step": 10508 + }, + { + "epoch": 0.83, + "learning_rate": 0.000247190749194006, + "loss": 1.6772, + "step": 10509 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024718133455725876, + "loss": 1.605, + "step": 10510 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002471719192607038, + "loss": 1.6246, + "step": 10511 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024716250330440525, + "loss": 1.6305, + "step": 10512 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024715308668842685, + "loss": 1.6475, + "step": 10513 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024714366941283264, + "loss": 1.5987, + "step": 10514 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024713425147768653, + "loss": 1.6348, + "step": 10515 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002471248328830525, + "loss": 1.6646, + "step": 10516 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024711541362899435, + "loss": 1.6414, + "step": 10517 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002471059937155762, + "loss": 1.6121, + "step": 10518 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024709657314286187, + "loss": 1.6139, + "step": 10519 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002470871519109155, + "loss": 1.6175, + "step": 10520 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024707773001980086, + "loss": 1.6037, + "step": 10521 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024706830746958205, + "loss": 1.631, + "step": 10522 + }, + { + "epoch": 0.83, + "learning_rate": 0.000247058884260323, + "loss": 1.5745, + "step": 10523 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002470494603920877, + "loss": 1.6489, + "step": 10524 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024704003586494005, + "loss": 1.6287, + "step": 10525 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024703061067894407, + "loss": 1.6327, + "step": 10526 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002470211848341639, + "loss": 1.5643, + "step": 10527 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002470117583306634, + "loss": 1.6344, + "step": 10528 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024700233116850664, + "loss": 1.6104, + "step": 10529 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002469929033477575, + "loss": 1.5754, + "step": 10530 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024698347486848014, + "loss": 1.6104, + "step": 10531 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024697404573073843, + "loss": 1.6257, + "step": 10532 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024696461593459653, + "loss": 1.6036, + "step": 10533 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024695518548011833, + "loss": 1.5932, + "step": 10534 + }, + { + "epoch": 0.83, + "learning_rate": 0.000246945754367368, + "loss": 1.6235, + "step": 10535 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002469363225964094, + "loss": 1.6138, + "step": 10536 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024692689016730674, + "loss": 1.6864, + "step": 10537 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024691745708012395, + "loss": 1.615, + "step": 10538 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002469080233349252, + "loss": 1.5858, + "step": 10539 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024689858893177434, + "loss": 1.6444, + "step": 10540 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024688915387073557, + "loss": 1.6261, + "step": 10541 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002468797181518729, + "loss": 1.612, + "step": 10542 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024687028177525043, + "loss": 1.5781, + "step": 10543 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002468608447409322, + "loss": 1.6224, + "step": 10544 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002468514070489823, + "loss": 1.6185, + "step": 10545 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024684196869946475, + "loss": 1.5924, + "step": 10546 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002468325296924437, + "loss": 1.6439, + "step": 10547 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024682309002798324, + "loss": 1.6115, + "step": 10548 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002468136497061474, + "loss": 1.6478, + "step": 10549 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002468042087270003, + "loss": 1.6429, + "step": 10550 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024679476709060604, + "loss": 1.6017, + "step": 10551 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002467853247970287, + "loss": 1.5684, + "step": 10552 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002467758818463325, + "loss": 1.6515, + "step": 10553 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024676643823858137, + "loss": 1.6213, + "step": 10554 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002467569939738396, + "loss": 1.6192, + "step": 10555 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002467475490521712, + "loss": 1.5982, + "step": 10556 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024673810347364034, + "loss": 1.6295, + "step": 10557 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002467286572383111, + "loss": 1.6645, + "step": 10558 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024671921034624775, + "loss": 1.6792, + "step": 10559 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024670976279751424, + "loss": 1.6391, + "step": 10560 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002467003145921749, + "loss": 1.6445, + "step": 10561 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024669086573029375, + "loss": 1.5876, + "step": 10562 + }, + { + "epoch": 0.83, + "learning_rate": 0.000246681416211935, + "loss": 1.6571, + "step": 10563 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002466719660371627, + "loss": 1.6069, + "step": 10564 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002466625152060412, + "loss": 1.6412, + "step": 10565 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024665306371863453, + "loss": 1.5863, + "step": 10566 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024664361157500684, + "loss": 1.6378, + "step": 10567 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024663415877522243, + "loss": 1.6003, + "step": 10568 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002466247053193454, + "loss": 1.6358, + "step": 10569 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024661525120743994, + "loss": 1.5882, + "step": 10570 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024660579643957017, + "loss": 1.6512, + "step": 10571 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002465963410158004, + "loss": 1.5953, + "step": 10572 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002465868849361948, + "loss": 1.5958, + "step": 10573 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024657742820081757, + "loss": 1.643, + "step": 10574 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002465679708097329, + "loss": 1.622, + "step": 10575 + }, + { + "epoch": 0.83, + "learning_rate": 0.000246558512763005, + "loss": 1.5472, + "step": 10576 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024654905406069807, + "loss": 1.615, + "step": 10577 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002465395947028763, + "loss": 1.562, + "step": 10578 + }, + { + "epoch": 0.83, + "learning_rate": 0.000246530134689604, + "loss": 1.6205, + "step": 10579 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002465206740209453, + "loss": 1.6268, + "step": 10580 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002465112126969645, + "loss": 1.62, + "step": 10581 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002465017507177259, + "loss": 1.6576, + "step": 10582 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024649228808329367, + "loss": 1.62, + "step": 10583 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002464828247937319, + "loss": 1.6337, + "step": 10584 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024647336084910514, + "loss": 1.6303, + "step": 10585 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024646389624947745, + "loss": 1.5828, + "step": 10586 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002464544309949132, + "loss": 1.6597, + "step": 10587 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002464449650854765, + "loss": 1.6094, + "step": 10588 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024643549852123176, + "loss": 1.5932, + "step": 10589 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002464260313022432, + "loss": 1.5889, + "step": 10590 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024641656342857507, + "loss": 1.6032, + "step": 10591 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002464070949002917, + "loss": 1.6832, + "step": 10592 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002463976257174574, + "loss": 1.6094, + "step": 10593 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002463881558801363, + "loss": 1.642, + "step": 10594 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002463786853883929, + "loss": 1.6202, + "step": 10595 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002463692142422914, + "loss": 1.6453, + "step": 10596 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024635974244189613, + "loss": 1.6056, + "step": 10597 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024635026998727136, + "loss": 1.6014, + "step": 10598 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024634079687848144, + "loss": 1.5702, + "step": 10599 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002463313231155907, + "loss": 1.5687, + "step": 10600 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002463218486986634, + "loss": 1.6229, + "step": 10601 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002463123736277639, + "loss": 1.611, + "step": 10602 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002463028979029566, + "loss": 1.6946, + "step": 10603 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024629342152430566, + "loss": 1.6511, + "step": 10604 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002462839444918756, + "loss": 1.6539, + "step": 10605 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002462744668057306, + "loss": 1.6213, + "step": 10606 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024626498846593524, + "loss": 1.6162, + "step": 10607 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024625550947255363, + "loss": 1.6472, + "step": 10608 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024624602982565024, + "loss": 1.6182, + "step": 10609 + }, + { + "epoch": 0.83, + "learning_rate": 0.00024623654952528947, + "loss": 1.6376, + "step": 10610 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002462270685715356, + "loss": 1.6051, + "step": 10611 + }, + { + "epoch": 0.83, + "learning_rate": 0.0002462175869644531, + "loss": 1.6109, + "step": 10612 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024620810470410616, + "loss": 1.6034, + "step": 10613 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024619862179055935, + "loss": 1.5749, + "step": 10614 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024618913822387696, + "loss": 1.6334, + "step": 10615 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024617965400412344, + "loss": 1.6357, + "step": 10616 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024617016913136314, + "loss": 1.5843, + "step": 10617 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024616068360566046, + "loss": 1.5852, + "step": 10618 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002461511974270798, + "loss": 1.6438, + "step": 10619 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024614171059568555, + "loss": 1.6329, + "step": 10620 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024613222311154213, + "loss": 1.6375, + "step": 10621 + }, + { + "epoch": 0.84, + "learning_rate": 0.000246122734974714, + "loss": 1.6241, + "step": 10622 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024611324618526554, + "loss": 1.6383, + "step": 10623 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002461037567432612, + "loss": 1.619, + "step": 10624 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024609426664876533, + "loss": 1.6096, + "step": 10625 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024608477590184243, + "loss": 1.603, + "step": 10626 + }, + { + "epoch": 0.84, + "learning_rate": 0.000246075284502557, + "loss": 1.6982, + "step": 10627 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002460657924509733, + "loss": 1.6756, + "step": 10628 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024605629974715595, + "loss": 1.6809, + "step": 10629 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002460468063911693, + "loss": 1.6082, + "step": 10630 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024603731238307785, + "loss": 1.6366, + "step": 10631 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024602781772294606, + "loss": 1.6115, + "step": 10632 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002460183224108384, + "loss": 1.6051, + "step": 10633 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024600882644681927, + "loss": 1.6337, + "step": 10634 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002459993298309532, + "loss": 1.6, + "step": 10635 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002459898325633047, + "loss": 1.6575, + "step": 10636 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002459803346439382, + "loss": 1.5803, + "step": 10637 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002459708360729181, + "loss": 1.5759, + "step": 10638 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024596133685030904, + "loss": 1.5602, + "step": 10639 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002459518369761755, + "loss": 1.6136, + "step": 10640 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024594233645058194, + "loss": 1.6296, + "step": 10641 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024593283527359283, + "loss": 1.6157, + "step": 10642 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002459233334452727, + "loss": 1.6435, + "step": 10643 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002459138309656861, + "loss": 1.696, + "step": 10644 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002459043278348975, + "loss": 1.621, + "step": 10645 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002458948240529714, + "loss": 1.6032, + "step": 10646 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002458853196199724, + "loss": 1.652, + "step": 10647 + }, + { + "epoch": 0.84, + "learning_rate": 0.000245875814535965, + "loss": 1.6174, + "step": 10648 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002458663088010137, + "loss": 1.6717, + "step": 10649 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002458568024151831, + "loss": 1.608, + "step": 10650 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002458472953785377, + "loss": 1.6119, + "step": 10651 + }, + { + "epoch": 0.84, + "learning_rate": 0.000245837787691142, + "loss": 1.6885, + "step": 10652 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002458282793530607, + "loss": 1.5951, + "step": 10653 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024581877036435827, + "loss": 1.626, + "step": 10654 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024580926072509916, + "loss": 1.6319, + "step": 10655 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024579975043534814, + "loss": 1.6293, + "step": 10656 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024579023949516964, + "loss": 1.6328, + "step": 10657 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002457807279046283, + "loss": 1.6206, + "step": 10658 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002457712156637887, + "loss": 1.6346, + "step": 10659 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024576170277271534, + "loss": 1.6369, + "step": 10660 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024575218923147285, + "loss": 1.6512, + "step": 10661 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024574267504012587, + "loss": 1.5709, + "step": 10662 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024573316019873897, + "loss": 1.6029, + "step": 10663 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002457236447073767, + "loss": 1.6144, + "step": 10664 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024571412856610374, + "loss": 1.5998, + "step": 10665 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024570461177498464, + "loss": 1.6662, + "step": 10666 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002456950943340841, + "loss": 1.6148, + "step": 10667 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002456855762434666, + "loss": 1.6033, + "step": 10668 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024567605750319693, + "loss": 1.6293, + "step": 10669 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024566653811333955, + "loss": 1.6092, + "step": 10670 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002456570180739592, + "loss": 1.5749, + "step": 10671 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002456474973851205, + "loss": 1.632, + "step": 10672 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024563797604688805, + "loss": 1.6777, + "step": 10673 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024562845405932656, + "loss": 1.6087, + "step": 10674 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024561893142250056, + "loss": 1.5964, + "step": 10675 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024560940813647485, + "loss": 1.6184, + "step": 10676 + }, + { + "epoch": 0.84, + "learning_rate": 0.000245599884201314, + "loss": 1.5609, + "step": 10677 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002455903596170827, + "loss": 1.6143, + "step": 10678 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002455808343838456, + "loss": 1.6414, + "step": 10679 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002455713085016674, + "loss": 1.5834, + "step": 10680 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002455617819706127, + "loss": 1.5915, + "step": 10681 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002455522547907463, + "loss": 1.5851, + "step": 10682 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024554272696213276, + "loss": 1.6117, + "step": 10683 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002455331984848369, + "loss": 1.666, + "step": 10684 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002455236693589233, + "loss": 1.6239, + "step": 10685 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002455141395844567, + "loss": 1.6108, + "step": 10686 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002455046091615018, + "loss": 1.6311, + "step": 10687 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002454950780901233, + "loss": 1.6663, + "step": 10688 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024548554637038593, + "loss": 1.5973, + "step": 10689 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024547601400235446, + "loss": 1.6517, + "step": 10690 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024546648098609347, + "loss": 1.5831, + "step": 10691 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024545694732166774, + "loss": 1.6043, + "step": 10692 + }, + { + "epoch": 0.84, + "learning_rate": 0.000245447413009142, + "loss": 1.6285, + "step": 10693 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002454378780485811, + "loss": 1.5969, + "step": 10694 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002454283424400496, + "loss": 1.6412, + "step": 10695 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024541880618361234, + "loss": 1.5868, + "step": 10696 + }, + { + "epoch": 0.84, + "learning_rate": 0.000245409269279334, + "loss": 1.5944, + "step": 10697 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024539973172727945, + "loss": 1.5695, + "step": 10698 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002453901935275133, + "loss": 1.6491, + "step": 10699 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002453806546801004, + "loss": 1.5824, + "step": 10700 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024537111518510546, + "loss": 1.6178, + "step": 10701 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024536157504259333, + "loss": 1.6246, + "step": 10702 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024535203425262873, + "loss": 1.6019, + "step": 10703 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002453424928152764, + "loss": 1.6469, + "step": 10704 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024533295073060114, + "loss": 1.6462, + "step": 10705 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002453234079986678, + "loss": 1.5728, + "step": 10706 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002453138646195411, + "loss": 1.6356, + "step": 10707 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024530432059328587, + "loss": 1.6306, + "step": 10708 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002452947759199669, + "loss": 1.6125, + "step": 10709 + }, + { + "epoch": 0.84, + "learning_rate": 0.000245285230599649, + "loss": 1.6168, + "step": 10710 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024527568463239693, + "loss": 1.6708, + "step": 10711 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002452661380182756, + "loss": 1.6014, + "step": 10712 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002452565907573497, + "loss": 1.6564, + "step": 10713 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002452470428496841, + "loss": 1.6433, + "step": 10714 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024523749429534373, + "loss": 1.5943, + "step": 10715 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024522794509439325, + "loss": 1.6305, + "step": 10716 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002452183952468976, + "loss": 1.6691, + "step": 10717 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002452088447529216, + "loss": 1.6348, + "step": 10718 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002451992936125301, + "loss": 1.6678, + "step": 10719 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002451897418257879, + "loss": 1.5795, + "step": 10720 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002451801893927599, + "loss": 1.6431, + "step": 10721 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024517063631351095, + "loss": 1.6643, + "step": 10722 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002451610825881059, + "loss": 1.6607, + "step": 10723 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002451515282166096, + "loss": 1.5883, + "step": 10724 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002451419731990869, + "loss": 1.6269, + "step": 10725 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024513241753560273, + "loss": 1.59, + "step": 10726 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024512286122622197, + "loss": 1.5918, + "step": 10727 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002451133042710094, + "loss": 1.6047, + "step": 10728 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002451037466700301, + "loss": 1.6223, + "step": 10729 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024509418842334876, + "loss": 1.6913, + "step": 10730 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024508462953103035, + "loss": 1.6253, + "step": 10731 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002450750699931398, + "loss": 1.6128, + "step": 10732 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024506550980974204, + "loss": 1.6036, + "step": 10733 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002450559489809019, + "loss": 1.5934, + "step": 10734 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002450463875066843, + "loss": 1.5938, + "step": 10735 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024503682538715415, + "loss": 1.5813, + "step": 10736 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024502726262237647, + "loss": 1.63, + "step": 10737 + }, + { + "epoch": 0.84, + "learning_rate": 0.0002450176992124161, + "loss": 1.5974, + "step": 10738 + }, + { + "epoch": 0.84, + "learning_rate": 0.00024500813515733797, + "loss": 1.6253, + "step": 10739 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024499857045720704, + "loss": 1.6165, + "step": 10740 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002449890051120882, + "loss": 1.6921, + "step": 10741 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002449794391220465, + "loss": 1.6072, + "step": 10742 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024496987248714676, + "loss": 1.6374, + "step": 10743 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024496030520745405, + "loss": 1.6548, + "step": 10744 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024495073728303325, + "loss": 1.6236, + "step": 10745 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002449411687139493, + "loss": 1.6049, + "step": 10746 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002449315995002673, + "loss": 1.6494, + "step": 10747 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024492202964205206, + "loss": 1.6144, + "step": 10748 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024491245913936863, + "loss": 1.5757, + "step": 10749 + }, + { + "epoch": 0.85, + "learning_rate": 0.000244902887992282, + "loss": 1.6518, + "step": 10750 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024489331620085715, + "loss": 1.6279, + "step": 10751 + }, + { + "epoch": 0.85, + "learning_rate": 0.000244883743765159, + "loss": 1.6818, + "step": 10752 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002448741706852526, + "loss": 1.6197, + "step": 10753 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024486459696120293, + "loss": 1.5947, + "step": 10754 + }, + { + "epoch": 0.85, + "learning_rate": 0.000244855022593075, + "loss": 1.6167, + "step": 10755 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002448454475809339, + "loss": 1.6389, + "step": 10756 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024483587192484444, + "loss": 1.573, + "step": 10757 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024482629562487177, + "loss": 1.5916, + "step": 10758 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002448167186810809, + "loss": 1.5879, + "step": 10759 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024480714109353685, + "loss": 1.5431, + "step": 10760 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002447975628623046, + "loss": 1.6437, + "step": 10761 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002447879839874492, + "loss": 1.6539, + "step": 10762 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002447784044690357, + "loss": 1.6104, + "step": 10763 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002447688243071292, + "loss": 1.6271, + "step": 10764 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002447592435017946, + "loss": 1.6113, + "step": 10765 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002447496620530971, + "loss": 1.5952, + "step": 10766 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002447400799611016, + "loss": 1.6723, + "step": 10767 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024473049722587335, + "loss": 1.6803, + "step": 10768 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002447209138474772, + "loss": 1.5897, + "step": 10769 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002447113298259783, + "loss": 1.7135, + "step": 10770 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024470174516144183, + "loss": 1.6495, + "step": 10771 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024469215985393274, + "loss": 1.6001, + "step": 10772 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024468257390351615, + "loss": 1.6298, + "step": 10773 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024467298731025713, + "loss": 1.6449, + "step": 10774 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002446634000742207, + "loss": 1.6511, + "step": 10775 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002446538121954721, + "loss": 1.6044, + "step": 10776 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002446442236740763, + "loss": 1.6014, + "step": 10777 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024463463451009846, + "loss": 1.636, + "step": 10778 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002446250447036037, + "loss": 1.6081, + "step": 10779 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024461545425465717, + "loss": 1.5777, + "step": 10780 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002446058631633238, + "loss": 1.6303, + "step": 10781 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024459627142966886, + "loss": 1.5998, + "step": 10782 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002445866790537575, + "loss": 1.6021, + "step": 10783 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002445770860356547, + "loss": 1.5616, + "step": 10784 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024456749237542576, + "loss": 1.6641, + "step": 10785 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024455789807313567, + "loss": 1.5882, + "step": 10786 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024454830312884963, + "loss": 1.656, + "step": 10787 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002445387075426328, + "loss": 1.6259, + "step": 10788 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024452911131455035, + "loss": 1.6744, + "step": 10789 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002445195144446674, + "loss": 1.6455, + "step": 10790 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024450991693304903, + "loss": 1.5925, + "step": 10791 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024450031877976054, + "loss": 1.5766, + "step": 10792 + }, + { + "epoch": 0.85, + "learning_rate": 0.000244490719984867, + "loss": 1.6776, + "step": 10793 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024448112054843365, + "loss": 1.6405, + "step": 10794 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024447152047052563, + "loss": 1.6261, + "step": 10795 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024446191975120815, + "loss": 1.6678, + "step": 10796 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024445231839054633, + "loss": 1.6168, + "step": 10797 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002444427163886054, + "loss": 1.6218, + "step": 10798 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002444331137454505, + "loss": 1.6053, + "step": 10799 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002444235104611469, + "loss": 1.5836, + "step": 10800 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002444139065357598, + "loss": 1.6298, + "step": 10801 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024440430196935435, + "loss": 1.5817, + "step": 10802 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024439469676199575, + "loss": 1.6021, + "step": 10803 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002443850909137493, + "loss": 1.6549, + "step": 10804 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024437548442468013, + "loss": 1.6498, + "step": 10805 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002443658772948536, + "loss": 1.628, + "step": 10806 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024435626952433475, + "loss": 1.584, + "step": 10807 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002443466611131889, + "loss": 1.6582, + "step": 10808 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002443370520614813, + "loss": 1.5935, + "step": 10809 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002443274423692772, + "loss": 1.5968, + "step": 10810 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024431783203664176, + "loss": 1.5911, + "step": 10811 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002443082210636403, + "loss": 1.5845, + "step": 10812 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002442986094503381, + "loss": 1.6288, + "step": 10813 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002442889971968004, + "loss": 1.6597, + "step": 10814 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002442793843030924, + "loss": 1.5725, + "step": 10815 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024426977076927943, + "loss": 1.6095, + "step": 10816 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024426015659542667, + "loss": 1.6436, + "step": 10817 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024425054178159956, + "loss": 1.6499, + "step": 10818 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002442409263278632, + "loss": 1.6414, + "step": 10819 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024423131023428306, + "loss": 1.5894, + "step": 10820 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002442216935009243, + "loss": 1.6073, + "step": 10821 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002442120761278522, + "loss": 1.5992, + "step": 10822 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002442024581151321, + "loss": 1.591, + "step": 10823 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002441928394628293, + "loss": 1.6298, + "step": 10824 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024418322017100906, + "loss": 1.6241, + "step": 10825 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024417360023973675, + "loss": 1.5991, + "step": 10826 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024416397966907767, + "loss": 1.6237, + "step": 10827 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024415435845909716, + "loss": 1.6533, + "step": 10828 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024414473660986047, + "loss": 1.6058, + "step": 10829 + }, + { + "epoch": 0.85, + "learning_rate": 0.000244135114121433, + "loss": 1.6555, + "step": 10830 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024412549099388006, + "loss": 1.641, + "step": 10831 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024411586722726696, + "loss": 1.6234, + "step": 10832 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024410624282165903, + "loss": 1.6187, + "step": 10833 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002440966177771217, + "loss": 1.6239, + "step": 10834 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002440869920937202, + "loss": 1.6142, + "step": 10835 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024407736577152002, + "loss": 1.6712, + "step": 10836 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024406773881058643, + "loss": 1.6387, + "step": 10837 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024405811121098474, + "loss": 1.5795, + "step": 10838 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024404848297278044, + "loss": 1.6307, + "step": 10839 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024403885409603882, + "loss": 1.6143, + "step": 10840 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024402922458082528, + "loss": 1.5821, + "step": 10841 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002440195944272052, + "loss": 1.6382, + "step": 10842 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024400996363524395, + "loss": 1.587, + "step": 10843 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024400033220500693, + "loss": 1.62, + "step": 10844 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024399070013655954, + "loss": 1.5773, + "step": 10845 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024398106742996715, + "loss": 1.5738, + "step": 10846 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024397143408529516, + "loss": 1.5982, + "step": 10847 + }, + { + "epoch": 0.85, + "learning_rate": 0.000243961800102609, + "loss": 1.6033, + "step": 10848 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002439521654819741, + "loss": 1.6069, + "step": 10849 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024394253022345578, + "loss": 1.6098, + "step": 10850 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002439328943271196, + "loss": 1.6557, + "step": 10851 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024392325779303085, + "loss": 1.5736, + "step": 10852 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024391362062125502, + "loss": 1.5942, + "step": 10853 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024390398281185754, + "loss": 1.6391, + "step": 10854 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024389434436490384, + "loss": 1.5838, + "step": 10855 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024388470528045937, + "loss": 1.6247, + "step": 10856 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002438750655585895, + "loss": 1.6158, + "step": 10857 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024386542519935978, + "loss": 1.6416, + "step": 10858 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024385578420283563, + "loss": 1.6354, + "step": 10859 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024384614256908253, + "loss": 1.6486, + "step": 10860 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024383650029816584, + "loss": 1.5926, + "step": 10861 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024382685739015117, + "loss": 1.6439, + "step": 10862 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024381721384510383, + "loss": 1.6247, + "step": 10863 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024380756966308945, + "loss": 1.6154, + "step": 10864 + }, + { + "epoch": 0.85, + "learning_rate": 0.0002437979248441734, + "loss": 1.5977, + "step": 10865 + }, + { + "epoch": 0.85, + "learning_rate": 0.00024378827938842122, + "loss": 1.6247, + "step": 10866 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024377863329589836, + "loss": 1.558, + "step": 10867 + }, + { + "epoch": 0.86, + "learning_rate": 0.0002437689865666704, + "loss": 1.5943, + "step": 10868 + }, + { + "epoch": 0.86, + "learning_rate": 0.0002437593392008027, + "loss": 1.6325, + "step": 10869 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024374969119836086, + "loss": 1.6148, + "step": 10870 + }, + { + "epoch": 0.86, + "learning_rate": 0.0002437400425594103, + "loss": 1.6162, + "step": 10871 + }, + { + "epoch": 0.86, + "learning_rate": 0.0002437303932840166, + "loss": 1.5701, + "step": 10872 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024372074337224527, + "loss": 1.6461, + "step": 10873 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024371109282416182, + "loss": 1.6232, + "step": 10874 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024370144163983175, + "loss": 1.5422, + "step": 10875 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024369178981932063, + "loss": 1.6549, + "step": 10876 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024368213736269395, + "loss": 1.6033, + "step": 10877 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024367248427001722, + "loss": 1.6638, + "step": 10878 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024366283054135605, + "loss": 1.636, + "step": 10879 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024365317617677592, + "loss": 1.6129, + "step": 10880 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024364352117634244, + "loss": 1.6716, + "step": 10881 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024363386554012112, + "loss": 1.661, + "step": 10882 + }, + { + "epoch": 0.86, + "learning_rate": 0.0002436242092681775, + "loss": 1.6482, + "step": 10883 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024361455236057716, + "loss": 1.6345, + "step": 10884 + }, + { + "epoch": 0.86, + "learning_rate": 0.0002436048948173857, + "loss": 1.6189, + "step": 10885 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024359523663866866, + "loss": 1.6153, + "step": 10886 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024358557782449162, + "loss": 1.5983, + "step": 10887 + }, + { + "epoch": 0.86, + "learning_rate": 0.0002435759183749201, + "loss": 1.6228, + "step": 10888 + }, + { + "epoch": 0.86, + "learning_rate": 0.0002435662582900198, + "loss": 1.6621, + "step": 10889 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024355659756985617, + "loss": 1.6146, + "step": 10890 + }, + { + "epoch": 0.86, + "learning_rate": 0.0002435469362144949, + "loss": 1.6192, + "step": 10891 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024353727422400158, + "loss": 1.5741, + "step": 10892 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024352761159844181, + "loss": 1.567, + "step": 10893 + }, + { + "epoch": 0.86, + "learning_rate": 0.0002435179483378811, + "loss": 1.6012, + "step": 10894 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024350828444238517, + "loss": 1.5872, + "step": 10895 + }, + { + "epoch": 0.86, + "learning_rate": 0.0002434986199120196, + "loss": 1.6136, + "step": 10896 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024348895474684995, + "loss": 1.6398, + "step": 10897 + }, + { + "epoch": 0.86, + "learning_rate": 0.0002434792889469419, + "loss": 1.58, + "step": 10898 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024346962251236109, + "loss": 1.69, + "step": 10899 + }, + { + "epoch": 0.86, + "learning_rate": 0.0002434599554431731, + "loss": 1.6065, + "step": 10900 + }, + { + "epoch": 0.86, + "learning_rate": 0.0002434502877394436, + "loss": 1.5887, + "step": 10901 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024344061940123824, + "loss": 1.6324, + "step": 10902 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024343095042862262, + "loss": 1.6537, + "step": 10903 + }, + { + "epoch": 0.86, + "learning_rate": 0.0002434212808216624, + "loss": 1.6594, + "step": 10904 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024341161058042323, + "loss": 1.6473, + "step": 10905 + }, + { + "epoch": 0.86, + "learning_rate": 0.0002434019397049708, + "loss": 1.5956, + "step": 10906 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024339226819537074, + "loss": 1.5811, + "step": 10907 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024338259605168871, + "loss": 1.5784, + "step": 10908 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024337292327399036, + "loss": 1.6222, + "step": 10909 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024336324986234142, + "loss": 1.6289, + "step": 10910 + }, + { + "epoch": 0.86, + "learning_rate": 0.0002433535758168075, + "loss": 1.5911, + "step": 10911 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024334390113745437, + "loss": 1.6125, + "step": 10912 + }, + { + "epoch": 0.86, + "learning_rate": 0.0002433342258243476, + "loss": 1.633, + "step": 10913 + }, + { + "epoch": 0.86, + "learning_rate": 0.000243324549877553, + "loss": 1.6574, + "step": 10914 + }, + { + "epoch": 0.86, + "learning_rate": 0.0002433148732971362, + "loss": 1.6109, + "step": 10915 + }, + { + "epoch": 0.86, + "learning_rate": 0.0002433051960831629, + "loss": 1.596, + "step": 10916 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024329551823569875, + "loss": 1.6062, + "step": 10917 + }, + { + "epoch": 0.86, + "learning_rate": 0.0002432858397548096, + "loss": 1.648, + "step": 10918 + }, + { + "epoch": 0.86, + "learning_rate": 0.000243276160640561, + "loss": 1.6647, + "step": 10919 + }, + { + "epoch": 0.86, + "learning_rate": 0.0002432664808930188, + "loss": 1.6204, + "step": 10920 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024325680051224866, + "loss": 1.6211, + "step": 10921 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024324711949831628, + "loss": 1.6118, + "step": 10922 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024323743785128744, + "loss": 1.6318, + "step": 10923 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024322775557122787, + "loss": 1.624, + "step": 10924 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024321807265820325, + "loss": 1.6374, + "step": 10925 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024320838911227936, + "loss": 1.6134, + "step": 10926 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024319870493352195, + "loss": 1.5472, + "step": 10927 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024318902012199678, + "loss": 1.622, + "step": 10928 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024317933467776954, + "loss": 1.585, + "step": 10929 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024316964860090609, + "loss": 1.5608, + "step": 10930 + }, + { + "epoch": 0.86, + "learning_rate": 0.0002431599618914721, + "loss": 1.5804, + "step": 10931 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024315027454953345, + "loss": 1.6444, + "step": 10932 + }, + { + "epoch": 0.86, + "learning_rate": 0.0002431405865751558, + "loss": 1.6544, + "step": 10933 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024313089796840494, + "loss": 1.598, + "step": 10934 + }, + { + "epoch": 0.86, + "learning_rate": 0.0002431212087293467, + "loss": 1.6491, + "step": 10935 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024311151885804684, + "loss": 1.6483, + "step": 10936 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024310182835457112, + "loss": 1.5891, + "step": 10937 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024309213721898545, + "loss": 1.6446, + "step": 10938 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024308244545135548, + "loss": 1.6153, + "step": 10939 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024307275305174707, + "loss": 1.5836, + "step": 10940 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024306306002022603, + "loss": 1.5294, + "step": 10941 + }, + { + "epoch": 0.86, + "learning_rate": 0.0002430533663568582, + "loss": 1.5866, + "step": 10942 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024304367206170929, + "loss": 1.6164, + "step": 10943 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024303397713484526, + "loss": 1.6086, + "step": 10944 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024302428157633183, + "loss": 1.6246, + "step": 10945 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024301458538623488, + "loss": 1.6202, + "step": 10946 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024300488856462025, + "loss": 1.5638, + "step": 10947 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024299519111155372, + "loss": 1.6145, + "step": 10948 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024298549302710117, + "loss": 1.6074, + "step": 10949 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024297579431132842, + "loss": 1.5933, + "step": 10950 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024296609496430132, + "loss": 1.5895, + "step": 10951 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024295639498608573, + "loss": 1.6108, + "step": 10952 + }, + { + "epoch": 0.86, + "learning_rate": 0.0002429466943767476, + "loss": 1.5989, + "step": 10953 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024293699313635266, + "loss": 1.6189, + "step": 10954 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024292729126496683, + "loss": 1.6355, + "step": 10955 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024291758876265594, + "loss": 1.6195, + "step": 10956 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024290788562948592, + "loss": 1.5841, + "step": 10957 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024289818186552263, + "loss": 1.6679, + "step": 10958 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024288847747083197, + "loss": 1.6538, + "step": 10959 + }, + { + "epoch": 0.86, + "learning_rate": 0.0002428787724454798, + "loss": 1.5647, + "step": 10960 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024286906678953202, + "loss": 1.6234, + "step": 10961 + }, + { + "epoch": 0.86, + "learning_rate": 0.0002428593605030545, + "loss": 1.5553, + "step": 10962 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024284965358611316, + "loss": 1.5744, + "step": 10963 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024283994603877397, + "loss": 1.6459, + "step": 10964 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024283023786110273, + "loss": 1.5688, + "step": 10965 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024282052905316538, + "loss": 1.6502, + "step": 10966 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024281081961502793, + "loss": 1.5617, + "step": 10967 + }, + { + "epoch": 0.86, + "learning_rate": 0.0002428011095467562, + "loss": 1.6131, + "step": 10968 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024279139884841611, + "loss": 1.6286, + "step": 10969 + }, + { + "epoch": 0.86, + "learning_rate": 0.0002427816875200737, + "loss": 1.5963, + "step": 10970 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024277197556179478, + "loss": 1.5818, + "step": 10971 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024276226297364537, + "loss": 1.5591, + "step": 10972 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024275254975569138, + "loss": 1.6313, + "step": 10973 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024274283590799872, + "loss": 1.6386, + "step": 10974 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024273312143063342, + "loss": 1.6174, + "step": 10975 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024272340632366143, + "loss": 1.6124, + "step": 10976 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024271369058714864, + "loss": 1.5646, + "step": 10977 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024270397422116106, + "loss": 1.5862, + "step": 10978 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024269425722576467, + "loss": 1.6312, + "step": 10979 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024268453960102538, + "loss": 1.588, + "step": 10980 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024267482134700927, + "loss": 1.5916, + "step": 10981 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024266510246378223, + "loss": 1.5888, + "step": 10982 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024265538295141032, + "loss": 1.5994, + "step": 10983 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024264566280995944, + "loss": 1.6544, + "step": 10984 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024263594203949567, + "loss": 1.5419, + "step": 10985 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024262622064008494, + "loss": 1.6299, + "step": 10986 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024261649861179334, + "loss": 1.6187, + "step": 10987 + }, + { + "epoch": 0.86, + "learning_rate": 0.0002426067759546868, + "loss": 1.5761, + "step": 10988 + }, + { + "epoch": 0.86, + "learning_rate": 0.0002425970526688314, + "loss": 1.5964, + "step": 10989 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024258732875429302, + "loss": 1.5997, + "step": 10990 + }, + { + "epoch": 0.86, + "learning_rate": 0.0002425776042111378, + "loss": 1.649, + "step": 10991 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024256787903943172, + "loss": 1.6075, + "step": 10992 + }, + { + "epoch": 0.86, + "learning_rate": 0.00024255815323924088, + "loss": 1.5818, + "step": 10993 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024254842681063128, + "loss": 1.5734, + "step": 10994 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024253869975366884, + "loss": 1.6722, + "step": 10995 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024252897206841976, + "loss": 1.5994, + "step": 10996 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024251924375495, + "loss": 1.6722, + "step": 10997 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024250951481332561, + "loss": 1.612, + "step": 10998 + }, + { + "epoch": 0.87, + "learning_rate": 0.0002424997852436127, + "loss": 1.6224, + "step": 10999 + }, + { + "epoch": 0.87, + "learning_rate": 0.0002424900550458773, + "loss": 1.6593, + "step": 11000 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024248032422018547, + "loss": 1.5982, + "step": 11001 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024247059276660325, + "loss": 1.6075, + "step": 11002 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024246086068519673, + "loss": 1.6609, + "step": 11003 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024245112797603203, + "loss": 1.6728, + "step": 11004 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024244139463917513, + "loss": 1.5893, + "step": 11005 + }, + { + "epoch": 0.87, + "learning_rate": 0.0002424316606746922, + "loss": 1.62, + "step": 11006 + }, + { + "epoch": 0.87, + "learning_rate": 0.0002424219260826493, + "loss": 1.6114, + "step": 11007 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024241219086311251, + "loss": 1.6555, + "step": 11008 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024240245501614796, + "loss": 1.6058, + "step": 11009 + }, + { + "epoch": 0.87, + "learning_rate": 0.0002423927185418218, + "loss": 1.6214, + "step": 11010 + }, + { + "epoch": 0.87, + "learning_rate": 0.0002423829814402, + "loss": 1.6611, + "step": 11011 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024237324371134873, + "loss": 1.6162, + "step": 11012 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024236350535533407, + "loss": 1.6297, + "step": 11013 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024235376637222222, + "loss": 1.6052, + "step": 11014 + }, + { + "epoch": 0.87, + "learning_rate": 0.0002423440267620793, + "loss": 1.6225, + "step": 11015 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024233428652497137, + "loss": 1.6672, + "step": 11016 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024232454566096458, + "loss": 1.6585, + "step": 11017 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024231480417012511, + "loss": 1.5782, + "step": 11018 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024230506205251903, + "loss": 1.6485, + "step": 11019 + }, + { + "epoch": 0.87, + "learning_rate": 0.0002422953193082125, + "loss": 1.5799, + "step": 11020 + }, + { + "epoch": 0.87, + "learning_rate": 0.0002422855759372717, + "loss": 1.6171, + "step": 11021 + }, + { + "epoch": 0.87, + "learning_rate": 0.0002422758319397628, + "loss": 1.608, + "step": 11022 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024226608731575187, + "loss": 1.6681, + "step": 11023 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024225634206530514, + "loss": 1.569, + "step": 11024 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024224659618848877, + "loss": 1.6273, + "step": 11025 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024223684968536892, + "loss": 1.6502, + "step": 11026 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024222710255601178, + "loss": 1.6239, + "step": 11027 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024221735480048348, + "loss": 1.5972, + "step": 11028 + }, + { + "epoch": 0.87, + "learning_rate": 0.0002422076064188502, + "loss": 1.6249, + "step": 11029 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024219785741117823, + "loss": 1.6236, + "step": 11030 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024218810777753365, + "loss": 1.6115, + "step": 11031 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024217835751798268, + "loss": 1.6321, + "step": 11032 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024216860663259153, + "loss": 1.6355, + "step": 11033 + }, + { + "epoch": 0.87, + "learning_rate": 0.0002421588551214264, + "loss": 1.6416, + "step": 11034 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024214910298455354, + "loss": 1.6129, + "step": 11035 + }, + { + "epoch": 0.87, + "learning_rate": 0.0002421393502220391, + "loss": 1.6787, + "step": 11036 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024212959683394929, + "loss": 1.5931, + "step": 11037 + }, + { + "epoch": 0.87, + "learning_rate": 0.0002421198428203504, + "loss": 1.6508, + "step": 11038 + }, + { + "epoch": 0.87, + "learning_rate": 0.0002421100881813086, + "loss": 1.637, + "step": 11039 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024210033291689016, + "loss": 1.5627, + "step": 11040 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024209057702716125, + "loss": 1.6017, + "step": 11041 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024208082051218815, + "loss": 1.6246, + "step": 11042 + }, + { + "epoch": 0.87, + "learning_rate": 0.0002420710633720371, + "loss": 1.5897, + "step": 11043 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024206130560677433, + "loss": 1.6566, + "step": 11044 + }, + { + "epoch": 0.87, + "learning_rate": 0.0002420515472164661, + "loss": 1.5771, + "step": 11045 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024204178820117864, + "loss": 1.6203, + "step": 11046 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024203202856097822, + "loss": 1.6005, + "step": 11047 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024202226829593117, + "loss": 1.636, + "step": 11048 + }, + { + "epoch": 0.87, + "learning_rate": 0.0002420125074061037, + "loss": 1.5595, + "step": 11049 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024200274589156206, + "loss": 1.611, + "step": 11050 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024199298375237254, + "loss": 1.6096, + "step": 11051 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024198322098860142, + "loss": 1.6202, + "step": 11052 + }, + { + "epoch": 0.87, + "learning_rate": 0.000241973457600315, + "loss": 1.6055, + "step": 11053 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024196369358757956, + "loss": 1.5777, + "step": 11054 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024195392895046141, + "loss": 1.6325, + "step": 11055 + }, + { + "epoch": 0.87, + "learning_rate": 0.0002419441636890268, + "loss": 1.5823, + "step": 11056 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024193439780334207, + "loss": 1.6212, + "step": 11057 + }, + { + "epoch": 0.87, + "learning_rate": 0.0002419246312934735, + "loss": 1.6108, + "step": 11058 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024191486415948743, + "loss": 1.5527, + "step": 11059 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024190509640145013, + "loss": 1.633, + "step": 11060 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024189532801942795, + "loss": 1.6111, + "step": 11061 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024188555901348717, + "loss": 1.6389, + "step": 11062 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024187578938369422, + "loss": 1.5961, + "step": 11063 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024186601913011533, + "loss": 1.6371, + "step": 11064 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024185624825281686, + "loss": 1.6363, + "step": 11065 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024184647675186521, + "loss": 1.6277, + "step": 11066 + }, + { + "epoch": 0.87, + "learning_rate": 0.0002418367046273266, + "loss": 1.6119, + "step": 11067 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024182693187926746, + "loss": 1.5937, + "step": 11068 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024181715850775417, + "loss": 1.616, + "step": 11069 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024180738451285295, + "loss": 1.6139, + "step": 11070 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024179760989463035, + "loss": 1.6296, + "step": 11071 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024178783465315256, + "loss": 1.6283, + "step": 11072 + }, + { + "epoch": 0.87, + "learning_rate": 0.0002417780587884861, + "loss": 1.5892, + "step": 11073 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024176828230069723, + "loss": 1.5874, + "step": 11074 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024175850518985234, + "loss": 1.612, + "step": 11075 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024174872745601789, + "loss": 1.5765, + "step": 11076 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024173894909926017, + "loss": 1.6183, + "step": 11077 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024172917011964563, + "loss": 1.6212, + "step": 11078 + }, + { + "epoch": 0.87, + "learning_rate": 0.0002417193905172406, + "loss": 1.669, + "step": 11079 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024170961029211158, + "loss": 1.6459, + "step": 11080 + }, + { + "epoch": 0.87, + "learning_rate": 0.0002416998294443249, + "loss": 1.634, + "step": 11081 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024169004797394702, + "loss": 1.658, + "step": 11082 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024168026588104426, + "loss": 1.6377, + "step": 11083 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024167048316568306, + "loss": 1.6101, + "step": 11084 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024166069982792994, + "loss": 1.5828, + "step": 11085 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024165091586785122, + "loss": 1.6031, + "step": 11086 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024164113128551334, + "loss": 1.5942, + "step": 11087 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024163134608098276, + "loss": 1.6409, + "step": 11088 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024162156025432595, + "loss": 1.629, + "step": 11089 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024161177380560927, + "loss": 1.6838, + "step": 11090 + }, + { + "epoch": 0.87, + "learning_rate": 0.0002416019867348992, + "loss": 1.6122, + "step": 11091 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024159219904226216, + "loss": 1.6247, + "step": 11092 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024158241072776468, + "loss": 1.6191, + "step": 11093 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024157262179147314, + "loss": 1.6421, + "step": 11094 + }, + { + "epoch": 0.87, + "learning_rate": 0.0002415628322334541, + "loss": 1.6294, + "step": 11095 + }, + { + "epoch": 0.87, + "learning_rate": 0.0002415530420537739, + "loss": 1.6342, + "step": 11096 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024154325125249905, + "loss": 1.5836, + "step": 11097 + }, + { + "epoch": 0.87, + "learning_rate": 0.0002415334598296961, + "loss": 1.5217, + "step": 11098 + }, + { + "epoch": 0.87, + "learning_rate": 0.0002415236677854314, + "loss": 1.5885, + "step": 11099 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024151387511977157, + "loss": 1.6705, + "step": 11100 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024150408183278298, + "loss": 1.6544, + "step": 11101 + }, + { + "epoch": 0.87, + "learning_rate": 0.0002414942879245322, + "loss": 1.5796, + "step": 11102 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024148449339508565, + "loss": 1.6512, + "step": 11103 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024147469824450994, + "loss": 1.5832, + "step": 11104 + }, + { + "epoch": 0.87, + "learning_rate": 0.0002414649024728715, + "loss": 1.5627, + "step": 11105 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024145510608023678, + "loss": 1.6442, + "step": 11106 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024144530906667245, + "loss": 1.5958, + "step": 11107 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024143551143224486, + "loss": 1.6585, + "step": 11108 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024142571317702064, + "loss": 1.6667, + "step": 11109 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024141591430106626, + "loss": 1.5954, + "step": 11110 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024140611480444828, + "loss": 1.5957, + "step": 11111 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024139631468723325, + "loss": 1.5929, + "step": 11112 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024138651394948766, + "loss": 1.5659, + "step": 11113 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024137671259127807, + "loss": 1.6026, + "step": 11114 + }, + { + "epoch": 0.87, + "learning_rate": 0.000241366910612671, + "loss": 1.637, + "step": 11115 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024135710801373304, + "loss": 1.6419, + "step": 11116 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024134730479453078, + "loss": 1.6255, + "step": 11117 + }, + { + "epoch": 0.87, + "learning_rate": 0.00024133750095513067, + "loss": 1.6021, + "step": 11118 + }, + { + "epoch": 0.87, + "learning_rate": 0.0002413276964955994, + "loss": 1.6005, + "step": 11119 + }, + { + "epoch": 0.87, + "learning_rate": 0.0002413178914160034, + "loss": 1.609, + "step": 11120 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024130808571640934, + "loss": 1.6062, + "step": 11121 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024129827939688375, + "loss": 1.6143, + "step": 11122 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024128847245749322, + "loss": 1.5732, + "step": 11123 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024127866489830437, + "loss": 1.5496, + "step": 11124 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024126885671938377, + "loss": 1.6169, + "step": 11125 + }, + { + "epoch": 0.88, + "learning_rate": 0.000241259047920798, + "loss": 1.6087, + "step": 11126 + }, + { + "epoch": 0.88, + "learning_rate": 0.0002412492385026136, + "loss": 1.6081, + "step": 11127 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024123942846489727, + "loss": 1.5741, + "step": 11128 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024122961780771558, + "loss": 1.5678, + "step": 11129 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024121980653113507, + "loss": 1.6017, + "step": 11130 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024120999463522242, + "loss": 1.6645, + "step": 11131 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024120018212004431, + "loss": 1.6178, + "step": 11132 + }, + { + "epoch": 0.88, + "learning_rate": 0.0002411903689856672, + "loss": 1.6119, + "step": 11133 + }, + { + "epoch": 0.88, + "learning_rate": 0.0002411805552321579, + "loss": 1.5741, + "step": 11134 + }, + { + "epoch": 0.88, + "learning_rate": 0.0002411707408595829, + "loss": 1.574, + "step": 11135 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024116092586800892, + "loss": 1.6379, + "step": 11136 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024115111025750253, + "loss": 1.5832, + "step": 11137 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024114129402813038, + "loss": 1.6383, + "step": 11138 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024113147717995915, + "loss": 1.6275, + "step": 11139 + }, + { + "epoch": 0.88, + "learning_rate": 0.0002411216597130555, + "loss": 1.6401, + "step": 11140 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024111184162748604, + "loss": 1.6499, + "step": 11141 + }, + { + "epoch": 0.88, + "learning_rate": 0.0002411020229233175, + "loss": 1.5724, + "step": 11142 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024109220360061644, + "loss": 1.5918, + "step": 11143 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024108238365944964, + "loss": 1.5522, + "step": 11144 + }, + { + "epoch": 0.88, + "learning_rate": 0.0002410725630998837, + "loss": 1.5375, + "step": 11145 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024106274192198533, + "loss": 1.6458, + "step": 11146 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024105292012582117, + "loss": 1.5791, + "step": 11147 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024104309771145793, + "loss": 1.5612, + "step": 11148 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024103327467896228, + "loss": 1.6115, + "step": 11149 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024102345102840095, + "loss": 1.6747, + "step": 11150 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024101362675984066, + "loss": 1.6345, + "step": 11151 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024100380187334802, + "loss": 1.5654, + "step": 11152 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024099397636898978, + "loss": 1.6005, + "step": 11153 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024098415024683268, + "loss": 1.5749, + "step": 11154 + }, + { + "epoch": 0.88, + "learning_rate": 0.0002409743235069434, + "loss": 1.5834, + "step": 11155 + }, + { + "epoch": 0.88, + "learning_rate": 0.0002409644961493887, + "loss": 1.6048, + "step": 11156 + }, + { + "epoch": 0.88, + "learning_rate": 0.0002409546681742352, + "loss": 1.6022, + "step": 11157 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024094483958154973, + "loss": 1.6187, + "step": 11158 + }, + { + "epoch": 0.88, + "learning_rate": 0.000240935010371399, + "loss": 1.5612, + "step": 11159 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024092518054384972, + "loss": 1.577, + "step": 11160 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024091535009896866, + "loss": 1.6369, + "step": 11161 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024090551903682253, + "loss": 1.5824, + "step": 11162 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024089568735747807, + "loss": 1.6228, + "step": 11163 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024088585506100207, + "loss": 1.6131, + "step": 11164 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024087602214746128, + "loss": 1.634, + "step": 11165 + }, + { + "epoch": 0.88, + "learning_rate": 0.0002408661886169224, + "loss": 1.6416, + "step": 11166 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024085635446945234, + "loss": 1.6045, + "step": 11167 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024084651970511772, + "loss": 1.6165, + "step": 11168 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024083668432398536, + "loss": 1.5882, + "step": 11169 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024082684832612202, + "loss": 1.6203, + "step": 11170 + }, + { + "epoch": 0.88, + "learning_rate": 0.0002408170117115945, + "loss": 1.6181, + "step": 11171 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024080717448046962, + "loss": 1.6201, + "step": 11172 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024079733663281413, + "loss": 1.6258, + "step": 11173 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024078749816869484, + "loss": 1.6196, + "step": 11174 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024077765908817853, + "loss": 1.6341, + "step": 11175 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024076781939133201, + "loss": 1.6723, + "step": 11176 + }, + { + "epoch": 0.88, + "learning_rate": 0.0002407579790782221, + "loss": 1.6355, + "step": 11177 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024074813814891556, + "loss": 1.6496, + "step": 11178 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024073829660347927, + "loss": 1.6015, + "step": 11179 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024072845444198, + "loss": 1.6202, + "step": 11180 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024071861166448464, + "loss": 1.6076, + "step": 11181 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024070876827105987, + "loss": 1.6017, + "step": 11182 + }, + { + "epoch": 0.88, + "learning_rate": 0.0002406989242617727, + "loss": 1.5539, + "step": 11183 + }, + { + "epoch": 0.88, + "learning_rate": 0.0002406890796366899, + "loss": 1.5802, + "step": 11184 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024067923439587824, + "loss": 1.6066, + "step": 11185 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024066938853940464, + "loss": 1.6228, + "step": 11186 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024065954206733592, + "loss": 1.5727, + "step": 11187 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024064969497973894, + "loss": 1.6016, + "step": 11188 + }, + { + "epoch": 0.88, + "learning_rate": 0.0002406398472766806, + "loss": 1.6232, + "step": 11189 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024062999895822765, + "loss": 1.5939, + "step": 11190 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024062015002444709, + "loss": 1.6172, + "step": 11191 + }, + { + "epoch": 0.88, + "learning_rate": 0.0002406103004754057, + "loss": 1.5981, + "step": 11192 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024060045031117034, + "loss": 1.6426, + "step": 11193 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024059059953180793, + "loss": 1.5578, + "step": 11194 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024058074813738533, + "loss": 1.6006, + "step": 11195 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024057089612796945, + "loss": 1.6082, + "step": 11196 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024056104350362716, + "loss": 1.6283, + "step": 11197 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024055119026442543, + "loss": 1.605, + "step": 11198 + }, + { + "epoch": 0.88, + "learning_rate": 0.000240541336410431, + "loss": 1.6037, + "step": 11199 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024053148194171087, + "loss": 1.5952, + "step": 11200 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024052162685833198, + "loss": 1.6169, + "step": 11201 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024051177116036116, + "loss": 1.5987, + "step": 11202 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024050191484786538, + "loss": 1.6703, + "step": 11203 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024049205792091156, + "loss": 1.565, + "step": 11204 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024048220037956657, + "loss": 1.6087, + "step": 11205 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024047234222389737, + "loss": 1.5867, + "step": 11206 + }, + { + "epoch": 0.88, + "learning_rate": 0.0002404624834539709, + "loss": 1.618, + "step": 11207 + }, + { + "epoch": 0.88, + "learning_rate": 0.0002404526240698541, + "loss": 1.559, + "step": 11208 + }, + { + "epoch": 0.88, + "learning_rate": 0.0002404427640716139, + "loss": 1.5937, + "step": 11209 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024043290345931724, + "loss": 1.6289, + "step": 11210 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024042304223303104, + "loss": 1.5809, + "step": 11211 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024041318039282232, + "loss": 1.5888, + "step": 11212 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024040331793875799, + "loss": 1.5769, + "step": 11213 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024039345487090504, + "loss": 1.6093, + "step": 11214 + }, + { + "epoch": 0.88, + "learning_rate": 0.0002403835911893304, + "loss": 1.6149, + "step": 11215 + }, + { + "epoch": 0.88, + "learning_rate": 0.000240373726894101, + "loss": 1.5835, + "step": 11216 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024036386198528393, + "loss": 1.612, + "step": 11217 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024035399646294607, + "loss": 1.5382, + "step": 11218 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024034413032715445, + "loss": 1.601, + "step": 11219 + }, + { + "epoch": 0.88, + "learning_rate": 0.0002403342635779761, + "loss": 1.6222, + "step": 11220 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024032439621547786, + "loss": 1.5884, + "step": 11221 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024031452823972685, + "loss": 1.5299, + "step": 11222 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024030465965079004, + "loss": 1.6656, + "step": 11223 + }, + { + "epoch": 0.88, + "learning_rate": 0.0002402947904487344, + "loss": 1.5758, + "step": 11224 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024028492063362698, + "loss": 1.6135, + "step": 11225 + }, + { + "epoch": 0.88, + "learning_rate": 0.0002402750502055348, + "loss": 1.5665, + "step": 11226 + }, + { + "epoch": 0.88, + "learning_rate": 0.0002402651791645248, + "loss": 1.6702, + "step": 11227 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024025530751066405, + "loss": 1.6292, + "step": 11228 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024024543524401963, + "loss": 1.5687, + "step": 11229 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024023556236465844, + "loss": 1.6109, + "step": 11230 + }, + { + "epoch": 0.88, + "learning_rate": 0.0002402256888726476, + "loss": 1.6124, + "step": 11231 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024021581476805408, + "loss": 1.5829, + "step": 11232 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024020594005094503, + "loss": 1.6157, + "step": 11233 + }, + { + "epoch": 0.88, + "learning_rate": 0.0002401960647213874, + "loss": 1.6545, + "step": 11234 + }, + { + "epoch": 0.88, + "learning_rate": 0.0002401861887794483, + "loss": 1.6087, + "step": 11235 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024017631222519469, + "loss": 1.6269, + "step": 11236 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024016643505869368, + "loss": 1.6178, + "step": 11237 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024015655728001236, + "loss": 1.6249, + "step": 11238 + }, + { + "epoch": 0.88, + "learning_rate": 0.0002401466788892178, + "loss": 1.647, + "step": 11239 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024013679988637703, + "loss": 1.622, + "step": 11240 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024012692027155705, + "loss": 1.5836, + "step": 11241 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024011704004482507, + "loss": 1.5313, + "step": 11242 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024010715920624816, + "loss": 1.607, + "step": 11243 + }, + { + "epoch": 0.88, + "learning_rate": 0.0002400972777558933, + "loss": 1.6103, + "step": 11244 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024008739569382766, + "loss": 1.6137, + "step": 11245 + }, + { + "epoch": 0.88, + "learning_rate": 0.00024007751302011836, + "loss": 1.6107, + "step": 11246 + }, + { + "epoch": 0.88, + "learning_rate": 0.0002400676297348324, + "loss": 1.636, + "step": 11247 + }, + { + "epoch": 0.89, + "learning_rate": 0.00024005774583803696, + "loss": 1.6596, + "step": 11248 + }, + { + "epoch": 0.89, + "learning_rate": 0.0002400478613297991, + "loss": 1.631, + "step": 11249 + }, + { + "epoch": 0.89, + "learning_rate": 0.00024003797621018598, + "loss": 1.6387, + "step": 11250 + }, + { + "epoch": 0.89, + "learning_rate": 0.00024002809047926472, + "loss": 1.6506, + "step": 11251 + }, + { + "epoch": 0.89, + "learning_rate": 0.00024001820413710237, + "loss": 1.6187, + "step": 11252 + }, + { + "epoch": 0.89, + "learning_rate": 0.0002400083171837661, + "loss": 1.6068, + "step": 11253 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023999842961932303, + "loss": 1.61, + "step": 11254 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023998854144384026, + "loss": 1.5818, + "step": 11255 + }, + { + "epoch": 0.89, + "learning_rate": 0.000239978652657385, + "loss": 1.5759, + "step": 11256 + }, + { + "epoch": 0.89, + "learning_rate": 0.0002399687632600243, + "loss": 1.5945, + "step": 11257 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023995887325182537, + "loss": 1.6797, + "step": 11258 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023994898263285535, + "loss": 1.5869, + "step": 11259 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023993909140318132, + "loss": 1.5934, + "step": 11260 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023992919956287051, + "loss": 1.6329, + "step": 11261 + }, + { + "epoch": 0.89, + "learning_rate": 0.0002399193071119901, + "loss": 1.5595, + "step": 11262 + }, + { + "epoch": 0.89, + "learning_rate": 0.0002399094140506072, + "loss": 1.6069, + "step": 11263 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023989952037878898, + "loss": 1.6138, + "step": 11264 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023988962609660262, + "loss": 1.6082, + "step": 11265 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023987973120411532, + "loss": 1.6145, + "step": 11266 + }, + { + "epoch": 0.89, + "learning_rate": 0.0002398698357013942, + "loss": 1.6266, + "step": 11267 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023985993958850656, + "loss": 1.6292, + "step": 11268 + }, + { + "epoch": 0.89, + "learning_rate": 0.0002398500428655195, + "loss": 1.5959, + "step": 11269 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023984014553250026, + "loss": 1.5823, + "step": 11270 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023983024758951596, + "loss": 1.6635, + "step": 11271 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023982034903663387, + "loss": 1.5589, + "step": 11272 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023981044987392112, + "loss": 1.5891, + "step": 11273 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023980055010144508, + "loss": 1.5997, + "step": 11274 + }, + { + "epoch": 0.89, + "learning_rate": 0.0002397906497192728, + "loss": 1.6442, + "step": 11275 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023978074872747158, + "loss": 1.625, + "step": 11276 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023977084712610862, + "loss": 1.6188, + "step": 11277 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023976094491525113, + "loss": 1.5332, + "step": 11278 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023975104209496634, + "loss": 1.6206, + "step": 11279 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023974113866532154, + "loss": 1.5756, + "step": 11280 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023973123462638389, + "loss": 1.6257, + "step": 11281 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023972132997822072, + "loss": 1.567, + "step": 11282 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023971142472089922, + "loss": 1.6107, + "step": 11283 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023970151885448668, + "loss": 1.6339, + "step": 11284 + }, + { + "epoch": 0.89, + "learning_rate": 0.0002396916123790503, + "loss": 1.6176, + "step": 11285 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023968170529465734, + "loss": 1.6626, + "step": 11286 + }, + { + "epoch": 0.89, + "learning_rate": 0.0002396717976013751, + "loss": 1.59, + "step": 11287 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023966188929927087, + "loss": 1.6095, + "step": 11288 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023965198038841188, + "loss": 1.624, + "step": 11289 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023964207086886542, + "loss": 1.5775, + "step": 11290 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023963216074069876, + "loss": 1.6203, + "step": 11291 + }, + { + "epoch": 0.89, + "learning_rate": 0.0002396222500039792, + "loss": 1.6078, + "step": 11292 + }, + { + "epoch": 0.89, + "learning_rate": 0.000239612338658774, + "loss": 1.576, + "step": 11293 + }, + { + "epoch": 0.89, + "learning_rate": 0.0002396024267051505, + "loss": 1.5565, + "step": 11294 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023959251414317596, + "loss": 1.5867, + "step": 11295 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023958260097291768, + "loss": 1.607, + "step": 11296 + }, + { + "epoch": 0.89, + "learning_rate": 0.000239572687194443, + "loss": 1.5743, + "step": 11297 + }, + { + "epoch": 0.89, + "learning_rate": 0.0002395627728078192, + "loss": 1.6087, + "step": 11298 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023955285781311356, + "loss": 1.5946, + "step": 11299 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023954294221039342, + "loss": 1.5776, + "step": 11300 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023953302599972616, + "loss": 1.6585, + "step": 11301 + }, + { + "epoch": 0.89, + "learning_rate": 0.0002395231091811791, + "loss": 1.5594, + "step": 11302 + }, + { + "epoch": 0.89, + "learning_rate": 0.0002395131917548195, + "loss": 1.5933, + "step": 11303 + }, + { + "epoch": 0.89, + "learning_rate": 0.0002395032737207147, + "loss": 1.6031, + "step": 11304 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023949335507893207, + "loss": 1.6679, + "step": 11305 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023948343582953893, + "loss": 1.5418, + "step": 11306 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023947351597260267, + "loss": 1.5369, + "step": 11307 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023946359550819062, + "loss": 1.6042, + "step": 11308 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023945367443637013, + "loss": 1.6443, + "step": 11309 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023944375275720853, + "loss": 1.5994, + "step": 11310 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023943383047077323, + "loss": 1.6244, + "step": 11311 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023942390757713153, + "loss": 1.6, + "step": 11312 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023941398407635088, + "loss": 1.6228, + "step": 11313 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023940405996849862, + "loss": 1.6429, + "step": 11314 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023939413525364214, + "loss": 1.6167, + "step": 11315 + }, + { + "epoch": 0.89, + "learning_rate": 0.0002393842099318488, + "loss": 1.5846, + "step": 11316 + }, + { + "epoch": 0.89, + "learning_rate": 0.000239374284003186, + "loss": 1.5714, + "step": 11317 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023936435746772113, + "loss": 1.6067, + "step": 11318 + }, + { + "epoch": 0.89, + "learning_rate": 0.0002393544303255216, + "loss": 1.6121, + "step": 11319 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023934450257665478, + "loss": 1.5986, + "step": 11320 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023933457422118808, + "loss": 1.6232, + "step": 11321 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023932464525918898, + "loss": 1.6356, + "step": 11322 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023931471569072478, + "loss": 1.5961, + "step": 11323 + }, + { + "epoch": 0.89, + "learning_rate": 0.000239304785515863, + "loss": 1.6255, + "step": 11324 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023929485473467093, + "loss": 1.6289, + "step": 11325 + }, + { + "epoch": 0.89, + "learning_rate": 0.0002392849233472161, + "loss": 1.6528, + "step": 11326 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023927499135356593, + "loss": 1.6195, + "step": 11327 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023926505875378787, + "loss": 1.6592, + "step": 11328 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023925512554794927, + "loss": 1.6012, + "step": 11329 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023924519173611761, + "loss": 1.568, + "step": 11330 + }, + { + "epoch": 0.89, + "learning_rate": 0.0002392352573183604, + "loss": 1.6183, + "step": 11331 + }, + { + "epoch": 0.89, + "learning_rate": 0.000239225322294745, + "loss": 1.6011, + "step": 11332 + }, + { + "epoch": 0.89, + "learning_rate": 0.0002392153866653389, + "loss": 1.5986, + "step": 11333 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023920545043020958, + "loss": 1.5718, + "step": 11334 + }, + { + "epoch": 0.89, + "learning_rate": 0.0002391955135894245, + "loss": 1.6246, + "step": 11335 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023918557614305104, + "loss": 1.6241, + "step": 11336 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023917563809115676, + "loss": 1.5754, + "step": 11337 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023916569943380913, + "loss": 1.5849, + "step": 11338 + }, + { + "epoch": 0.89, + "learning_rate": 0.0002391557601710756, + "loss": 1.5969, + "step": 11339 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023914582030302363, + "loss": 1.5802, + "step": 11340 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023913587982972076, + "loss": 1.6619, + "step": 11341 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023912593875123446, + "loss": 1.6128, + "step": 11342 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023911599706763224, + "loss": 1.6128, + "step": 11343 + }, + { + "epoch": 0.89, + "learning_rate": 0.0002391060547789815, + "loss": 1.5779, + "step": 11344 + }, + { + "epoch": 0.89, + "learning_rate": 0.0002390961118853499, + "loss": 1.6012, + "step": 11345 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023908616838680483, + "loss": 1.58, + "step": 11346 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023907622428341385, + "loss": 1.6072, + "step": 11347 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023906627957524446, + "loss": 1.5984, + "step": 11348 + }, + { + "epoch": 0.89, + "learning_rate": 0.0002390563342623642, + "loss": 1.6394, + "step": 11349 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023904638834484055, + "loss": 1.5807, + "step": 11350 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023903644182274105, + "loss": 1.59, + "step": 11351 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023902649469613327, + "loss": 1.6012, + "step": 11352 + }, + { + "epoch": 0.89, + "learning_rate": 0.0002390165469650847, + "loss": 1.6341, + "step": 11353 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023900659862966292, + "loss": 1.5974, + "step": 11354 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023899664968993545, + "loss": 1.6587, + "step": 11355 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023898670014596985, + "loss": 1.6249, + "step": 11356 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023897674999783365, + "loss": 1.574, + "step": 11357 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023896679924559442, + "loss": 1.6153, + "step": 11358 + }, + { + "epoch": 0.89, + "learning_rate": 0.0002389568478893197, + "loss": 1.595, + "step": 11359 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023894689592907707, + "loss": 1.6091, + "step": 11360 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023893694336493416, + "loss": 1.646, + "step": 11361 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023892699019695845, + "loss": 1.5539, + "step": 11362 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023891703642521753, + "loss": 1.5854, + "step": 11363 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023890708204977903, + "loss": 1.6038, + "step": 11364 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023889712707071052, + "loss": 1.538, + "step": 11365 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023888717148807956, + "loss": 1.5985, + "step": 11366 + }, + { + "epoch": 0.89, + "learning_rate": 0.0002388772153019537, + "loss": 1.6071, + "step": 11367 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023886725851240064, + "loss": 1.6156, + "step": 11368 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023885730111948797, + "loss": 1.6079, + "step": 11369 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023884734312328322, + "loss": 1.5805, + "step": 11370 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023883738452385405, + "loss": 1.5816, + "step": 11371 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023882742532126808, + "loss": 1.5992, + "step": 11372 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023881746551559287, + "loss": 1.5749, + "step": 11373 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023880750510689612, + "loss": 1.621, + "step": 11374 + }, + { + "epoch": 0.89, + "learning_rate": 0.00023879754409524535, + "loss": 1.6244, + "step": 11375 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023878758248070838, + "loss": 1.5995, + "step": 11376 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023877762026335266, + "loss": 1.6238, + "step": 11377 + }, + { + "epoch": 0.9, + "learning_rate": 0.0002387676574432459, + "loss": 1.6344, + "step": 11378 + }, + { + "epoch": 0.9, + "learning_rate": 0.0002387576940204557, + "loss": 1.578, + "step": 11379 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023874772999504972, + "loss": 1.6303, + "step": 11380 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023873776536709567, + "loss": 1.5849, + "step": 11381 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023872780013666118, + "loss": 1.6229, + "step": 11382 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023871783430381386, + "loss": 1.5879, + "step": 11383 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023870786786862143, + "loss": 1.5597, + "step": 11384 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023869790083115146, + "loss": 1.5984, + "step": 11385 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023868793319147176, + "loss": 1.5796, + "step": 11386 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023867796494964993, + "loss": 1.5724, + "step": 11387 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023866799610575368, + "loss": 1.6178, + "step": 11388 + }, + { + "epoch": 0.9, + "learning_rate": 0.0002386580266598506, + "loss": 1.5786, + "step": 11389 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023864805661200848, + "loss": 1.6317, + "step": 11390 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023863808596229495, + "loss": 1.6439, + "step": 11391 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023862811471077775, + "loss": 1.5945, + "step": 11392 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023861814285752454, + "loss": 1.6104, + "step": 11393 + }, + { + "epoch": 0.9, + "learning_rate": 0.0002386081704026031, + "loss": 1.5834, + "step": 11394 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023859819734608104, + "loss": 1.5618, + "step": 11395 + }, + { + "epoch": 0.9, + "learning_rate": 0.0002385882236880261, + "loss": 1.6528, + "step": 11396 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023857824942850604, + "loss": 1.6021, + "step": 11397 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023856827456758854, + "loss": 1.5696, + "step": 11398 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023855829910534129, + "loss": 1.5791, + "step": 11399 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023854832304183213, + "loss": 1.605, + "step": 11400 + }, + { + "epoch": 0.9, + "learning_rate": 0.0002385383463771287, + "loss": 1.6216, + "step": 11401 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023852836911129874, + "loss": 1.6024, + "step": 11402 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023851839124441, + "loss": 1.572, + "step": 11403 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023850841277653023, + "loss": 1.5959, + "step": 11404 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023849843370772722, + "loss": 1.6027, + "step": 11405 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023848845403806861, + "loss": 1.5828, + "step": 11406 + }, + { + "epoch": 0.9, + "learning_rate": 0.0002384784737676223, + "loss": 1.6424, + "step": 11407 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023846849289645597, + "loss": 1.6418, + "step": 11408 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023845851142463738, + "loss": 1.6646, + "step": 11409 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023844852935223432, + "loss": 1.6414, + "step": 11410 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023843854667931458, + "loss": 1.5635, + "step": 11411 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023842856340594584, + "loss": 1.5628, + "step": 11412 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023841857953219597, + "loss": 1.5487, + "step": 11413 + }, + { + "epoch": 0.9, + "learning_rate": 0.0002384085950581328, + "loss": 1.583, + "step": 11414 + }, + { + "epoch": 0.9, + "learning_rate": 0.000238398609983824, + "loss": 1.6302, + "step": 11415 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023838862430933746, + "loss": 1.6011, + "step": 11416 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023837863803474093, + "loss": 1.6312, + "step": 11417 + }, + { + "epoch": 0.9, + "learning_rate": 0.0002383686511601022, + "loss": 1.5743, + "step": 11418 + }, + { + "epoch": 0.9, + "learning_rate": 0.0002383586636854891, + "loss": 1.5912, + "step": 11419 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023834867561096942, + "loss": 1.6466, + "step": 11420 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023833868693661102, + "loss": 1.5784, + "step": 11421 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023832869766248166, + "loss": 1.5011, + "step": 11422 + }, + { + "epoch": 0.9, + "learning_rate": 0.0002383187077886492, + "loss": 1.6176, + "step": 11423 + }, + { + "epoch": 0.9, + "learning_rate": 0.0002383087173151814, + "loss": 1.5669, + "step": 11424 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023829872624214621, + "loss": 1.6743, + "step": 11425 + }, + { + "epoch": 0.9, + "learning_rate": 0.0002382887345696114, + "loss": 1.638, + "step": 11426 + }, + { + "epoch": 0.9, + "learning_rate": 0.0002382787422976448, + "loss": 1.6161, + "step": 11427 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023826874942631425, + "loss": 1.5575, + "step": 11428 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023825875595568754, + "loss": 1.6281, + "step": 11429 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023824876188583268, + "loss": 1.6094, + "step": 11430 + }, + { + "epoch": 0.9, + "learning_rate": 0.0002382387672168173, + "loss": 1.5718, + "step": 11431 + }, + { + "epoch": 0.9, + "learning_rate": 0.0002382287719487095, + "loss": 1.5855, + "step": 11432 + }, + { + "epoch": 0.9, + "learning_rate": 0.000238218776081577, + "loss": 1.5739, + "step": 11433 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023820877961548768, + "loss": 1.5873, + "step": 11434 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023819878255050943, + "loss": 1.5763, + "step": 11435 + }, + { + "epoch": 0.9, + "learning_rate": 0.0002381887848867101, + "loss": 1.6288, + "step": 11436 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023817878662415763, + "loss": 1.5942, + "step": 11437 + }, + { + "epoch": 0.9, + "learning_rate": 0.0002381687877629198, + "loss": 1.6023, + "step": 11438 + }, + { + "epoch": 0.9, + "learning_rate": 0.0002381587883030646, + "loss": 1.668, + "step": 11439 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023814878824465985, + "loss": 1.538, + "step": 11440 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023813878758777352, + "loss": 1.6285, + "step": 11441 + }, + { + "epoch": 0.9, + "learning_rate": 0.0002381287863324734, + "loss": 1.6789, + "step": 11442 + }, + { + "epoch": 0.9, + "learning_rate": 0.0002381187844788275, + "loss": 1.5073, + "step": 11443 + }, + { + "epoch": 0.9, + "learning_rate": 0.0002381087820269037, + "loss": 1.6241, + "step": 11444 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023809877897676982, + "loss": 1.5689, + "step": 11445 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023808877532849386, + "loss": 1.639, + "step": 11446 + }, + { + "epoch": 0.9, + "learning_rate": 0.0002380787710821438, + "loss": 1.6095, + "step": 11447 + }, + { + "epoch": 0.9, + "learning_rate": 0.0002380687662377874, + "loss": 1.6306, + "step": 11448 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023805876079549274, + "loss": 1.6142, + "step": 11449 + }, + { + "epoch": 0.9, + "learning_rate": 0.0002380487547553277, + "loss": 1.6166, + "step": 11450 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023803874811736015, + "loss": 1.587, + "step": 11451 + }, + { + "epoch": 0.9, + "learning_rate": 0.0002380287408816581, + "loss": 1.6306, + "step": 11452 + }, + { + "epoch": 0.9, + "learning_rate": 0.0002380187330482895, + "loss": 1.6395, + "step": 11453 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023800872461732226, + "loss": 1.6021, + "step": 11454 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023799871558882434, + "loss": 1.6366, + "step": 11455 + }, + { + "epoch": 0.9, + "learning_rate": 0.0002379887059628637, + "loss": 1.6077, + "step": 11456 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023797869573950834, + "loss": 1.6287, + "step": 11457 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023796868491882613, + "loss": 1.6274, + "step": 11458 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023795867350088514, + "loss": 1.6095, + "step": 11459 + }, + { + "epoch": 0.9, + "learning_rate": 0.0002379486614857533, + "loss": 1.5744, + "step": 11460 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023793864887349854, + "loss": 1.6564, + "step": 11461 + }, + { + "epoch": 0.9, + "learning_rate": 0.0002379286356641889, + "loss": 1.5879, + "step": 11462 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023791862185789238, + "loss": 1.6144, + "step": 11463 + }, + { + "epoch": 0.9, + "learning_rate": 0.0002379086074546769, + "loss": 1.6189, + "step": 11464 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023789859245461052, + "loss": 1.6119, + "step": 11465 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023788857685776117, + "loss": 1.6139, + "step": 11466 + }, + { + "epoch": 0.9, + "learning_rate": 0.0002378785606641969, + "loss": 1.5566, + "step": 11467 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023786854387398566, + "loss": 1.6245, + "step": 11468 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023785852648719553, + "loss": 1.6436, + "step": 11469 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023784850850389449, + "loss": 1.5784, + "step": 11470 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023783848992415052, + "loss": 1.5852, + "step": 11471 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023782847074803177, + "loss": 1.5777, + "step": 11472 + }, + { + "epoch": 0.9, + "learning_rate": 0.0002378184509756061, + "loss": 1.5757, + "step": 11473 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023780843060694162, + "loss": 1.6092, + "step": 11474 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023779840964210637, + "loss": 1.5575, + "step": 11475 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023778838808116836, + "loss": 1.5998, + "step": 11476 + }, + { + "epoch": 0.9, + "learning_rate": 0.0002377783659241956, + "loss": 1.612, + "step": 11477 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023776834317125624, + "loss": 1.6555, + "step": 11478 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023775831982241825, + "loss": 1.5781, + "step": 11479 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023774829587774966, + "loss": 1.6357, + "step": 11480 + }, + { + "epoch": 0.9, + "learning_rate": 0.0002377382713373186, + "loss": 1.6817, + "step": 11481 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023772824620119307, + "loss": 1.6128, + "step": 11482 + }, + { + "epoch": 0.9, + "learning_rate": 0.0002377182204694412, + "loss": 1.5811, + "step": 11483 + }, + { + "epoch": 0.9, + "learning_rate": 0.000237708194142131, + "loss": 1.6499, + "step": 11484 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023769816721933056, + "loss": 1.6027, + "step": 11485 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023768813970110792, + "loss": 1.5468, + "step": 11486 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023767811158753124, + "loss": 1.5542, + "step": 11487 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023766808287866857, + "loss": 1.5499, + "step": 11488 + }, + { + "epoch": 0.9, + "learning_rate": 0.000237658053574588, + "loss": 1.5858, + "step": 11489 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023764802367535765, + "loss": 1.593, + "step": 11490 + }, + { + "epoch": 0.9, + "learning_rate": 0.0002376379931810455, + "loss": 1.6311, + "step": 11491 + }, + { + "epoch": 0.9, + "learning_rate": 0.0002376279620917198, + "loss": 1.6422, + "step": 11492 + }, + { + "epoch": 0.9, + "learning_rate": 0.0002376179304074486, + "loss": 1.6225, + "step": 11493 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023760789812829998, + "loss": 1.6113, + "step": 11494 + }, + { + "epoch": 0.9, + "learning_rate": 0.0002375978652543421, + "loss": 1.6251, + "step": 11495 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023758783178564304, + "loss": 1.65, + "step": 11496 + }, + { + "epoch": 0.9, + "learning_rate": 0.0002375777977222709, + "loss": 1.6421, + "step": 11497 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023756776306429393, + "loss": 1.6146, + "step": 11498 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023755772781178008, + "loss": 1.6307, + "step": 11499 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023754769196479764, + "loss": 1.6146, + "step": 11500 + }, + { + "epoch": 0.9, + "learning_rate": 0.00023753765552341467, + "loss": 1.5878, + "step": 11501 + }, + { + "epoch": 0.9, + "learning_rate": 0.0002375276184876993, + "loss": 1.6898, + "step": 11502 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023751758085771975, + "loss": 1.6026, + "step": 11503 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023750754263354408, + "loss": 1.5907, + "step": 11504 + }, + { + "epoch": 0.91, + "learning_rate": 0.0002374975038152405, + "loss": 1.58, + "step": 11505 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023748746440287717, + "loss": 1.6177, + "step": 11506 + }, + { + "epoch": 0.91, + "learning_rate": 0.0002374774243965222, + "loss": 1.59, + "step": 11507 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023746738379624383, + "loss": 1.5938, + "step": 11508 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023745734260211017, + "loss": 1.6202, + "step": 11509 + }, + { + "epoch": 0.91, + "learning_rate": 0.0002374473008141894, + "loss": 1.6404, + "step": 11510 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023743725843254976, + "loss": 1.5898, + "step": 11511 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023742721545725936, + "loss": 1.614, + "step": 11512 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023741717188838644, + "loss": 1.5938, + "step": 11513 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023740712772599913, + "loss": 1.5829, + "step": 11514 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023739708297016565, + "loss": 1.5808, + "step": 11515 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023738703762095424, + "loss": 1.5961, + "step": 11516 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023737699167843305, + "loss": 1.5825, + "step": 11517 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023736694514267032, + "loss": 1.5999, + "step": 11518 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023735689801373424, + "loss": 1.6014, + "step": 11519 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023734685029169305, + "loss": 1.6506, + "step": 11520 + }, + { + "epoch": 0.91, + "learning_rate": 0.0002373368019766149, + "loss": 1.5498, + "step": 11521 + }, + { + "epoch": 0.91, + "learning_rate": 0.0002373267530685681, + "loss": 1.581, + "step": 11522 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023731670356762083, + "loss": 1.5555, + "step": 11523 + }, + { + "epoch": 0.91, + "learning_rate": 0.0002373066534738413, + "loss": 1.6258, + "step": 11524 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023729660278729782, + "loss": 1.5373, + "step": 11525 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023728655150805856, + "loss": 1.6758, + "step": 11526 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023727649963619176, + "loss": 1.6311, + "step": 11527 + }, + { + "epoch": 0.91, + "learning_rate": 0.0002372664471717657, + "loss": 1.6034, + "step": 11528 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023725639411484865, + "loss": 1.561, + "step": 11529 + }, + { + "epoch": 0.91, + "learning_rate": 0.0002372463404655088, + "loss": 1.6037, + "step": 11530 + }, + { + "epoch": 0.91, + "learning_rate": 0.0002372362862238145, + "loss": 1.5488, + "step": 11531 + }, + { + "epoch": 0.91, + "learning_rate": 0.0002372262313898339, + "loss": 1.6326, + "step": 11532 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023721617596363535, + "loss": 1.5522, + "step": 11533 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023720611994528708, + "loss": 1.5797, + "step": 11534 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023719606333485736, + "loss": 1.5801, + "step": 11535 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023718600613241452, + "loss": 1.5963, + "step": 11536 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023717594833802685, + "loss": 1.6089, + "step": 11537 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023716588995176255, + "loss": 1.6494, + "step": 11538 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023715583097369, + "loss": 1.6217, + "step": 11539 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023714577140387737, + "loss": 1.6328, + "step": 11540 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023713571124239313, + "loss": 1.628, + "step": 11541 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023712565048930544, + "loss": 1.5788, + "step": 11542 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023711558914468267, + "loss": 1.5909, + "step": 11543 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023710552720859312, + "loss": 1.6136, + "step": 11544 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023709546468110514, + "loss": 1.5654, + "step": 11545 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023708540156228703, + "loss": 1.6195, + "step": 11546 + }, + { + "epoch": 0.91, + "learning_rate": 0.0002370753378522071, + "loss": 1.5893, + "step": 11547 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023706527355093362, + "loss": 1.6455, + "step": 11548 + }, + { + "epoch": 0.91, + "learning_rate": 0.000237055208658535, + "loss": 1.5679, + "step": 11549 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023704514317507958, + "loss": 1.5588, + "step": 11550 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023703507710063566, + "loss": 1.5775, + "step": 11551 + }, + { + "epoch": 0.91, + "learning_rate": 0.0002370250104352716, + "loss": 1.5967, + "step": 11552 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023701494317905574, + "loss": 1.5907, + "step": 11553 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023700487533205645, + "loss": 1.6458, + "step": 11554 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023699480689434206, + "loss": 1.5948, + "step": 11555 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023698473786598094, + "loss": 1.6164, + "step": 11556 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023697466824704143, + "loss": 1.6076, + "step": 11557 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023696459803759193, + "loss": 1.6092, + "step": 11558 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023695452723770079, + "loss": 1.6054, + "step": 11559 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023694445584743643, + "loss": 1.5407, + "step": 11560 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023693438386686717, + "loss": 1.6246, + "step": 11561 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023692431129606142, + "loss": 1.6089, + "step": 11562 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023691423813508762, + "loss": 1.7036, + "step": 11563 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023690416438401402, + "loss": 1.6066, + "step": 11564 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023689409004290914, + "loss": 1.616, + "step": 11565 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023688401511184133, + "loss": 1.5739, + "step": 11566 + }, + { + "epoch": 0.91, + "learning_rate": 0.000236873939590879, + "loss": 1.6029, + "step": 11567 + }, + { + "epoch": 0.91, + "learning_rate": 0.0002368638634800906, + "loss": 1.5968, + "step": 11568 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023685378677954449, + "loss": 1.5495, + "step": 11569 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023684370948930905, + "loss": 1.5316, + "step": 11570 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023683363160945277, + "loss": 1.6172, + "step": 11571 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023682355314004407, + "loss": 1.6294, + "step": 11572 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023681347408115137, + "loss": 1.6345, + "step": 11573 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023680339443284305, + "loss": 1.559, + "step": 11574 + }, + { + "epoch": 0.91, + "learning_rate": 0.0002367933141951876, + "loss": 1.5339, + "step": 11575 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023678323336825342, + "loss": 1.5619, + "step": 11576 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023677315195210904, + "loss": 1.5978, + "step": 11577 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023676306994682277, + "loss": 1.5164, + "step": 11578 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023675298735246315, + "loss": 1.6016, + "step": 11579 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023674290416909866, + "loss": 1.6059, + "step": 11580 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023673282039679772, + "loss": 1.5943, + "step": 11581 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023672273603562874, + "loss": 1.5852, + "step": 11582 + }, + { + "epoch": 0.91, + "learning_rate": 0.0002367126510856603, + "loss": 1.6039, + "step": 11583 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023670256554696076, + "loss": 1.5636, + "step": 11584 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023669247941959868, + "loss": 1.593, + "step": 11585 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023668239270364252, + "loss": 1.5866, + "step": 11586 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023667230539916066, + "loss": 1.5395, + "step": 11587 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023666221750622175, + "loss": 1.571, + "step": 11588 + }, + { + "epoch": 0.91, + "learning_rate": 0.0002366521290248942, + "loss": 1.6096, + "step": 11589 + }, + { + "epoch": 0.91, + "learning_rate": 0.0002366420399552465, + "loss": 1.6102, + "step": 11590 + }, + { + "epoch": 0.91, + "learning_rate": 0.0002366319502973472, + "loss": 1.6356, + "step": 11591 + }, + { + "epoch": 0.91, + "learning_rate": 0.0002366218600512647, + "loss": 1.6123, + "step": 11592 + }, + { + "epoch": 0.91, + "learning_rate": 0.0002366117692170676, + "loss": 1.6392, + "step": 11593 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023660167779482444, + "loss": 1.6046, + "step": 11594 + }, + { + "epoch": 0.91, + "learning_rate": 0.0002365915857846036, + "loss": 1.5837, + "step": 11595 + }, + { + "epoch": 0.91, + "learning_rate": 0.0002365814931864737, + "loss": 1.5807, + "step": 11596 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023657140000050327, + "loss": 1.5478, + "step": 11597 + }, + { + "epoch": 0.91, + "learning_rate": 0.0002365613062267608, + "loss": 1.6194, + "step": 11598 + }, + { + "epoch": 0.91, + "learning_rate": 0.0002365512118653148, + "loss": 1.6623, + "step": 11599 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023654111691623385, + "loss": 1.6768, + "step": 11600 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023653102137958647, + "loss": 1.6164, + "step": 11601 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023652092525544124, + "loss": 1.6425, + "step": 11602 + }, + { + "epoch": 0.91, + "learning_rate": 0.0002365108285438666, + "loss": 1.548, + "step": 11603 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023650073124493123, + "loss": 1.5832, + "step": 11604 + }, + { + "epoch": 0.91, + "learning_rate": 0.0002364906333587036, + "loss": 1.6284, + "step": 11605 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023648053488525234, + "loss": 1.5669, + "step": 11606 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023647043582464595, + "loss": 1.6663, + "step": 11607 + }, + { + "epoch": 0.91, + "learning_rate": 0.000236460336176953, + "loss": 1.5609, + "step": 11608 + }, + { + "epoch": 0.91, + "learning_rate": 0.0002364502359422421, + "loss": 1.6292, + "step": 11609 + }, + { + "epoch": 0.91, + "learning_rate": 0.0002364401351205818, + "loss": 1.6125, + "step": 11610 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023643003371204068, + "loss": 1.5857, + "step": 11611 + }, + { + "epoch": 0.91, + "learning_rate": 0.0002364199317166873, + "loss": 1.5755, + "step": 11612 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023640982913459036, + "loss": 1.6658, + "step": 11613 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023639972596581831, + "loss": 1.6047, + "step": 11614 + }, + { + "epoch": 0.91, + "learning_rate": 0.0002363896222104398, + "loss": 1.6337, + "step": 11615 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023637951786852345, + "loss": 1.5597, + "step": 11616 + }, + { + "epoch": 0.91, + "learning_rate": 0.0002363694129401378, + "loss": 1.5994, + "step": 11617 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023635930742535154, + "loss": 1.6088, + "step": 11618 + }, + { + "epoch": 0.91, + "learning_rate": 0.0002363492013242332, + "loss": 1.6576, + "step": 11619 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023633909463685148, + "loss": 1.594, + "step": 11620 + }, + { + "epoch": 0.91, + "learning_rate": 0.0002363289873632749, + "loss": 1.6213, + "step": 11621 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023631887950357217, + "loss": 1.6, + "step": 11622 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023630877105781188, + "loss": 1.616, + "step": 11623 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023629866202606268, + "loss": 1.5863, + "step": 11624 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023628855240839314, + "loss": 1.6373, + "step": 11625 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023627844220487198, + "loss": 1.5659, + "step": 11626 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023626833141556782, + "loss": 1.5961, + "step": 11627 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023625822004054927, + "loss": 1.6479, + "step": 11628 + }, + { + "epoch": 0.91, + "learning_rate": 0.00023624810807988504, + "loss": 1.6202, + "step": 11629 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023623799553364373, + "loss": 1.651, + "step": 11630 + }, + { + "epoch": 0.92, + "learning_rate": 0.000236227882401894, + "loss": 1.5609, + "step": 11631 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023621776868470458, + "loss": 1.6076, + "step": 11632 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023620765438214406, + "loss": 1.6447, + "step": 11633 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023619753949428115, + "loss": 1.6212, + "step": 11634 + }, + { + "epoch": 0.92, + "learning_rate": 0.0002361874240211845, + "loss": 1.6699, + "step": 11635 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023617730796292283, + "loss": 1.6344, + "step": 11636 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023616719131956478, + "loss": 1.6268, + "step": 11637 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023615707409117904, + "loss": 1.6005, + "step": 11638 + }, + { + "epoch": 0.92, + "learning_rate": 0.0002361469562778343, + "loss": 1.6236, + "step": 11639 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023613683787959932, + "loss": 1.5976, + "step": 11640 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023612671889654271, + "loss": 1.5778, + "step": 11641 + }, + { + "epoch": 0.92, + "learning_rate": 0.0002361165993287332, + "loss": 1.5658, + "step": 11642 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023610647917623955, + "loss": 1.5113, + "step": 11643 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023609635843913038, + "loss": 1.6214, + "step": 11644 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023608623711747446, + "loss": 1.6737, + "step": 11645 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023607611521134046, + "loss": 1.6033, + "step": 11646 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023606599272079723, + "loss": 1.5772, + "step": 11647 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023605586964591332, + "loss": 1.6151, + "step": 11648 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023604574598675755, + "loss": 1.6165, + "step": 11649 + }, + { + "epoch": 0.92, + "learning_rate": 0.0002360356217433987, + "loss": 1.6165, + "step": 11650 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023602549691590543, + "loss": 1.6176, + "step": 11651 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023601537150434647, + "loss": 1.5869, + "step": 11652 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023600524550879067, + "loss": 1.6145, + "step": 11653 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023599511892930666, + "loss": 1.6153, + "step": 11654 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023598499176596328, + "loss": 1.6333, + "step": 11655 + }, + { + "epoch": 0.92, + "learning_rate": 0.0002359748640188293, + "loss": 1.4794, + "step": 11656 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023596473568797337, + "loss": 1.6229, + "step": 11657 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023595460677346434, + "loss": 1.5977, + "step": 11658 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023594447727537095, + "loss": 1.6453, + "step": 11659 + }, + { + "epoch": 0.92, + "learning_rate": 0.000235934347193762, + "loss": 1.6182, + "step": 11660 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023592421652870625, + "loss": 1.6196, + "step": 11661 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023591408528027253, + "loss": 1.5761, + "step": 11662 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023590395344852953, + "loss": 1.6637, + "step": 11663 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023589382103354612, + "loss": 1.6194, + "step": 11664 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023588368803539105, + "loss": 1.5611, + "step": 11665 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023587355445413313, + "loss": 1.6235, + "step": 11666 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023586342028984115, + "loss": 1.6085, + "step": 11667 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023585328554258397, + "loss": 1.6316, + "step": 11668 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023584315021243034, + "loss": 1.5609, + "step": 11669 + }, + { + "epoch": 0.92, + "learning_rate": 0.0002358330142994491, + "loss": 1.5266, + "step": 11670 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023582287780370907, + "loss": 1.6266, + "step": 11671 + }, + { + "epoch": 0.92, + "learning_rate": 0.000235812740725279, + "loss": 1.6306, + "step": 11672 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023580260306422783, + "loss": 1.6312, + "step": 11673 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023579246482062431, + "loss": 1.6195, + "step": 11674 + }, + { + "epoch": 0.92, + "learning_rate": 0.0002357823259945373, + "loss": 1.5751, + "step": 11675 + }, + { + "epoch": 0.92, + "learning_rate": 0.0002357721865860357, + "loss": 1.5981, + "step": 11676 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023576204659518817, + "loss": 1.6082, + "step": 11677 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023575190602206377, + "loss": 1.6097, + "step": 11678 + }, + { + "epoch": 0.92, + "learning_rate": 0.0002357417648667312, + "loss": 1.6055, + "step": 11679 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023573162312925938, + "loss": 1.599, + "step": 11680 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023572148080971714, + "loss": 1.6285, + "step": 11681 + }, + { + "epoch": 0.92, + "learning_rate": 0.0002357113379081734, + "loss": 1.5977, + "step": 11682 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023570119442469688, + "loss": 1.6359, + "step": 11683 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023569105035935664, + "loss": 1.5805, + "step": 11684 + }, + { + "epoch": 0.92, + "learning_rate": 0.0002356809057122214, + "loss": 1.5849, + "step": 11685 + }, + { + "epoch": 0.92, + "learning_rate": 0.0002356707604833601, + "loss": 1.5446, + "step": 11686 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023566061467284163, + "loss": 1.6111, + "step": 11687 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023565046828073484, + "loss": 1.6375, + "step": 11688 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023564032130710862, + "loss": 1.5672, + "step": 11689 + }, + { + "epoch": 0.92, + "learning_rate": 0.0002356301737520319, + "loss": 1.6115, + "step": 11690 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023562002561557354, + "loss": 1.5747, + "step": 11691 + }, + { + "epoch": 0.92, + "learning_rate": 0.0002356098768978025, + "loss": 1.6111, + "step": 11692 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023559972759878764, + "loss": 1.6245, + "step": 11693 + }, + { + "epoch": 0.92, + "learning_rate": 0.0002355895777185978, + "loss": 1.5746, + "step": 11694 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023557942725730202, + "loss": 1.608, + "step": 11695 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023556927621496912, + "loss": 1.6194, + "step": 11696 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023555912459166805, + "loss": 1.5804, + "step": 11697 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023554897238746775, + "loss": 1.61, + "step": 11698 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023553881960243717, + "loss": 1.5545, + "step": 11699 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023552866623664516, + "loss": 1.5947, + "step": 11700 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023551851229016072, + "loss": 1.6171, + "step": 11701 + }, + { + "epoch": 0.92, + "learning_rate": 0.0002355083577630528, + "loss": 1.5477, + "step": 11702 + }, + { + "epoch": 0.92, + "learning_rate": 0.0002354982026553903, + "loss": 1.5781, + "step": 11703 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023548804696724217, + "loss": 1.5994, + "step": 11704 + }, + { + "epoch": 0.92, + "learning_rate": 0.0002354778906986774, + "loss": 1.6066, + "step": 11705 + }, + { + "epoch": 0.92, + "learning_rate": 0.0002354677338497649, + "loss": 1.5794, + "step": 11706 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023545757642057369, + "loss": 1.6542, + "step": 11707 + }, + { + "epoch": 0.92, + "learning_rate": 0.0002354474184111727, + "loss": 1.5594, + "step": 11708 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023543725982163086, + "loss": 1.5952, + "step": 11709 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023542710065201715, + "loss": 1.6267, + "step": 11710 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023541694090240063, + "loss": 1.5831, + "step": 11711 + }, + { + "epoch": 0.92, + "learning_rate": 0.0002354067805728502, + "loss": 1.6368, + "step": 11712 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023539661966343484, + "loss": 1.6043, + "step": 11713 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023538645817422358, + "loss": 1.6464, + "step": 11714 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023537629610528537, + "loss": 1.6353, + "step": 11715 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023536613345668923, + "loss": 1.6063, + "step": 11716 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023535597022850414, + "loss": 1.6345, + "step": 11717 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023534580642079915, + "loss": 1.6128, + "step": 11718 + }, + { + "epoch": 0.92, + "learning_rate": 0.0002353356420336432, + "loss": 1.5719, + "step": 11719 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023532547706710537, + "loss": 1.5849, + "step": 11720 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023531531152125456, + "loss": 1.5889, + "step": 11721 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023530514539615993, + "loss": 1.6154, + "step": 11722 + }, + { + "epoch": 0.92, + "learning_rate": 0.0002352949786918904, + "loss": 1.5177, + "step": 11723 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023528481140851508, + "loss": 1.6136, + "step": 11724 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023527464354610296, + "loss": 1.5577, + "step": 11725 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023526447510472304, + "loss": 1.5549, + "step": 11726 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023525430608444436, + "loss": 1.6567, + "step": 11727 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023524413648533604, + "loss": 1.5567, + "step": 11728 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023523396630746704, + "loss": 1.5812, + "step": 11729 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023522379555090646, + "loss": 1.5311, + "step": 11730 + }, + { + "epoch": 0.92, + "learning_rate": 0.0002352136242157233, + "loss": 1.6268, + "step": 11731 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023520345230198674, + "loss": 1.5619, + "step": 11732 + }, + { + "epoch": 0.92, + "learning_rate": 0.0002351932798097657, + "loss": 1.6235, + "step": 11733 + }, + { + "epoch": 0.92, + "learning_rate": 0.0002351831067391293, + "loss": 1.5728, + "step": 11734 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023517293309014664, + "loss": 1.5843, + "step": 11735 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023516275886288672, + "loss": 1.5437, + "step": 11736 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023515258405741875, + "loss": 1.5365, + "step": 11737 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023514240867381168, + "loss": 1.6155, + "step": 11738 + }, + { + "epoch": 0.92, + "learning_rate": 0.0002351322327121346, + "loss": 1.6356, + "step": 11739 + }, + { + "epoch": 0.92, + "learning_rate": 0.0002351220561724567, + "loss": 1.5482, + "step": 11740 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023511187905484699, + "loss": 1.6199, + "step": 11741 + }, + { + "epoch": 0.92, + "learning_rate": 0.0002351017013593746, + "loss": 1.5994, + "step": 11742 + }, + { + "epoch": 0.92, + "learning_rate": 0.0002350915230861086, + "loss": 1.673, + "step": 11743 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023508134423511808, + "loss": 1.6264, + "step": 11744 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023507116480647223, + "loss": 1.6198, + "step": 11745 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023506098480024012, + "loss": 1.5559, + "step": 11746 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023505080421649087, + "loss": 1.5963, + "step": 11747 + }, + { + "epoch": 0.92, + "learning_rate": 0.0002350406230552936, + "loss": 1.5472, + "step": 11748 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023503044131671741, + "loss": 1.6148, + "step": 11749 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023502025900083145, + "loss": 1.6263, + "step": 11750 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023501007610770484, + "loss": 1.5985, + "step": 11751 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023499989263740673, + "loss": 1.5899, + "step": 11752 + }, + { + "epoch": 0.92, + "learning_rate": 0.0002349897085900063, + "loss": 1.5628, + "step": 11753 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023497952396557258, + "loss": 1.6147, + "step": 11754 + }, + { + "epoch": 0.92, + "learning_rate": 0.00023496933876417483, + "loss": 1.5549, + "step": 11755 + }, + { + "epoch": 0.92, + "learning_rate": 0.0002349591529858821, + "loss": 1.6594, + "step": 11756 + }, + { + "epoch": 0.93, + "learning_rate": 0.0002349489666307637, + "loss": 1.5941, + "step": 11757 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023493877969888867, + "loss": 1.5904, + "step": 11758 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023492859219032615, + "loss": 1.6314, + "step": 11759 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023491840410514535, + "loss": 1.6003, + "step": 11760 + }, + { + "epoch": 0.93, + "learning_rate": 0.0002349082154434155, + "loss": 1.519, + "step": 11761 + }, + { + "epoch": 0.93, + "learning_rate": 0.0002348980262052057, + "loss": 1.6089, + "step": 11762 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023488783639058516, + "loss": 1.573, + "step": 11763 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023487764599962308, + "loss": 1.6487, + "step": 11764 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023486745503238857, + "loss": 1.5818, + "step": 11765 + }, + { + "epoch": 0.93, + "learning_rate": 0.0002348572634889509, + "loss": 1.5879, + "step": 11766 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023484707136937923, + "loss": 1.6077, + "step": 11767 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023483687867374277, + "loss": 1.6012, + "step": 11768 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023482668540211074, + "loss": 1.5668, + "step": 11769 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023481649155455232, + "loss": 1.5786, + "step": 11770 + }, + { + "epoch": 0.93, + "learning_rate": 0.0002348062971311367, + "loss": 1.6017, + "step": 11771 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023479610213193318, + "loss": 1.5873, + "step": 11772 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023478590655701085, + "loss": 1.5605, + "step": 11773 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023477571040643908, + "loss": 1.601, + "step": 11774 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023476551368028698, + "loss": 1.606, + "step": 11775 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023475531637862378, + "loss": 1.6631, + "step": 11776 + }, + { + "epoch": 0.93, + "learning_rate": 0.0002347451185015188, + "loss": 1.6055, + "step": 11777 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023473492004904122, + "loss": 1.5506, + "step": 11778 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023472472102126029, + "loss": 1.5802, + "step": 11779 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023471452141824532, + "loss": 1.6272, + "step": 11780 + }, + { + "epoch": 0.93, + "learning_rate": 0.0002347043212400654, + "loss": 1.6161, + "step": 11781 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023469412048678995, + "loss": 1.5724, + "step": 11782 + }, + { + "epoch": 0.93, + "learning_rate": 0.0002346839191584881, + "loss": 1.593, + "step": 11783 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023467371725522924, + "loss": 1.6126, + "step": 11784 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023466351477708253, + "loss": 1.6372, + "step": 11785 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023465331172411728, + "loss": 1.5723, + "step": 11786 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023464310809640277, + "loss": 1.5968, + "step": 11787 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023463290389400828, + "loss": 1.6556, + "step": 11788 + }, + { + "epoch": 0.93, + "learning_rate": 0.000234622699117003, + "loss": 1.5736, + "step": 11789 + }, + { + "epoch": 0.93, + "learning_rate": 0.0002346124937654564, + "loss": 1.6134, + "step": 11790 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023460228783943755, + "loss": 1.6356, + "step": 11791 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023459208133901592, + "loss": 1.6317, + "step": 11792 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023458187426426074, + "loss": 1.6355, + "step": 11793 + }, + { + "epoch": 0.93, + "learning_rate": 0.0002345716666152413, + "loss": 1.6237, + "step": 11794 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023456145839202694, + "loss": 1.625, + "step": 11795 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023455124959468693, + "loss": 1.5573, + "step": 11796 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023454104022329058, + "loss": 1.5876, + "step": 11797 + }, + { + "epoch": 0.93, + "learning_rate": 0.0002345308302779072, + "loss": 1.623, + "step": 11798 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023452061975860614, + "loss": 1.6419, + "step": 11799 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023451040866545673, + "loss": 1.5952, + "step": 11800 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023450019699852826, + "loss": 1.6572, + "step": 11801 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023448998475789008, + "loss": 1.6161, + "step": 11802 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023447977194361155, + "loss": 1.558, + "step": 11803 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023446955855576203, + "loss": 1.5848, + "step": 11804 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023445934459441077, + "loss": 1.6554, + "step": 11805 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023444913005962718, + "loss": 1.5816, + "step": 11806 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023443891495148058, + "loss": 1.6105, + "step": 11807 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023442869927004032, + "loss": 1.6236, + "step": 11808 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023441848301537587, + "loss": 1.5724, + "step": 11809 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023440826618755645, + "loss": 1.5733, + "step": 11810 + }, + { + "epoch": 0.93, + "learning_rate": 0.0002343980487866515, + "loss": 1.6671, + "step": 11811 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023438783081273037, + "loss": 1.5864, + "step": 11812 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023437761226586244, + "loss": 1.568, + "step": 11813 + }, + { + "epoch": 0.93, + "learning_rate": 0.0002343673931461171, + "loss": 1.6219, + "step": 11814 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023435717345356367, + "loss": 1.6193, + "step": 11815 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023434695318827164, + "loss": 1.6087, + "step": 11816 + }, + { + "epoch": 0.93, + "learning_rate": 0.0002343367323503103, + "loss": 1.5785, + "step": 11817 + }, + { + "epoch": 0.93, + "learning_rate": 0.0002343265109397491, + "loss": 1.6371, + "step": 11818 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023431628895665747, + "loss": 1.6078, + "step": 11819 + }, + { + "epoch": 0.93, + "learning_rate": 0.0002343060664011047, + "loss": 1.6491, + "step": 11820 + }, + { + "epoch": 0.93, + "learning_rate": 0.0002342958432731603, + "loss": 1.5982, + "step": 11821 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023428561957289365, + "loss": 1.5763, + "step": 11822 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023427539530037413, + "loss": 1.6113, + "step": 11823 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023426517045567116, + "loss": 1.5718, + "step": 11824 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023425494503885423, + "loss": 1.6198, + "step": 11825 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023424471904999274, + "loss": 1.6334, + "step": 11826 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023423449248915603, + "loss": 1.5946, + "step": 11827 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023422426535641365, + "loss": 1.5889, + "step": 11828 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023421403765183497, + "loss": 1.628, + "step": 11829 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023420380937548948, + "loss": 1.5813, + "step": 11830 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023419358052744653, + "loss": 1.5912, + "step": 11831 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023418335110777567, + "loss": 1.5792, + "step": 11832 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023417312111654633, + "loss": 1.6303, + "step": 11833 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023416289055382792, + "loss": 1.6035, + "step": 11834 + }, + { + "epoch": 0.93, + "learning_rate": 0.0002341526594196899, + "loss": 1.5835, + "step": 11835 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023414242771420182, + "loss": 1.6372, + "step": 11836 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023413219543743307, + "loss": 1.6387, + "step": 11837 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023412196258945314, + "loss": 1.5888, + "step": 11838 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023411172917033146, + "loss": 1.6075, + "step": 11839 + }, + { + "epoch": 0.93, + "learning_rate": 0.0002341014951801376, + "loss": 1.6289, + "step": 11840 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023409126061894103, + "loss": 1.5279, + "step": 11841 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023408102548681112, + "loss": 1.6228, + "step": 11842 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023407078978381751, + "loss": 1.5872, + "step": 11843 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023406055351002963, + "loss": 1.5919, + "step": 11844 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023405031666551697, + "loss": 1.6256, + "step": 11845 + }, + { + "epoch": 0.93, + "learning_rate": 0.000234040079250349, + "loss": 1.5778, + "step": 11846 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023402984126459533, + "loss": 1.6115, + "step": 11847 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023401960270832538, + "loss": 1.5896, + "step": 11848 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023400936358160872, + "loss": 1.5463, + "step": 11849 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023399912388451482, + "loss": 1.644, + "step": 11850 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023398888361711323, + "loss": 1.6021, + "step": 11851 + }, + { + "epoch": 0.93, + "learning_rate": 0.0002339786427794735, + "loss": 1.6217, + "step": 11852 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023396840137166508, + "loss": 1.6156, + "step": 11853 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023395815939375754, + "loss": 1.6228, + "step": 11854 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023394791684582043, + "loss": 1.5812, + "step": 11855 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023393767372792336, + "loss": 1.681, + "step": 11856 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023392743004013576, + "loss": 1.5439, + "step": 11857 + }, + { + "epoch": 0.93, + "learning_rate": 0.0002339171857825272, + "loss": 1.6097, + "step": 11858 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023390694095516733, + "loss": 1.5747, + "step": 11859 + }, + { + "epoch": 0.93, + "learning_rate": 0.0002338966955581256, + "loss": 1.6451, + "step": 11860 + }, + { + "epoch": 0.93, + "learning_rate": 0.0002338864495914716, + "loss": 1.646, + "step": 11861 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023387620305527485, + "loss": 1.5969, + "step": 11862 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023386595594960505, + "loss": 1.5837, + "step": 11863 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023385570827453162, + "loss": 1.5959, + "step": 11864 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023384546003012423, + "loss": 1.5389, + "step": 11865 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023383521121645248, + "loss": 1.5974, + "step": 11866 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023382496183358588, + "loss": 1.5836, + "step": 11867 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023381471188159403, + "loss": 1.5477, + "step": 11868 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023380446136054658, + "loss": 1.5741, + "step": 11869 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023379421027051303, + "loss": 1.6234, + "step": 11870 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023378395861156306, + "loss": 1.605, + "step": 11871 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023377370638376626, + "loss": 1.5719, + "step": 11872 + }, + { + "epoch": 0.93, + "learning_rate": 0.0002337634535871922, + "loss": 1.5769, + "step": 11873 + }, + { + "epoch": 0.93, + "learning_rate": 0.0002337532002219105, + "loss": 1.5633, + "step": 11874 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023374294628799086, + "loss": 1.5658, + "step": 11875 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023373269178550277, + "loss": 1.5937, + "step": 11876 + }, + { + "epoch": 0.93, + "learning_rate": 0.0002337224367145159, + "loss": 1.5378, + "step": 11877 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023371218107509994, + "loss": 1.6127, + "step": 11878 + }, + { + "epoch": 0.93, + "learning_rate": 0.0002337019248673244, + "loss": 1.5804, + "step": 11879 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023369166809125906, + "loss": 1.5737, + "step": 11880 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023368141074697342, + "loss": 1.5825, + "step": 11881 + }, + { + "epoch": 0.93, + "learning_rate": 0.0002336711528345372, + "loss": 1.5394, + "step": 11882 + }, + { + "epoch": 0.93, + "learning_rate": 0.00023366089435402002, + "loss": 1.6509, + "step": 11883 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023365063530549155, + "loss": 1.6047, + "step": 11884 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023364037568902142, + "loss": 1.536, + "step": 11885 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023363011550467925, + "loss": 1.5978, + "step": 11886 + }, + { + "epoch": 0.94, + "learning_rate": 0.0002336198547525348, + "loss": 1.6574, + "step": 11887 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023360959343265772, + "loss": 1.621, + "step": 11888 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023359933154511758, + "loss": 1.5853, + "step": 11889 + }, + { + "epoch": 0.94, + "learning_rate": 0.0002335890690899841, + "loss": 1.6128, + "step": 11890 + }, + { + "epoch": 0.94, + "learning_rate": 0.000233578806067327, + "loss": 1.609, + "step": 11891 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023356854247721592, + "loss": 1.569, + "step": 11892 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023355827831972057, + "loss": 1.6178, + "step": 11893 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023354801359491058, + "loss": 1.6383, + "step": 11894 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023353774830285568, + "loss": 1.5824, + "step": 11895 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023352748244362566, + "loss": 1.6016, + "step": 11896 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023351721601729005, + "loss": 1.6047, + "step": 11897 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023350694902391866, + "loss": 1.5829, + "step": 11898 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023349668146358115, + "loss": 1.6077, + "step": 11899 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023348641333634728, + "loss": 1.5625, + "step": 11900 + }, + { + "epoch": 0.94, + "learning_rate": 0.0002334761446422867, + "loss": 1.5767, + "step": 11901 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023346587538146916, + "loss": 1.6118, + "step": 11902 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023345560555396437, + "loss": 1.5809, + "step": 11903 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023344533515984217, + "loss": 1.5834, + "step": 11904 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023343506419917212, + "loss": 1.656, + "step": 11905 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023342479267202403, + "loss": 1.6175, + "step": 11906 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023341452057846763, + "loss": 1.5987, + "step": 11907 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023340424791857268, + "loss": 1.5948, + "step": 11908 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023339397469240893, + "loss": 1.596, + "step": 11909 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023338370090004608, + "loss": 1.5781, + "step": 11910 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023337342654155397, + "loss": 1.6096, + "step": 11911 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023336315161700223, + "loss": 1.5663, + "step": 11912 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023335287612646073, + "loss": 1.6633, + "step": 11913 + }, + { + "epoch": 0.94, + "learning_rate": 0.0002333426000699992, + "loss": 1.6674, + "step": 11914 + }, + { + "epoch": 0.94, + "learning_rate": 0.0002333323234476874, + "loss": 1.5718, + "step": 11915 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023332204625959514, + "loss": 1.5708, + "step": 11916 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023331176850579211, + "loss": 1.5891, + "step": 11917 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023330149018634819, + "loss": 1.569, + "step": 11918 + }, + { + "epoch": 0.94, + "learning_rate": 0.0002332912113013331, + "loss": 1.5957, + "step": 11919 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023328093185081663, + "loss": 1.6236, + "step": 11920 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023327065183486868, + "loss": 1.5761, + "step": 11921 + }, + { + "epoch": 0.94, + "learning_rate": 0.0002332603712535589, + "loss": 1.607, + "step": 11922 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023325009010695714, + "loss": 1.5809, + "step": 11923 + }, + { + "epoch": 0.94, + "learning_rate": 0.0002332398083951332, + "loss": 1.5768, + "step": 11924 + }, + { + "epoch": 0.94, + "learning_rate": 0.0002332295261181569, + "loss": 1.6197, + "step": 11925 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023321924327609806, + "loss": 1.6097, + "step": 11926 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023320895986902646, + "loss": 1.5361, + "step": 11927 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023319867589701194, + "loss": 1.5523, + "step": 11928 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023318839136012438, + "loss": 1.574, + "step": 11929 + }, + { + "epoch": 0.94, + "learning_rate": 0.0002331781062584335, + "loss": 1.5838, + "step": 11930 + }, + { + "epoch": 0.94, + "learning_rate": 0.0002331678205920092, + "loss": 1.5897, + "step": 11931 + }, + { + "epoch": 0.94, + "learning_rate": 0.0002331575343609213, + "loss": 1.5942, + "step": 11932 + }, + { + "epoch": 0.94, + "learning_rate": 0.0002331472475652396, + "loss": 1.6013, + "step": 11933 + }, + { + "epoch": 0.94, + "learning_rate": 0.000233136960205034, + "loss": 1.6216, + "step": 11934 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023312667228037433, + "loss": 1.5956, + "step": 11935 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023311638379133038, + "loss": 1.6379, + "step": 11936 + }, + { + "epoch": 0.94, + "learning_rate": 0.0002331060947379721, + "loss": 1.6597, + "step": 11937 + }, + { + "epoch": 0.94, + "learning_rate": 0.0002330958051203693, + "loss": 1.5619, + "step": 11938 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023308551493859183, + "loss": 1.5832, + "step": 11939 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023307522419270952, + "loss": 1.6468, + "step": 11940 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023306493288279234, + "loss": 1.5585, + "step": 11941 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023305464100891005, + "loss": 1.5834, + "step": 11942 + }, + { + "epoch": 0.94, + "learning_rate": 0.0002330443485711326, + "loss": 1.5315, + "step": 11943 + }, + { + "epoch": 0.94, + "learning_rate": 0.0002330340555695299, + "loss": 1.552, + "step": 11944 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023302376200417174, + "loss": 1.6029, + "step": 11945 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023301346787512806, + "loss": 1.5584, + "step": 11946 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023300317318246874, + "loss": 1.5691, + "step": 11947 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023299287792626368, + "loss": 1.6016, + "step": 11948 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023298258210658276, + "loss": 1.596, + "step": 11949 + }, + { + "epoch": 0.94, + "learning_rate": 0.0002329722857234959, + "loss": 1.5492, + "step": 11950 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023296198877707306, + "loss": 1.5938, + "step": 11951 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023295169126738409, + "loss": 1.6049, + "step": 11952 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023294139319449887, + "loss": 1.6011, + "step": 11953 + }, + { + "epoch": 0.94, + "learning_rate": 0.0002329310945584874, + "loss": 1.6509, + "step": 11954 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023292079535941953, + "loss": 1.6095, + "step": 11955 + }, + { + "epoch": 0.94, + "learning_rate": 0.0002329104955973652, + "loss": 1.6162, + "step": 11956 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023290019527239444, + "loss": 1.6465, + "step": 11957 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023288989438457705, + "loss": 1.5498, + "step": 11958 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023287959293398302, + "loss": 1.5884, + "step": 11959 + }, + { + "epoch": 0.94, + "learning_rate": 0.0002328692909206823, + "loss": 1.5542, + "step": 11960 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023285898834474482, + "loss": 1.6394, + "step": 11961 + }, + { + "epoch": 0.94, + "learning_rate": 0.0002328486852062405, + "loss": 1.6069, + "step": 11962 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023283838150523937, + "loss": 1.5836, + "step": 11963 + }, + { + "epoch": 0.94, + "learning_rate": 0.0002328280772418113, + "loss": 1.6012, + "step": 11964 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023281777241602637, + "loss": 1.6207, + "step": 11965 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023280746702795442, + "loss": 1.5681, + "step": 11966 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023279716107766548, + "loss": 1.5826, + "step": 11967 + }, + { + "epoch": 0.94, + "learning_rate": 0.0002327868545652295, + "loss": 1.5936, + "step": 11968 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023277654749071647, + "loss": 1.5819, + "step": 11969 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023276623985419635, + "loss": 1.5534, + "step": 11970 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023275593165573915, + "loss": 1.5524, + "step": 11971 + }, + { + "epoch": 0.94, + "learning_rate": 0.0002327456228954148, + "loss": 1.6547, + "step": 11972 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023273531357329336, + "loss": 1.6, + "step": 11973 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023272500368944483, + "loss": 1.582, + "step": 11974 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023271469324393914, + "loss": 1.5801, + "step": 11975 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023270438223684634, + "loss": 1.624, + "step": 11976 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023269407066823643, + "loss": 1.5835, + "step": 11977 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023268375853817942, + "loss": 1.5658, + "step": 11978 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023267344584674535, + "loss": 1.5644, + "step": 11979 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023266313259400414, + "loss": 1.5869, + "step": 11980 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023265281878002587, + "loss": 1.5442, + "step": 11981 + }, + { + "epoch": 0.94, + "learning_rate": 0.0002326425044048806, + "loss": 1.5913, + "step": 11982 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023263218946863832, + "loss": 1.6146, + "step": 11983 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023262187397136912, + "loss": 1.5938, + "step": 11984 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023261155791314296, + "loss": 1.6108, + "step": 11985 + }, + { + "epoch": 0.94, + "learning_rate": 0.0002326012412940299, + "loss": 1.6597, + "step": 11986 + }, + { + "epoch": 0.94, + "learning_rate": 0.0002325909241141, + "loss": 1.667, + "step": 11987 + }, + { + "epoch": 0.94, + "learning_rate": 0.0002325806063734233, + "loss": 1.5553, + "step": 11988 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023257028807206986, + "loss": 1.5634, + "step": 11989 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023255996921010973, + "loss": 1.6145, + "step": 11990 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023254964978761298, + "loss": 1.5876, + "step": 11991 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023253932980464966, + "loss": 1.583, + "step": 11992 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023252900926128982, + "loss": 1.5935, + "step": 11993 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023251868815760357, + "loss": 1.6404, + "step": 11994 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023250836649366097, + "loss": 1.5727, + "step": 11995 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023249804426953206, + "loss": 1.6222, + "step": 11996 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023248772148528699, + "loss": 1.6212, + "step": 11997 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023247739814099576, + "loss": 1.5705, + "step": 11998 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023246707423672856, + "loss": 1.5762, + "step": 11999 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023245674977255543, + "loss": 1.6297, + "step": 12000 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023244642474854648, + "loss": 1.5446, + "step": 12001 + }, + { + "epoch": 0.94, + "learning_rate": 0.0002324360991647718, + "loss": 1.6001, + "step": 12002 + }, + { + "epoch": 0.94, + "learning_rate": 0.0002324257730213015, + "loss": 1.597, + "step": 12003 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023241544631820562, + "loss": 1.6072, + "step": 12004 + }, + { + "epoch": 0.94, + "learning_rate": 0.0002324051190555544, + "loss": 1.5339, + "step": 12005 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023239479123341792, + "loss": 1.634, + "step": 12006 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023238446285186624, + "loss": 1.6459, + "step": 12007 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023237413391096953, + "loss": 1.5499, + "step": 12008 + }, + { + "epoch": 0.94, + "learning_rate": 0.0002323638044107979, + "loss": 1.5893, + "step": 12009 + }, + { + "epoch": 0.94, + "learning_rate": 0.00023235347435142153, + "loss": 1.6417, + "step": 12010 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023234314373291043, + "loss": 1.6003, + "step": 12011 + }, + { + "epoch": 0.95, + "learning_rate": 0.0002323328125553349, + "loss": 1.5961, + "step": 12012 + }, + { + "epoch": 0.95, + "learning_rate": 0.000232322480818765, + "loss": 1.5622, + "step": 12013 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023231214852327087, + "loss": 1.5473, + "step": 12014 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023230181566892265, + "loss": 1.6196, + "step": 12015 + }, + { + "epoch": 0.95, + "learning_rate": 0.0002322914822557906, + "loss": 1.59, + "step": 12016 + }, + { + "epoch": 0.95, + "learning_rate": 0.0002322811482839447, + "loss": 1.5966, + "step": 12017 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023227081375345527, + "loss": 1.5676, + "step": 12018 + }, + { + "epoch": 0.95, + "learning_rate": 0.0002322604786643924, + "loss": 1.5831, + "step": 12019 + }, + { + "epoch": 0.95, + "learning_rate": 0.0002322501430168263, + "loss": 1.5835, + "step": 12020 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023223980681082705, + "loss": 1.5548, + "step": 12021 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023222947004646497, + "loss": 1.6072, + "step": 12022 + }, + { + "epoch": 0.95, + "learning_rate": 0.0002322191327238101, + "loss": 1.6321, + "step": 12023 + }, + { + "epoch": 0.95, + "learning_rate": 0.0002322087948429328, + "loss": 1.6059, + "step": 12024 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023219845640390304, + "loss": 1.6409, + "step": 12025 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023218811740679114, + "loss": 1.6039, + "step": 12026 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023217777785166727, + "loss": 1.5901, + "step": 12027 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023216743773860166, + "loss": 1.6537, + "step": 12028 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023215709706766451, + "loss": 1.5828, + "step": 12029 + }, + { + "epoch": 0.95, + "learning_rate": 0.000232146755838926, + "loss": 1.5581, + "step": 12030 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023213641405245636, + "loss": 1.6129, + "step": 12031 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023212607170832578, + "loss": 1.6401, + "step": 12032 + }, + { + "epoch": 0.95, + "learning_rate": 0.0002321157288066045, + "loss": 1.5846, + "step": 12033 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023210538534736272, + "loss": 1.6186, + "step": 12034 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023209504133067066, + "loss": 1.6279, + "step": 12035 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023208469675659862, + "loss": 1.6113, + "step": 12036 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023207435162521676, + "loss": 1.6306, + "step": 12037 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023206400593659538, + "loss": 1.6242, + "step": 12038 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023205365969080466, + "loss": 1.6149, + "step": 12039 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023204331288791488, + "loss": 1.6101, + "step": 12040 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023203296552799628, + "loss": 1.5289, + "step": 12041 + }, + { + "epoch": 0.95, + "learning_rate": 0.0002320226176111191, + "loss": 1.5669, + "step": 12042 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023201226913735363, + "loss": 1.5557, + "step": 12043 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023200192010677006, + "loss": 1.5804, + "step": 12044 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023199157051943876, + "loss": 1.5223, + "step": 12045 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023198122037542993, + "loss": 1.613, + "step": 12046 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023197086967481384, + "loss": 1.639, + "step": 12047 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023196051841766082, + "loss": 1.5396, + "step": 12048 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023195016660404108, + "loss": 1.5394, + "step": 12049 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023193981423402495, + "loss": 1.656, + "step": 12050 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023192946130768267, + "loss": 1.6499, + "step": 12051 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023191910782508453, + "loss": 1.5852, + "step": 12052 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023190875378630092, + "loss": 1.6913, + "step": 12053 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023189839919140207, + "loss": 1.5358, + "step": 12054 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023188804404045826, + "loss": 1.5415, + "step": 12055 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023187768833353984, + "loss": 1.6041, + "step": 12056 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023186733207071708, + "loss": 1.6272, + "step": 12057 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023185697525206033, + "loss": 1.646, + "step": 12058 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023184661787763986, + "loss": 1.5499, + "step": 12059 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023183625994752604, + "loss": 1.5582, + "step": 12060 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023182590146178918, + "loss": 1.6022, + "step": 12061 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023181554242049962, + "loss": 1.5718, + "step": 12062 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023180518282372764, + "loss": 1.5859, + "step": 12063 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023179482267154364, + "loss": 1.5955, + "step": 12064 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023178446196401794, + "loss": 1.6684, + "step": 12065 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023177410070122082, + "loss": 1.6504, + "step": 12066 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023176373888322274, + "loss": 1.5966, + "step": 12067 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023175337651009395, + "loss": 1.6034, + "step": 12068 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023174301358190494, + "loss": 1.5718, + "step": 12069 + }, + { + "epoch": 0.95, + "learning_rate": 0.0002317326500987259, + "loss": 1.5695, + "step": 12070 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023172228606062724, + "loss": 1.579, + "step": 12071 + }, + { + "epoch": 0.95, + "learning_rate": 0.0002317119214676794, + "loss": 1.6085, + "step": 12072 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023170155631995276, + "loss": 1.6487, + "step": 12073 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023169119061751755, + "loss": 1.6387, + "step": 12074 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023168082436044425, + "loss": 1.6107, + "step": 12075 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023167045754880324, + "loss": 1.5734, + "step": 12076 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023166009018266493, + "loss": 1.6318, + "step": 12077 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023164972226209963, + "loss": 1.5961, + "step": 12078 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023163935378717779, + "loss": 1.546, + "step": 12079 + }, + { + "epoch": 0.95, + "learning_rate": 0.0002316289847579698, + "loss": 1.5752, + "step": 12080 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023161861517454602, + "loss": 1.5578, + "step": 12081 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023160824503697688, + "loss": 1.6314, + "step": 12082 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023159787434533281, + "loss": 1.6238, + "step": 12083 + }, + { + "epoch": 0.95, + "learning_rate": 0.0002315875030996842, + "loss": 1.6207, + "step": 12084 + }, + { + "epoch": 0.95, + "learning_rate": 0.0002315771313001015, + "loss": 1.5959, + "step": 12085 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023156675894665506, + "loss": 1.6171, + "step": 12086 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023155638603941534, + "loss": 1.58, + "step": 12087 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023154601257845277, + "loss": 1.5805, + "step": 12088 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023153563856383776, + "loss": 1.6134, + "step": 12089 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023152526399564078, + "loss": 1.5749, + "step": 12090 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023151488887393224, + "loss": 1.5557, + "step": 12091 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023150451319878262, + "loss": 1.6285, + "step": 12092 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023149413697026228, + "loss": 1.4656, + "step": 12093 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023148376018844176, + "loss": 1.5341, + "step": 12094 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023147338285339148, + "loss": 1.6022, + "step": 12095 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023146300496518186, + "loss": 1.5813, + "step": 12096 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023145262652388338, + "loss": 1.6149, + "step": 12097 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023144224752956653, + "loss": 1.6205, + "step": 12098 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023143186798230177, + "loss": 1.6214, + "step": 12099 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023142148788215958, + "loss": 1.6025, + "step": 12100 + }, + { + "epoch": 0.95, + "learning_rate": 0.0002314111072292104, + "loss": 1.5774, + "step": 12101 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023140072602352476, + "loss": 1.5734, + "step": 12102 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023139034426517308, + "loss": 1.6139, + "step": 12103 + }, + { + "epoch": 0.95, + "learning_rate": 0.0002313799619542259, + "loss": 1.5944, + "step": 12104 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023136957909075366, + "loss": 1.5838, + "step": 12105 + }, + { + "epoch": 0.95, + "learning_rate": 0.0002313591956748269, + "loss": 1.5964, + "step": 12106 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023134881170651606, + "loss": 1.5841, + "step": 12107 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023133842718589174, + "loss": 1.6049, + "step": 12108 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023132804211302435, + "loss": 1.5895, + "step": 12109 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023131765648798442, + "loss": 1.6146, + "step": 12110 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023130727031084252, + "loss": 1.5607, + "step": 12111 + }, + { + "epoch": 0.95, + "learning_rate": 0.0002312968835816691, + "loss": 1.6033, + "step": 12112 + }, + { + "epoch": 0.95, + "learning_rate": 0.0002312864963005347, + "loss": 1.6044, + "step": 12113 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023127610846750984, + "loss": 1.5643, + "step": 12114 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023126572008266507, + "loss": 1.5714, + "step": 12115 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023125533114607089, + "loss": 1.5884, + "step": 12116 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023124494165779785, + "loss": 1.5174, + "step": 12117 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023123455161791652, + "loss": 1.6119, + "step": 12118 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023122416102649743, + "loss": 1.6462, + "step": 12119 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023121376988361107, + "loss": 1.5557, + "step": 12120 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023120337818932803, + "loss": 1.5445, + "step": 12121 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023119298594371888, + "loss": 1.5355, + "step": 12122 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023118259314685414, + "loss": 1.6143, + "step": 12123 + }, + { + "epoch": 0.95, + "learning_rate": 0.0002311721997988044, + "loss": 1.6105, + "step": 12124 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023116180589964025, + "loss": 1.5687, + "step": 12125 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023115141144943222, + "loss": 1.5966, + "step": 12126 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023114101644825086, + "loss": 1.5868, + "step": 12127 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023113062089616677, + "loss": 1.614, + "step": 12128 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023112022479325058, + "loss": 1.6039, + "step": 12129 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023110982813957283, + "loss": 1.6429, + "step": 12130 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023109943093520404, + "loss": 1.5768, + "step": 12131 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023108903318021495, + "loss": 1.6336, + "step": 12132 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023107863487467598, + "loss": 1.6002, + "step": 12133 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023106823601865792, + "loss": 1.5778, + "step": 12134 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023105783661223121, + "loss": 1.5862, + "step": 12135 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023104743665546654, + "loss": 1.648, + "step": 12136 + }, + { + "epoch": 0.95, + "learning_rate": 0.00023103703614843447, + "loss": 1.628, + "step": 12137 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023102663509120568, + "loss": 1.6201, + "step": 12138 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023101623348385078, + "loss": 1.6382, + "step": 12139 + }, + { + "epoch": 0.96, + "learning_rate": 0.0002310058313264403, + "loss": 1.5956, + "step": 12140 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023099542861904497, + "loss": 1.5882, + "step": 12141 + }, + { + "epoch": 0.96, + "learning_rate": 0.0002309850253617354, + "loss": 1.5881, + "step": 12142 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023097462155458216, + "loss": 1.6091, + "step": 12143 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023096421719765594, + "loss": 1.6096, + "step": 12144 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023095381229102732, + "loss": 1.5869, + "step": 12145 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023094340683476702, + "loss": 1.5454, + "step": 12146 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023093300082894567, + "loss": 1.6077, + "step": 12147 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023092259427363388, + "loss": 1.6052, + "step": 12148 + }, + { + "epoch": 0.96, + "learning_rate": 0.0002309121871689024, + "loss": 1.5389, + "step": 12149 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023090177951482171, + "loss": 1.5861, + "step": 12150 + }, + { + "epoch": 0.96, + "learning_rate": 0.0002308913713114627, + "loss": 1.5633, + "step": 12151 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023088096255889583, + "loss": 1.5407, + "step": 12152 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023087055325719187, + "loss": 1.5893, + "step": 12153 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023086014340642147, + "loss": 1.5975, + "step": 12154 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023084973300665536, + "loss": 1.6251, + "step": 12155 + }, + { + "epoch": 0.96, + "learning_rate": 0.0002308393220579642, + "loss": 1.6288, + "step": 12156 + }, + { + "epoch": 0.96, + "learning_rate": 0.0002308289105604186, + "loss": 1.5156, + "step": 12157 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023081849851408934, + "loss": 1.5859, + "step": 12158 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023080808591904707, + "loss": 1.5252, + "step": 12159 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023079767277536244, + "loss": 1.5974, + "step": 12160 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023078725908310622, + "loss": 1.5866, + "step": 12161 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023077684484234913, + "loss": 1.6197, + "step": 12162 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023076643005316184, + "loss": 1.6371, + "step": 12163 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023075601471561502, + "loss": 1.6013, + "step": 12164 + }, + { + "epoch": 0.96, + "learning_rate": 0.0002307455988297794, + "loss": 1.5409, + "step": 12165 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023073518239572583, + "loss": 1.5646, + "step": 12166 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023072476541352485, + "loss": 1.6417, + "step": 12167 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023071434788324725, + "loss": 1.5874, + "step": 12168 + }, + { + "epoch": 0.96, + "learning_rate": 0.0002307039298049638, + "loss": 1.5952, + "step": 12169 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023069351117874516, + "loss": 1.6136, + "step": 12170 + }, + { + "epoch": 0.96, + "learning_rate": 0.0002306830920046622, + "loss": 1.6201, + "step": 12171 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023067267228278547, + "loss": 1.5919, + "step": 12172 + }, + { + "epoch": 0.96, + "learning_rate": 0.0002306622520131859, + "loss": 1.652, + "step": 12173 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023065183119593411, + "loss": 1.584, + "step": 12174 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023064140983110088, + "loss": 1.5859, + "step": 12175 + }, + { + "epoch": 0.96, + "learning_rate": 0.000230630987918757, + "loss": 1.5582, + "step": 12176 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023062056545897317, + "loss": 1.5923, + "step": 12177 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023061014245182024, + "loss": 1.5859, + "step": 12178 + }, + { + "epoch": 0.96, + "learning_rate": 0.0002305997188973689, + "loss": 1.6573, + "step": 12179 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023058929479568999, + "loss": 1.6167, + "step": 12180 + }, + { + "epoch": 0.96, + "learning_rate": 0.0002305788701468542, + "loss": 1.5987, + "step": 12181 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023056844495093236, + "loss": 1.5961, + "step": 12182 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023055801920799526, + "loss": 1.6451, + "step": 12183 + }, + { + "epoch": 0.96, + "learning_rate": 0.0002305475929181136, + "loss": 1.6015, + "step": 12184 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023053716608135828, + "loss": 1.5855, + "step": 12185 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023052673869780003, + "loss": 1.5673, + "step": 12186 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023051631076750968, + "loss": 1.5618, + "step": 12187 + }, + { + "epoch": 0.96, + "learning_rate": 0.000230505882290558, + "loss": 1.522, + "step": 12188 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023049545326701582, + "loss": 1.5648, + "step": 12189 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023048502369695393, + "loss": 1.6331, + "step": 12190 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023047459358044314, + "loss": 1.5742, + "step": 12191 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023046416291755425, + "loss": 1.6055, + "step": 12192 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023045373170835814, + "loss": 1.6248, + "step": 12193 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023044329995292555, + "loss": 1.5577, + "step": 12194 + }, + { + "epoch": 0.96, + "learning_rate": 0.0002304328676513274, + "loss": 1.6179, + "step": 12195 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023042243480363443, + "loss": 1.628, + "step": 12196 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023041200140991747, + "loss": 1.6048, + "step": 12197 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023040156747024745, + "loss": 1.5902, + "step": 12198 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023039113298469513, + "loss": 1.5838, + "step": 12199 + }, + { + "epoch": 0.96, + "learning_rate": 0.0002303806979533314, + "loss": 1.6123, + "step": 12200 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023037026237622706, + "loss": 1.5689, + "step": 12201 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023035982625345305, + "loss": 1.6482, + "step": 12202 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023034938958508012, + "loss": 1.6459, + "step": 12203 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023033895237117914, + "loss": 1.6465, + "step": 12204 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023032851461182106, + "loss": 1.5552, + "step": 12205 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023031807630707668, + "loss": 1.6254, + "step": 12206 + }, + { + "epoch": 0.96, + "learning_rate": 0.0002303076374570169, + "loss": 1.5904, + "step": 12207 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023029719806171253, + "loss": 1.6086, + "step": 12208 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023028675812123456, + "loss": 1.5872, + "step": 12209 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023027631763565374, + "loss": 1.6249, + "step": 12210 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023026587660504108, + "loss": 1.5873, + "step": 12211 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023025543502946743, + "loss": 1.5635, + "step": 12212 + }, + { + "epoch": 0.96, + "learning_rate": 0.0002302449929090036, + "loss": 1.5799, + "step": 12213 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023023455024372057, + "loss": 1.5841, + "step": 12214 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023022410703368927, + "loss": 1.5993, + "step": 12215 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023021366327898049, + "loss": 1.5913, + "step": 12216 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023020321897966522, + "loss": 1.5697, + "step": 12217 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023019277413581437, + "loss": 1.5986, + "step": 12218 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023018232874749884, + "loss": 1.6199, + "step": 12219 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023017188281478955, + "loss": 1.6052, + "step": 12220 + }, + { + "epoch": 0.96, + "learning_rate": 0.0002301614363377574, + "loss": 1.5676, + "step": 12221 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023015098931647334, + "loss": 1.5651, + "step": 12222 + }, + { + "epoch": 0.96, + "learning_rate": 0.0002301405417510083, + "loss": 1.5805, + "step": 12223 + }, + { + "epoch": 0.96, + "learning_rate": 0.0002301300936414332, + "loss": 1.6393, + "step": 12224 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023011964498781897, + "loss": 1.6018, + "step": 12225 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023010919579023658, + "loss": 1.6329, + "step": 12226 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023009874604875696, + "loss": 1.5669, + "step": 12227 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023008829576345104, + "loss": 1.5599, + "step": 12228 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023007784493438981, + "loss": 1.641, + "step": 12229 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023006739356164422, + "loss": 1.5706, + "step": 12230 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023005694164528515, + "loss": 1.5978, + "step": 12231 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023004648918538366, + "loss": 1.5916, + "step": 12232 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023003603618201065, + "loss": 1.6839, + "step": 12233 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023002558263523717, + "loss": 1.5917, + "step": 12234 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023001512854513412, + "loss": 1.6006, + "step": 12235 + }, + { + "epoch": 0.96, + "learning_rate": 0.00023000467391177257, + "loss": 1.5934, + "step": 12236 + }, + { + "epoch": 0.96, + "learning_rate": 0.00022999421873522337, + "loss": 1.6619, + "step": 12237 + }, + { + "epoch": 0.96, + "learning_rate": 0.00022998376301555757, + "loss": 1.6727, + "step": 12238 + }, + { + "epoch": 0.96, + "learning_rate": 0.00022997330675284615, + "loss": 1.5839, + "step": 12239 + }, + { + "epoch": 0.96, + "learning_rate": 0.0002299628499471601, + "loss": 1.5293, + "step": 12240 + }, + { + "epoch": 0.96, + "learning_rate": 0.0002299523925985705, + "loss": 1.627, + "step": 12241 + }, + { + "epoch": 0.96, + "learning_rate": 0.0002299419347071482, + "loss": 1.664, + "step": 12242 + }, + { + "epoch": 0.96, + "learning_rate": 0.00022993147627296432, + "loss": 1.5309, + "step": 12243 + }, + { + "epoch": 0.96, + "learning_rate": 0.0002299210172960898, + "loss": 1.6219, + "step": 12244 + }, + { + "epoch": 0.96, + "learning_rate": 0.0002299105577765957, + "loss": 1.6225, + "step": 12245 + }, + { + "epoch": 0.96, + "learning_rate": 0.00022990009771455303, + "loss": 1.6082, + "step": 12246 + }, + { + "epoch": 0.96, + "learning_rate": 0.0002298896371100327, + "loss": 1.5736, + "step": 12247 + }, + { + "epoch": 0.96, + "learning_rate": 0.0002298791759631059, + "loss": 1.565, + "step": 12248 + }, + { + "epoch": 0.96, + "learning_rate": 0.00022986871427384354, + "loss": 1.6264, + "step": 12249 + }, + { + "epoch": 0.96, + "learning_rate": 0.00022985825204231673, + "loss": 1.5974, + "step": 12250 + }, + { + "epoch": 0.96, + "learning_rate": 0.0002298477892685964, + "loss": 1.628, + "step": 12251 + }, + { + "epoch": 0.96, + "learning_rate": 0.00022983732595275368, + "loss": 1.6045, + "step": 12252 + }, + { + "epoch": 0.96, + "learning_rate": 0.00022982686209485956, + "loss": 1.6021, + "step": 12253 + }, + { + "epoch": 0.96, + "learning_rate": 0.0002298163976949851, + "loss": 1.6189, + "step": 12254 + }, + { + "epoch": 0.96, + "learning_rate": 0.00022980593275320134, + "loss": 1.6163, + "step": 12255 + }, + { + "epoch": 0.96, + "learning_rate": 0.00022979546726957937, + "loss": 1.5956, + "step": 12256 + }, + { + "epoch": 0.96, + "learning_rate": 0.00022978500124419017, + "loss": 1.6163, + "step": 12257 + }, + { + "epoch": 0.96, + "learning_rate": 0.00022977453467710486, + "loss": 1.5697, + "step": 12258 + }, + { + "epoch": 0.96, + "learning_rate": 0.0002297640675683945, + "loss": 1.5704, + "step": 12259 + }, + { + "epoch": 0.96, + "learning_rate": 0.00022975359991813011, + "loss": 1.574, + "step": 12260 + }, + { + "epoch": 0.96, + "learning_rate": 0.0002297431317263828, + "loss": 1.5508, + "step": 12261 + }, + { + "epoch": 0.96, + "learning_rate": 0.00022973266299322365, + "loss": 1.5525, + "step": 12262 + }, + { + "epoch": 0.96, + "learning_rate": 0.0002297221937187237, + "loss": 1.5637, + "step": 12263 + }, + { + "epoch": 0.96, + "learning_rate": 0.00022971172390295406, + "loss": 1.5917, + "step": 12264 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022970125354598576, + "loss": 1.5813, + "step": 12265 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022969078264789, + "loss": 1.6486, + "step": 12266 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022968031120873775, + "loss": 1.6006, + "step": 12267 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022966983922860021, + "loss": 1.6177, + "step": 12268 + }, + { + "epoch": 0.97, + "learning_rate": 0.0002296593667075484, + "loss": 1.5336, + "step": 12269 + }, + { + "epoch": 0.97, + "learning_rate": 0.0002296488936456534, + "loss": 1.6373, + "step": 12270 + }, + { + "epoch": 0.97, + "learning_rate": 0.0002296384200429864, + "loss": 1.5723, + "step": 12271 + }, + { + "epoch": 0.97, + "learning_rate": 0.0002296279458996185, + "loss": 1.5537, + "step": 12272 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022961747121562077, + "loss": 1.589, + "step": 12273 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022960699599106435, + "loss": 1.6058, + "step": 12274 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022959652022602037, + "loss": 1.5777, + "step": 12275 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022958604392055995, + "loss": 1.57, + "step": 12276 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022957556707475416, + "loss": 1.6111, + "step": 12277 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022956508968867425, + "loss": 1.6056, + "step": 12278 + }, + { + "epoch": 0.97, + "learning_rate": 0.0002295546117623912, + "loss": 1.5518, + "step": 12279 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022954413329597632, + "loss": 1.5646, + "step": 12280 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022953365428950064, + "loss": 1.5744, + "step": 12281 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022952317474303534, + "loss": 1.5838, + "step": 12282 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022951269465665156, + "loss": 1.583, + "step": 12283 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022950221403042047, + "loss": 1.586, + "step": 12284 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022949173286441324, + "loss": 1.6242, + "step": 12285 + }, + { + "epoch": 0.97, + "learning_rate": 0.000229481251158701, + "loss": 1.596, + "step": 12286 + }, + { + "epoch": 0.97, + "learning_rate": 0.0002294707689133549, + "loss": 1.6291, + "step": 12287 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022946028612844615, + "loss": 1.5801, + "step": 12288 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022944980280404593, + "loss": 1.6093, + "step": 12289 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022943931894022537, + "loss": 1.6817, + "step": 12290 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022942883453705567, + "loss": 1.6039, + "step": 12291 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022941834959460804, + "loss": 1.58, + "step": 12292 + }, + { + "epoch": 0.97, + "learning_rate": 0.0002294078641129536, + "loss": 1.5915, + "step": 12293 + }, + { + "epoch": 0.97, + "learning_rate": 0.0002293973780921636, + "loss": 1.5297, + "step": 12294 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022938689153230926, + "loss": 1.5302, + "step": 12295 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022937640443346165, + "loss": 1.6028, + "step": 12296 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022936591679569216, + "loss": 1.5989, + "step": 12297 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022935542861907184, + "loss": 1.637, + "step": 12298 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022934493990367193, + "loss": 1.5556, + "step": 12299 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022933445064956368, + "loss": 1.5738, + "step": 12300 + }, + { + "epoch": 0.97, + "learning_rate": 0.0002293239608568183, + "loss": 1.6255, + "step": 12301 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022931347052550702, + "loss": 1.5935, + "step": 12302 + }, + { + "epoch": 0.97, + "learning_rate": 0.000229302979655701, + "loss": 1.6499, + "step": 12303 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022929248824747153, + "loss": 1.604, + "step": 12304 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022928199630088984, + "loss": 1.6174, + "step": 12305 + }, + { + "epoch": 0.97, + "learning_rate": 0.0002292715038160271, + "loss": 1.6406, + "step": 12306 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022926101079295464, + "loss": 1.636, + "step": 12307 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022925051723174364, + "loss": 1.6114, + "step": 12308 + }, + { + "epoch": 0.97, + "learning_rate": 0.0002292400231324654, + "loss": 1.6177, + "step": 12309 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022922952849519106, + "loss": 1.6022, + "step": 12310 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022921903331999196, + "loss": 1.6178, + "step": 12311 + }, + { + "epoch": 0.97, + "learning_rate": 0.0002292085376069394, + "loss": 1.5214, + "step": 12312 + }, + { + "epoch": 0.97, + "learning_rate": 0.0002291980413561045, + "loss": 1.5548, + "step": 12313 + }, + { + "epoch": 0.97, + "learning_rate": 0.0002291875445675587, + "loss": 1.6072, + "step": 12314 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022917704724137312, + "loss": 1.6181, + "step": 12315 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022916654937761905, + "loss": 1.6327, + "step": 12316 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022915605097636785, + "loss": 1.5766, + "step": 12317 + }, + { + "epoch": 0.97, + "learning_rate": 0.0002291455520376907, + "loss": 1.6649, + "step": 12318 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022913505256165896, + "loss": 1.5681, + "step": 12319 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022912455254834387, + "loss": 1.5744, + "step": 12320 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022911405199781674, + "loss": 1.5638, + "step": 12321 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022910355091014886, + "loss": 1.5952, + "step": 12322 + }, + { + "epoch": 0.97, + "learning_rate": 0.0002290930492854115, + "loss": 1.5577, + "step": 12323 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022908254712367604, + "loss": 1.6067, + "step": 12324 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022907204442501367, + "loss": 1.5507, + "step": 12325 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022906154118949575, + "loss": 1.5255, + "step": 12326 + }, + { + "epoch": 0.97, + "learning_rate": 0.0002290510374171936, + "loss": 1.6081, + "step": 12327 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022904053310817855, + "loss": 1.5772, + "step": 12328 + }, + { + "epoch": 0.97, + "learning_rate": 0.0002290300282625219, + "loss": 1.5816, + "step": 12329 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022901952288029493, + "loss": 1.5791, + "step": 12330 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022900901696156907, + "loss": 1.5436, + "step": 12331 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022899851050641552, + "loss": 1.6774, + "step": 12332 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022898800351490572, + "loss": 1.5933, + "step": 12333 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022897749598711097, + "loss": 1.641, + "step": 12334 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022896698792310258, + "loss": 1.6051, + "step": 12335 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022895647932295196, + "loss": 1.6288, + "step": 12336 + }, + { + "epoch": 0.97, + "learning_rate": 0.0002289459701867304, + "loss": 1.5421, + "step": 12337 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022893546051450925, + "loss": 1.564, + "step": 12338 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022892495030635987, + "loss": 1.6064, + "step": 12339 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022891443956235365, + "loss": 1.5668, + "step": 12340 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022890392828256193, + "loss": 1.576, + "step": 12341 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022889341646705608, + "loss": 1.5654, + "step": 12342 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022888290411590752, + "loss": 1.578, + "step": 12343 + }, + { + "epoch": 0.97, + "learning_rate": 0.0002288723912291875, + "loss": 1.5837, + "step": 12344 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022886187780696748, + "loss": 1.5782, + "step": 12345 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022885136384931891, + "loss": 1.553, + "step": 12346 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022884084935631297, + "loss": 1.5655, + "step": 12347 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022883033432802123, + "loss": 1.593, + "step": 12348 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022881981876451501, + "loss": 1.5853, + "step": 12349 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022880930266586572, + "loss": 1.6328, + "step": 12350 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022879878603214478, + "loss": 1.5501, + "step": 12351 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022878826886342358, + "loss": 1.6271, + "step": 12352 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022877775115977348, + "loss": 1.5767, + "step": 12353 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022876723292126596, + "loss": 1.5972, + "step": 12354 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022875671414797233, + "loss": 1.577, + "step": 12355 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022874619483996414, + "loss": 1.5697, + "step": 12356 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022873567499731264, + "loss": 1.5977, + "step": 12357 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022872515462008948, + "loss": 1.5528, + "step": 12358 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022871463370836593, + "loss": 1.5531, + "step": 12359 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022870411226221343, + "loss": 1.5556, + "step": 12360 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022869359028170345, + "loss": 1.5978, + "step": 12361 + }, + { + "epoch": 0.97, + "learning_rate": 0.0002286830677669074, + "loss": 1.6069, + "step": 12362 + }, + { + "epoch": 0.97, + "learning_rate": 0.0002286725447178968, + "loss": 1.5883, + "step": 12363 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022866202113474294, + "loss": 1.5243, + "step": 12364 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022865149701751744, + "loss": 1.5684, + "step": 12365 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022864097236629163, + "loss": 1.6339, + "step": 12366 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022863044718113702, + "loss": 1.614, + "step": 12367 + }, + { + "epoch": 0.97, + "learning_rate": 0.0002286199214621251, + "loss": 1.6113, + "step": 12368 + }, + { + "epoch": 0.97, + "learning_rate": 0.0002286093952093273, + "loss": 1.5998, + "step": 12369 + }, + { + "epoch": 0.97, + "learning_rate": 0.0002285988684228151, + "loss": 1.6124, + "step": 12370 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022858834110265993, + "loss": 1.6505, + "step": 12371 + }, + { + "epoch": 0.97, + "learning_rate": 0.0002285778132489333, + "loss": 1.5944, + "step": 12372 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022856728486170665, + "loss": 1.592, + "step": 12373 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022855675594105152, + "loss": 1.5867, + "step": 12374 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022854622648703935, + "loss": 1.5714, + "step": 12375 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022853569649974168, + "loss": 1.585, + "step": 12376 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022852516597922997, + "loss": 1.5492, + "step": 12377 + }, + { + "epoch": 0.97, + "learning_rate": 0.0002285146349255757, + "loss": 1.5897, + "step": 12378 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022850410333885037, + "loss": 1.648, + "step": 12379 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022849357121912554, + "loss": 1.5934, + "step": 12380 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022848303856647263, + "loss": 1.5661, + "step": 12381 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022847250538096322, + "loss": 1.6381, + "step": 12382 + }, + { + "epoch": 0.97, + "learning_rate": 0.0002284619716626688, + "loss": 1.6273, + "step": 12383 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022845143741166089, + "loss": 1.5604, + "step": 12384 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022844090262801107, + "loss": 1.5559, + "step": 12385 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022843036731179074, + "loss": 1.5588, + "step": 12386 + }, + { + "epoch": 0.97, + "learning_rate": 0.0002284198314630715, + "loss": 1.575, + "step": 12387 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022840929508192496, + "loss": 1.6581, + "step": 12388 + }, + { + "epoch": 0.97, + "learning_rate": 0.0002283987581684225, + "loss": 1.6517, + "step": 12389 + }, + { + "epoch": 0.97, + "learning_rate": 0.00022838822072263572, + "loss": 1.5884, + "step": 12390 + }, + { + "epoch": 0.97, + "learning_rate": 0.0002283776827446362, + "loss": 1.5738, + "step": 12391 + }, + { + "epoch": 0.98, + "learning_rate": 0.0002283671442344955, + "loss": 1.5593, + "step": 12392 + }, + { + "epoch": 0.98, + "learning_rate": 0.0002283566051922851, + "loss": 1.6052, + "step": 12393 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022834606561807663, + "loss": 1.5977, + "step": 12394 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022833552551194158, + "loss": 1.5864, + "step": 12395 + }, + { + "epoch": 0.98, + "learning_rate": 0.0002283249848739515, + "loss": 1.5958, + "step": 12396 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022831444370417808, + "loss": 1.5817, + "step": 12397 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022830390200269277, + "loss": 1.5966, + "step": 12398 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022829335976956718, + "loss": 1.597, + "step": 12399 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022828281700487286, + "loss": 1.6187, + "step": 12400 + }, + { + "epoch": 0.98, + "learning_rate": 0.0002282722737086814, + "loss": 1.573, + "step": 12401 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022826172988106447, + "loss": 1.5948, + "step": 12402 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022825118552209352, + "loss": 1.6082, + "step": 12403 + }, + { + "epoch": 0.98, + "learning_rate": 0.0002282406406318402, + "loss": 1.601, + "step": 12404 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022823009521037615, + "loss": 1.5791, + "step": 12405 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022821954925777288, + "loss": 1.5669, + "step": 12406 + }, + { + "epoch": 0.98, + "learning_rate": 0.0002282090027741021, + "loss": 1.5354, + "step": 12407 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022819845575943528, + "loss": 1.6254, + "step": 12408 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022818790821384414, + "loss": 1.6127, + "step": 12409 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022817736013740024, + "loss": 1.5615, + "step": 12410 + }, + { + "epoch": 0.98, + "learning_rate": 0.0002281668115301752, + "loss": 1.5787, + "step": 12411 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022815626239224061, + "loss": 1.5614, + "step": 12412 + }, + { + "epoch": 0.98, + "learning_rate": 0.0002281457127236682, + "loss": 1.5551, + "step": 12413 + }, + { + "epoch": 0.98, + "learning_rate": 0.0002281351625245295, + "loss": 1.5652, + "step": 12414 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022812461179489614, + "loss": 1.5817, + "step": 12415 + }, + { + "epoch": 0.98, + "learning_rate": 0.0002281140605348398, + "loss": 1.5836, + "step": 12416 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022810350874443211, + "loss": 1.6376, + "step": 12417 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022809295642374464, + "loss": 1.6469, + "step": 12418 + }, + { + "epoch": 0.98, + "learning_rate": 0.0002280824035728492, + "loss": 1.6602, + "step": 12419 + }, + { + "epoch": 0.98, + "learning_rate": 0.0002280718501918172, + "loss": 1.6022, + "step": 12420 + }, + { + "epoch": 0.98, + "learning_rate": 0.0002280612962807205, + "loss": 1.5787, + "step": 12421 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022805074183963065, + "loss": 1.6219, + "step": 12422 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022804018686861937, + "loss": 1.5957, + "step": 12423 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022802963136775824, + "loss": 1.5596, + "step": 12424 + }, + { + "epoch": 0.98, + "learning_rate": 0.000228019075337119, + "loss": 1.5419, + "step": 12425 + }, + { + "epoch": 0.98, + "learning_rate": 0.0002280085187767733, + "loss": 1.6158, + "step": 12426 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022799796168679277, + "loss": 1.5837, + "step": 12427 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022798740406724917, + "loss": 1.5915, + "step": 12428 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022797684591821407, + "loss": 1.6172, + "step": 12429 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022796628723975926, + "loss": 1.5887, + "step": 12430 + }, + { + "epoch": 0.98, + "learning_rate": 0.0002279557280319564, + "loss": 1.6068, + "step": 12431 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022794516829487713, + "loss": 1.5897, + "step": 12432 + }, + { + "epoch": 0.98, + "learning_rate": 0.0002279346080285932, + "loss": 1.6628, + "step": 12433 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022792404723317628, + "loss": 1.5889, + "step": 12434 + }, + { + "epoch": 0.98, + "learning_rate": 0.0002279134859086981, + "loss": 1.5493, + "step": 12435 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022790292405523035, + "loss": 1.5733, + "step": 12436 + }, + { + "epoch": 0.98, + "learning_rate": 0.0002278923616728447, + "loss": 1.6007, + "step": 12437 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022788179876161293, + "loss": 1.5947, + "step": 12438 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022787123532160667, + "loss": 1.5944, + "step": 12439 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022786067135289773, + "loss": 1.6136, + "step": 12440 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022785010685555786, + "loss": 1.6007, + "step": 12441 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022783954182965867, + "loss": 1.6805, + "step": 12442 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022782897627527196, + "loss": 1.5473, + "step": 12443 + }, + { + "epoch": 0.98, + "learning_rate": 0.0002278184101924694, + "loss": 1.6305, + "step": 12444 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022780784358132283, + "loss": 1.5752, + "step": 12445 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022779727644190394, + "loss": 1.5621, + "step": 12446 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022778670877428444, + "loss": 1.5999, + "step": 12447 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022777614057853618, + "loss": 1.5815, + "step": 12448 + }, + { + "epoch": 0.98, + "learning_rate": 0.0002277655718547308, + "loss": 1.6327, + "step": 12449 + }, + { + "epoch": 0.98, + "learning_rate": 0.0002277550026029401, + "loss": 1.555, + "step": 12450 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022774443282323582, + "loss": 1.5437, + "step": 12451 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022773386251568977, + "loss": 1.6098, + "step": 12452 + }, + { + "epoch": 0.98, + "learning_rate": 0.0002277232916803737, + "loss": 1.5907, + "step": 12453 + }, + { + "epoch": 0.98, + "learning_rate": 0.0002277127203173594, + "loss": 1.6053, + "step": 12454 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022770214842671854, + "loss": 1.6188, + "step": 12455 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022769157600852302, + "loss": 1.6011, + "step": 12456 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022768100306284452, + "loss": 1.5606, + "step": 12457 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022767042958975498, + "loss": 1.5999, + "step": 12458 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022765985558932601, + "loss": 1.531, + "step": 12459 + }, + { + "epoch": 0.98, + "learning_rate": 0.0002276492810616295, + "loss": 1.602, + "step": 12460 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022763870600673718, + "loss": 1.5669, + "step": 12461 + }, + { + "epoch": 0.98, + "learning_rate": 0.0002276281304247209, + "loss": 1.5491, + "step": 12462 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022761755431565251, + "loss": 1.5682, + "step": 12463 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022760697767960374, + "loss": 1.5657, + "step": 12464 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022759640051664637, + "loss": 1.6032, + "step": 12465 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022758582282685232, + "loss": 1.6213, + "step": 12466 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022757524461029333, + "loss": 1.6192, + "step": 12467 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022756466586704123, + "loss": 1.5315, + "step": 12468 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022755408659716782, + "loss": 1.541, + "step": 12469 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022754350680074503, + "loss": 1.5598, + "step": 12470 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022753292647784455, + "loss": 1.5769, + "step": 12471 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022752234562853837, + "loss": 1.579, + "step": 12472 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022751176425289817, + "loss": 1.6202, + "step": 12473 + }, + { + "epoch": 0.98, + "learning_rate": 0.0002275011823509959, + "loss": 1.5865, + "step": 12474 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022749059992290333, + "loss": 1.5761, + "step": 12475 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022748001696869239, + "loss": 1.5751, + "step": 12476 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022746943348843493, + "loss": 1.5715, + "step": 12477 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022745884948220267, + "loss": 1.5933, + "step": 12478 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022744826495006766, + "loss": 1.5797, + "step": 12479 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022743767989210161, + "loss": 1.6091, + "step": 12480 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022742709430837647, + "loss": 1.5522, + "step": 12481 + }, + { + "epoch": 0.98, + "learning_rate": 0.0002274165081989641, + "loss": 1.5935, + "step": 12482 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022740592156393632, + "loss": 1.5957, + "step": 12483 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022739533440336508, + "loss": 1.579, + "step": 12484 + }, + { + "epoch": 0.98, + "learning_rate": 0.0002273847467173222, + "loss": 1.6389, + "step": 12485 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022737415850587964, + "loss": 1.6025, + "step": 12486 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022736356976910924, + "loss": 1.6102, + "step": 12487 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022735298050708284, + "loss": 1.6008, + "step": 12488 + }, + { + "epoch": 0.98, + "learning_rate": 0.0002273423907198724, + "loss": 1.5583, + "step": 12489 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022733180040754983, + "loss": 1.6031, + "step": 12490 + }, + { + "epoch": 0.98, + "learning_rate": 0.000227321209570187, + "loss": 1.5508, + "step": 12491 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022731061820785586, + "loss": 1.6445, + "step": 12492 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022730002632062826, + "loss": 1.5815, + "step": 12493 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022728943390857616, + "loss": 1.5966, + "step": 12494 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022727884097177142, + "loss": 1.5887, + "step": 12495 + }, + { + "epoch": 0.98, + "learning_rate": 0.000227268247510286, + "loss": 1.5751, + "step": 12496 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022725765352419187, + "loss": 1.6288, + "step": 12497 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022724705901356086, + "loss": 1.5305, + "step": 12498 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022723646397846496, + "loss": 1.6169, + "step": 12499 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022722586841897606, + "loss": 1.5722, + "step": 12500 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022721527233516618, + "loss": 1.5924, + "step": 12501 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022720467572710716, + "loss": 1.5829, + "step": 12502 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022719407859487104, + "loss": 1.5912, + "step": 12503 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022718348093852975, + "loss": 1.5803, + "step": 12504 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022717288275815516, + "loss": 1.6048, + "step": 12505 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022716228405381928, + "loss": 1.5759, + "step": 12506 + }, + { + "epoch": 0.98, + "learning_rate": 0.0002271516848255941, + "loss": 1.5827, + "step": 12507 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022714108507355154, + "loss": 1.6094, + "step": 12508 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022713048479776362, + "loss": 1.6211, + "step": 12509 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022711988399830223, + "loss": 1.5627, + "step": 12510 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022710928267523941, + "loss": 1.6087, + "step": 12511 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022709868082864713, + "loss": 1.5885, + "step": 12512 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022708807845859733, + "loss": 1.5696, + "step": 12513 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022707747556516202, + "loss": 1.5652, + "step": 12514 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022706687214841314, + "loss": 1.6078, + "step": 12515 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022705626820842279, + "loss": 1.5382, + "step": 12516 + }, + { + "epoch": 0.98, + "learning_rate": 0.0002270456637452629, + "loss": 1.6627, + "step": 12517 + }, + { + "epoch": 0.98, + "learning_rate": 0.00022703505875900544, + "loss": 1.6019, + "step": 12518 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022702445324972246, + "loss": 1.614, + "step": 12519 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022701384721748595, + "loss": 1.559, + "step": 12520 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022700324066236795, + "loss": 1.5435, + "step": 12521 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022699263358444036, + "loss": 1.6076, + "step": 12522 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022698202598377533, + "loss": 1.5997, + "step": 12523 + }, + { + "epoch": 0.99, + "learning_rate": 0.0002269714178604448, + "loss": 1.5586, + "step": 12524 + }, + { + "epoch": 0.99, + "learning_rate": 0.0002269608092145208, + "loss": 1.6355, + "step": 12525 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022695020004607548, + "loss": 1.5779, + "step": 12526 + }, + { + "epoch": 0.99, + "learning_rate": 0.0002269395903551807, + "loss": 1.6294, + "step": 12527 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022692898014190855, + "loss": 1.599, + "step": 12528 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022691836940633107, + "loss": 1.535, + "step": 12529 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022690775814852032, + "loss": 1.5794, + "step": 12530 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022689714636854832, + "loss": 1.5763, + "step": 12531 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022688653406648714, + "loss": 1.6237, + "step": 12532 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022687592124240885, + "loss": 1.5676, + "step": 12533 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022686530789638547, + "loss": 1.6662, + "step": 12534 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022685469402848902, + "loss": 1.5755, + "step": 12535 + }, + { + "epoch": 0.99, + "learning_rate": 0.0002268440796387917, + "loss": 1.6288, + "step": 12536 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022683346472736538, + "loss": 1.5502, + "step": 12537 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022682284929428229, + "loss": 1.5816, + "step": 12538 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022681223333961443, + "loss": 1.5686, + "step": 12539 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022680161686343392, + "loss": 1.5742, + "step": 12540 + }, + { + "epoch": 0.99, + "learning_rate": 0.0002267909998658128, + "loss": 1.6289, + "step": 12541 + }, + { + "epoch": 0.99, + "learning_rate": 0.0002267803823468232, + "loss": 1.6127, + "step": 12542 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022676976430653715, + "loss": 1.5777, + "step": 12543 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022675914574502677, + "loss": 1.5505, + "step": 12544 + }, + { + "epoch": 0.99, + "learning_rate": 0.0002267485266623641, + "loss": 1.5362, + "step": 12545 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022673790705862132, + "loss": 1.5517, + "step": 12546 + }, + { + "epoch": 0.99, + "learning_rate": 0.0002267272869338705, + "loss": 1.5796, + "step": 12547 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022671666628818377, + "loss": 1.5527, + "step": 12548 + }, + { + "epoch": 0.99, + "learning_rate": 0.0002267060451216332, + "loss": 1.5487, + "step": 12549 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022669542343429092, + "loss": 1.5547, + "step": 12550 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022668480122622897, + "loss": 1.6274, + "step": 12551 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022667417849751959, + "loss": 1.6069, + "step": 12552 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022666355524823486, + "loss": 1.6267, + "step": 12553 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022665293147844685, + "loss": 1.5486, + "step": 12554 + }, + { + "epoch": 0.99, + "learning_rate": 0.0002266423071882278, + "loss": 1.5662, + "step": 12555 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022663168237764975, + "loss": 1.6135, + "step": 12556 + }, + { + "epoch": 0.99, + "learning_rate": 0.0002266210570467849, + "loss": 1.5489, + "step": 12557 + }, + { + "epoch": 0.99, + "learning_rate": 0.0002266104311957053, + "loss": 1.5926, + "step": 12558 + }, + { + "epoch": 0.99, + "learning_rate": 0.0002265998048244832, + "loss": 1.6073, + "step": 12559 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022658917793319064, + "loss": 1.5501, + "step": 12560 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022657855052189986, + "loss": 1.6009, + "step": 12561 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022656792259068297, + "loss": 1.557, + "step": 12562 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022655729413961211, + "loss": 1.6037, + "step": 12563 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022654666516875953, + "loss": 1.5963, + "step": 12564 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022653603567819732, + "loss": 1.6278, + "step": 12565 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022652540566799764, + "loss": 1.6209, + "step": 12566 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022651477513823274, + "loss": 1.6265, + "step": 12567 + }, + { + "epoch": 0.99, + "learning_rate": 0.0002265041440889747, + "loss": 1.5955, + "step": 12568 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022649351252029574, + "loss": 1.5794, + "step": 12569 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022648288043226804, + "loss": 1.5962, + "step": 12570 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022647224782496378, + "loss": 1.5634, + "step": 12571 + }, + { + "epoch": 0.99, + "learning_rate": 0.0002264616146984552, + "loss": 1.5974, + "step": 12572 + }, + { + "epoch": 0.99, + "learning_rate": 0.0002264509810528144, + "loss": 1.5984, + "step": 12573 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022644034688811365, + "loss": 1.5789, + "step": 12574 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022642971220442515, + "loss": 1.5912, + "step": 12575 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022641907700182107, + "loss": 1.6386, + "step": 12576 + }, + { + "epoch": 0.99, + "learning_rate": 0.0002264084412803736, + "loss": 1.6094, + "step": 12577 + }, + { + "epoch": 0.99, + "learning_rate": 0.000226397805040155, + "loss": 1.5724, + "step": 12578 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022638716828123748, + "loss": 1.63, + "step": 12579 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022637653100369322, + "loss": 1.5805, + "step": 12580 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022636589320759441, + "loss": 1.6087, + "step": 12581 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022635525489301343, + "loss": 1.542, + "step": 12582 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022634461606002235, + "loss": 1.5816, + "step": 12583 + }, + { + "epoch": 0.99, + "learning_rate": 0.0002263339767086935, + "loss": 1.5448, + "step": 12584 + }, + { + "epoch": 0.99, + "learning_rate": 0.000226323336839099, + "loss": 1.5721, + "step": 12585 + }, + { + "epoch": 0.99, + "learning_rate": 0.0002263126964513112, + "loss": 1.5623, + "step": 12586 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022630205554540232, + "loss": 1.5507, + "step": 12587 + }, + { + "epoch": 0.99, + "learning_rate": 0.0002262914141214446, + "loss": 1.5447, + "step": 12588 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022628077217951023, + "loss": 1.5488, + "step": 12589 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022627012971967151, + "loss": 1.6483, + "step": 12590 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022625948674200074, + "loss": 1.6106, + "step": 12591 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022624884324657014, + "loss": 1.6406, + "step": 12592 + }, + { + "epoch": 0.99, + "learning_rate": 0.0002262381992334519, + "loss": 1.5604, + "step": 12593 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022622755470271845, + "loss": 1.6044, + "step": 12594 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022621690965444192, + "loss": 1.6073, + "step": 12595 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022620626408869466, + "loss": 1.5937, + "step": 12596 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022619561800554892, + "loss": 1.6161, + "step": 12597 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022618497140507694, + "loss": 1.6275, + "step": 12598 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022617432428735112, + "loss": 1.5848, + "step": 12599 + }, + { + "epoch": 0.99, + "learning_rate": 0.0002261636766524436, + "loss": 1.5441, + "step": 12600 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022615302850042675, + "loss": 1.5455, + "step": 12601 + }, + { + "epoch": 0.99, + "learning_rate": 0.0002261423798313729, + "loss": 1.566, + "step": 12602 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022613173064535427, + "loss": 1.5974, + "step": 12603 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022612108094244328, + "loss": 1.6307, + "step": 12604 + }, + { + "epoch": 0.99, + "learning_rate": 0.0002261104307227121, + "loss": 1.5782, + "step": 12605 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022609977998623313, + "loss": 1.592, + "step": 12606 + }, + { + "epoch": 0.99, + "learning_rate": 0.0002260891287330786, + "loss": 1.6166, + "step": 12607 + }, + { + "epoch": 0.99, + "learning_rate": 0.0002260784769633209, + "loss": 1.6064, + "step": 12608 + }, + { + "epoch": 0.99, + "learning_rate": 0.0002260678246770323, + "loss": 1.5772, + "step": 12609 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022605717187428517, + "loss": 1.5655, + "step": 12610 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022604651855515185, + "loss": 1.5842, + "step": 12611 + }, + { + "epoch": 0.99, + "learning_rate": 0.0002260358647197046, + "loss": 1.5485, + "step": 12612 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022602521036801576, + "loss": 1.6106, + "step": 12613 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022601455550015778, + "loss": 1.5921, + "step": 12614 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022600390011620283, + "loss": 1.5755, + "step": 12615 + }, + { + "epoch": 0.99, + "learning_rate": 0.0002259932442162234, + "loss": 1.551, + "step": 12616 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022598258780029168, + "loss": 1.5531, + "step": 12617 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022597193086848025, + "loss": 1.5933, + "step": 12618 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022596127342086123, + "loss": 1.5883, + "step": 12619 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022595061545750713, + "loss": 1.6076, + "step": 12620 + }, + { + "epoch": 0.99, + "learning_rate": 0.0002259399569784903, + "loss": 1.5924, + "step": 12621 + }, + { + "epoch": 0.99, + "learning_rate": 0.000225929297983883, + "loss": 1.5831, + "step": 12622 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022591863847375772, + "loss": 1.647, + "step": 12623 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022590797844818672, + "loss": 1.6436, + "step": 12624 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022589731790724252, + "loss": 1.5894, + "step": 12625 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022588665685099735, + "loss": 1.6032, + "step": 12626 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022587599527952365, + "loss": 1.5954, + "step": 12627 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022586533319289386, + "loss": 1.6194, + "step": 12628 + }, + { + "epoch": 0.99, + "learning_rate": 0.0002258546705911803, + "loss": 1.5773, + "step": 12629 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022584400747445536, + "loss": 1.5993, + "step": 12630 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022583334384279155, + "loss": 1.6108, + "step": 12631 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022582267969626111, + "loss": 1.5828, + "step": 12632 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022581201503493652, + "loss": 1.5952, + "step": 12633 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022580134985889023, + "loss": 1.5659, + "step": 12634 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022579068416819458, + "loss": 1.5873, + "step": 12635 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022578001796292197, + "loss": 1.5775, + "step": 12636 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022576935124314488, + "loss": 1.549, + "step": 12637 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022575868400893578, + "loss": 1.6088, + "step": 12638 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022574801626036695, + "loss": 1.5899, + "step": 12639 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022573734799751088, + "loss": 1.6224, + "step": 12640 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022572667922044002, + "loss": 1.6124, + "step": 12641 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022571600992922678, + "loss": 1.5923, + "step": 12642 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022570534012394367, + "loss": 1.5509, + "step": 12643 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022569466980466307, + "loss": 1.5504, + "step": 12644 + }, + { + "epoch": 0.99, + "learning_rate": 0.00022568399897145744, + "loss": 1.5701, + "step": 12645 + }, + { + "epoch": 1.0, + "learning_rate": 0.0002256733276243992, + "loss": 1.5698, + "step": 12646 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022566265576356084, + "loss": 1.6058, + "step": 12647 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022565198338901478, + "loss": 1.5262, + "step": 12648 + }, + { + "epoch": 1.0, + "learning_rate": 0.0002256413105008335, + "loss": 1.6294, + "step": 12649 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022563063709908946, + "loss": 1.5668, + "step": 12650 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022561996318385517, + "loss": 1.6042, + "step": 12651 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022560928875520306, + "loss": 1.583, + "step": 12652 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022559861381320556, + "loss": 1.5638, + "step": 12653 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022558793835793518, + "loss": 1.6016, + "step": 12654 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022557726238946448, + "loss": 1.6071, + "step": 12655 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022556658590786578, + "loss": 1.5974, + "step": 12656 + }, + { + "epoch": 1.0, + "learning_rate": 0.0002255559089132118, + "loss": 1.5929, + "step": 12657 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022554523140557478, + "loss": 1.6263, + "step": 12658 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022553455338502736, + "loss": 1.6059, + "step": 12659 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022552387485164202, + "loss": 1.5304, + "step": 12660 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022551319580549123, + "loss": 1.593, + "step": 12661 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022550251624664755, + "loss": 1.5504, + "step": 12662 + }, + { + "epoch": 1.0, + "learning_rate": 0.0002254918361751834, + "loss": 1.5655, + "step": 12663 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022548115559117135, + "loss": 1.5817, + "step": 12664 + }, + { + "epoch": 1.0, + "learning_rate": 0.0002254704744946839, + "loss": 1.5986, + "step": 12665 + }, + { + "epoch": 1.0, + "learning_rate": 0.0002254597928857936, + "loss": 1.6303, + "step": 12666 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022544911076457296, + "loss": 1.6426, + "step": 12667 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022543842813109447, + "loss": 1.5656, + "step": 12668 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022542774498543073, + "loss": 1.6326, + "step": 12669 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022541706132765414, + "loss": 1.5846, + "step": 12670 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022540637715783737, + "loss": 1.6251, + "step": 12671 + }, + { + "epoch": 1.0, + "learning_rate": 0.0002253956924760529, + "loss": 1.5935, + "step": 12672 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022538500728237328, + "loss": 1.6438, + "step": 12673 + }, + { + "epoch": 1.0, + "learning_rate": 0.0002253743215768711, + "loss": 1.603, + "step": 12674 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022536363535961886, + "loss": 1.5739, + "step": 12675 + }, + { + "epoch": 1.0, + "learning_rate": 0.0002253529486306891, + "loss": 1.6244, + "step": 12676 + }, + { + "epoch": 1.0, + "learning_rate": 0.0002253422613901544, + "loss": 1.5618, + "step": 12677 + }, + { + "epoch": 1.0, + "learning_rate": 0.0002253315736380874, + "loss": 1.5876, + "step": 12678 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022532088537456047, + "loss": 1.5571, + "step": 12679 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022531019659964634, + "loss": 1.5593, + "step": 12680 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022529950731341755, + "loss": 1.586, + "step": 12681 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022528881751594668, + "loss": 1.5566, + "step": 12682 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022527812720730622, + "loss": 1.5613, + "step": 12683 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022526743638756887, + "loss": 1.5695, + "step": 12684 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022525674505680717, + "loss": 1.6052, + "step": 12685 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022524605321509365, + "loss": 1.5881, + "step": 12686 + }, + { + "epoch": 1.0, + "learning_rate": 0.000225235360862501, + "loss": 1.6302, + "step": 12687 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022522466799910175, + "loss": 1.5983, + "step": 12688 + }, + { + "epoch": 1.0, + "learning_rate": 0.0002252139746249685, + "loss": 1.5641, + "step": 12689 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022520328074017388, + "loss": 1.591, + "step": 12690 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022519258634479052, + "loss": 1.6098, + "step": 12691 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022518189143889096, + "loss": 1.6391, + "step": 12692 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022517119602254783, + "loss": 1.5737, + "step": 12693 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022516050009583385, + "loss": 1.6284, + "step": 12694 + }, + { + "epoch": 1.0, + "learning_rate": 0.0002251498036588214, + "loss": 1.5684, + "step": 12695 + }, + { + "epoch": 1.0, + "learning_rate": 0.0002251391067115834, + "loss": 1.5697, + "step": 12696 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022512840925419222, + "loss": 1.5683, + "step": 12697 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022511771128672068, + "loss": 1.5834, + "step": 12698 + }, + { + "epoch": 1.0, + "learning_rate": 0.0002251070128092413, + "loss": 1.6082, + "step": 12699 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022509631382182675, + "loss": 1.5829, + "step": 12700 + }, + { + "epoch": 1.0, + "learning_rate": 0.0002250856143245497, + "loss": 1.5954, + "step": 12701 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022507491431748272, + "loss": 1.5967, + "step": 12702 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022506421380069853, + "loss": 1.5937, + "step": 12703 + }, + { + "epoch": 1.0, + "learning_rate": 0.0002250535127742697, + "loss": 1.5679, + "step": 12704 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022504281123826903, + "loss": 1.5984, + "step": 12705 + }, + { + "epoch": 1.0, + "learning_rate": 0.000225032109192769, + "loss": 1.5512, + "step": 12706 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022502140663784238, + "loss": 1.5817, + "step": 12707 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022501070357356187, + "loss": 1.6012, + "step": 12708 + }, + { + "epoch": 1.0, + "learning_rate": 0.000225, + "loss": 1.5703, + "step": 12709 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022498929591722953, + "loss": 1.6076, + "step": 12710 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022497859132532315, + "loss": 1.5634, + "step": 12711 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022496788622435347, + "loss": 1.5549, + "step": 12712 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022495718061439328, + "loss": 1.5171, + "step": 12713 + }, + { + "epoch": 1.0, + "learning_rate": 0.0002249464744955151, + "loss": 1.5547, + "step": 12714 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022493576786779179, + "loss": 1.5623, + "step": 12715 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022492506073129597, + "loss": 1.5476, + "step": 12716 + }, + { + "epoch": 1.0, + "learning_rate": 0.0002249143530861003, + "loss": 1.5405, + "step": 12717 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022490364493227757, + "loss": 1.5766, + "step": 12718 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022489293626990034, + "loss": 1.5565, + "step": 12719 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022488222709904148, + "loss": 1.5565, + "step": 12720 + }, + { + "epoch": 1.0, + "learning_rate": 0.0002248715174197736, + "loss": 1.5791, + "step": 12721 + }, + { + "epoch": 1.0, + "learning_rate": 0.0002248608072321694, + "loss": 1.5086, + "step": 12722 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022485009653630167, + "loss": 1.609, + "step": 12723 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022483938533224306, + "loss": 1.6191, + "step": 12724 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022482867362006635, + "loss": 1.5766, + "step": 12725 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022481796139984424, + "loss": 1.5776, + "step": 12726 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022480724867164942, + "loss": 1.5708, + "step": 12727 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022479653543555473, + "loss": 1.6023, + "step": 12728 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022478582169163278, + "loss": 1.5851, + "step": 12729 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022477510743995643, + "loss": 1.5701, + "step": 12730 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022476439268059834, + "loss": 1.5311, + "step": 12731 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022475367741363125, + "loss": 1.5708, + "step": 12732 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022474296163912797, + "loss": 1.5256, + "step": 12733 + }, + { + "epoch": 1.0, + "learning_rate": 0.0002247322453571612, + "loss": 1.5429, + "step": 12734 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022472152856780378, + "loss": 1.5558, + "step": 12735 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022471081127112836, + "loss": 1.5746, + "step": 12736 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022470009346720778, + "loss": 1.566, + "step": 12737 + }, + { + "epoch": 1.0, + "learning_rate": 0.0002246893751561148, + "loss": 1.5642, + "step": 12738 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022467865633792218, + "loss": 1.5734, + "step": 12739 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022466793701270268, + "loss": 1.5814, + "step": 12740 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022465721718052908, + "loss": 1.5865, + "step": 12741 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022464649684147422, + "loss": 1.611, + "step": 12742 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022463577599561078, + "loss": 1.5309, + "step": 12743 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022462505464301163, + "loss": 1.5629, + "step": 12744 + }, + { + "epoch": 1.0, + "learning_rate": 0.0002246143327837496, + "loss": 1.5453, + "step": 12745 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022460361041789739, + "loss": 1.5616, + "step": 12746 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022459288754552782, + "loss": 1.5717, + "step": 12747 + }, + { + "epoch": 1.0, + "learning_rate": 0.0002245821641667137, + "loss": 1.565, + "step": 12748 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022457144028152783, + "loss": 1.5945, + "step": 12749 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022456071589004308, + "loss": 1.5355, + "step": 12750 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022454999099233216, + "loss": 1.5215, + "step": 12751 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022453926558846802, + "loss": 1.5736, + "step": 12752 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022452853967852332, + "loss": 1.5793, + "step": 12753 + }, + { + "epoch": 1.0, + "learning_rate": 0.000224517813262571, + "loss": 1.5752, + "step": 12754 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022450708634068385, + "loss": 1.5909, + "step": 12755 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022449635891293472, + "loss": 1.5237, + "step": 12756 + }, + { + "epoch": 1.0, + "learning_rate": 0.0002244856309793964, + "loss": 1.5917, + "step": 12757 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022447490254014172, + "loss": 1.5519, + "step": 12758 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022446417359524358, + "loss": 1.5484, + "step": 12759 + }, + { + "epoch": 1.0, + "learning_rate": 0.0002244534441447748, + "loss": 1.5631, + "step": 12760 + }, + { + "epoch": 1.0, + "learning_rate": 0.0002244427141888082, + "loss": 1.6429, + "step": 12761 + }, + { + "epoch": 1.0, + "learning_rate": 0.0002244319837274167, + "loss": 1.6174, + "step": 12762 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022442125276067308, + "loss": 1.5602, + "step": 12763 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022441052128865021, + "loss": 1.5686, + "step": 12764 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022439978931142096, + "loss": 1.5839, + "step": 12765 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022438905682905825, + "loss": 1.595, + "step": 12766 + }, + { + "epoch": 1.0, + "learning_rate": 0.0002243783238416348, + "loss": 1.5596, + "step": 12767 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022436759034922364, + "loss": 1.5859, + "step": 12768 + }, + { + "epoch": 1.0, + "learning_rate": 0.0002243568563518976, + "loss": 1.5822, + "step": 12769 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022434612184972947, + "loss": 1.5838, + "step": 12770 + }, + { + "epoch": 1.0, + "learning_rate": 0.00022433538684279224, + "loss": 1.5921, + "step": 12771 + }, + { + "epoch": 1.0, + "learning_rate": 0.0002243246513311588, + "loss": 1.5726, + "step": 12772 + }, + { + "epoch": 1.0, + "learning_rate": 0.0002243139153149019, + "loss": 1.6001, + "step": 12773 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022430317879409457, + "loss": 1.5696, + "step": 12774 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022429244176880967, + "loss": 1.5999, + "step": 12775 + }, + { + "epoch": 1.01, + "learning_rate": 0.0002242817042391201, + "loss": 1.5566, + "step": 12776 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022427096620509872, + "loss": 1.5675, + "step": 12777 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022426022766681845, + "loss": 1.6168, + "step": 12778 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022424948862435226, + "loss": 1.6123, + "step": 12779 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022423874907777299, + "loss": 1.5662, + "step": 12780 + }, + { + "epoch": 1.01, + "learning_rate": 0.0002242280090271536, + "loss": 1.5403, + "step": 12781 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022421726847256696, + "loss": 1.4945, + "step": 12782 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022420652741408605, + "loss": 1.611, + "step": 12783 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022419578585178377, + "loss": 1.5785, + "step": 12784 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022418504378573305, + "loss": 1.5752, + "step": 12785 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022417430121600683, + "loss": 1.5389, + "step": 12786 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022416355814267803, + "loss": 1.5723, + "step": 12787 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022415281456581956, + "loss": 1.6173, + "step": 12788 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022414207048550443, + "loss": 1.5503, + "step": 12789 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022413132590180557, + "loss": 1.5905, + "step": 12790 + }, + { + "epoch": 1.01, + "learning_rate": 0.0002241205808147959, + "loss": 1.5662, + "step": 12791 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022410983522454838, + "loss": 1.5507, + "step": 12792 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022409908913113602, + "loss": 1.5314, + "step": 12793 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022408834253463165, + "loss": 1.5925, + "step": 12794 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022407759543510838, + "loss": 1.5844, + "step": 12795 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022406684783263914, + "loss": 1.5908, + "step": 12796 + }, + { + "epoch": 1.01, + "learning_rate": 0.0002240560997272968, + "loss": 1.6089, + "step": 12797 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022404535111915448, + "loss": 1.5557, + "step": 12798 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022403460200828506, + "loss": 1.5585, + "step": 12799 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022402385239476155, + "loss": 1.5847, + "step": 12800 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022401310227865696, + "loss": 1.5673, + "step": 12801 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022400235166004418, + "loss": 1.5216, + "step": 12802 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022399160053899637, + "loss": 1.6005, + "step": 12803 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022398084891558633, + "loss": 1.5364, + "step": 12804 + }, + { + "epoch": 1.01, + "learning_rate": 0.0002239700967898872, + "loss": 1.5447, + "step": 12805 + }, + { + "epoch": 1.01, + "learning_rate": 0.0002239593441619719, + "loss": 1.5333, + "step": 12806 + }, + { + "epoch": 1.01, + "learning_rate": 0.0002239485910319135, + "loss": 1.5439, + "step": 12807 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022393783739978497, + "loss": 1.5849, + "step": 12808 + }, + { + "epoch": 1.01, + "learning_rate": 0.0002239270832656593, + "loss": 1.553, + "step": 12809 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022391632862960953, + "loss": 1.5324, + "step": 12810 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022390557349170873, + "loss": 1.6348, + "step": 12811 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022389481785202984, + "loss": 1.5242, + "step": 12812 + }, + { + "epoch": 1.01, + "learning_rate": 0.0002238840617106459, + "loss": 1.5984, + "step": 12813 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022387330506763, + "loss": 1.5729, + "step": 12814 + }, + { + "epoch": 1.01, + "learning_rate": 0.0002238625479230551, + "loss": 1.5439, + "step": 12815 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022385179027699422, + "loss": 1.5362, + "step": 12816 + }, + { + "epoch": 1.01, + "learning_rate": 0.0002238410321295205, + "loss": 1.5656, + "step": 12817 + }, + { + "epoch": 1.01, + "learning_rate": 0.0002238302734807069, + "loss": 1.5915, + "step": 12818 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022381951433062645, + "loss": 1.5599, + "step": 12819 + }, + { + "epoch": 1.01, + "learning_rate": 0.0002238087546793523, + "loss": 1.5692, + "step": 12820 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022379799452695734, + "loss": 1.5669, + "step": 12821 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022378723387351485, + "loss": 1.5768, + "step": 12822 + }, + { + "epoch": 1.01, + "learning_rate": 0.0002237764727190977, + "loss": 1.5931, + "step": 12823 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022376571106377897, + "loss": 1.5853, + "step": 12824 + }, + { + "epoch": 1.01, + "learning_rate": 0.0002237549489076318, + "loss": 1.5369, + "step": 12825 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022374418625072925, + "loss": 1.616, + "step": 12826 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022373342309314436, + "loss": 1.5545, + "step": 12827 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022372265943495026, + "loss": 1.5766, + "step": 12828 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022371189527621989, + "loss": 1.5599, + "step": 12829 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022370113061702645, + "loss": 1.5616, + "step": 12830 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022369036545744303, + "loss": 1.5843, + "step": 12831 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022367959979754275, + "loss": 1.5699, + "step": 12832 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022366883363739856, + "loss": 1.5194, + "step": 12833 + }, + { + "epoch": 1.01, + "learning_rate": 0.0002236580669770837, + "loss": 1.5358, + "step": 12834 + }, + { + "epoch": 1.01, + "learning_rate": 0.0002236472998166712, + "loss": 1.5797, + "step": 12835 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022363653215623416, + "loss": 1.5229, + "step": 12836 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022362576399584567, + "loss": 1.582, + "step": 12837 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022361499533557892, + "loss": 1.5767, + "step": 12838 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022360422617550695, + "loss": 1.5873, + "step": 12839 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022359345651570297, + "loss": 1.5708, + "step": 12840 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022358268635623997, + "loss": 1.5444, + "step": 12841 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022357191569719116, + "loss": 1.5909, + "step": 12842 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022356114453862962, + "loss": 1.5707, + "step": 12843 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022355037288062851, + "loss": 1.5262, + "step": 12844 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022353960072326096, + "loss": 1.5964, + "step": 12845 + }, + { + "epoch": 1.01, + "learning_rate": 0.0002235288280666001, + "loss": 1.6067, + "step": 12846 + }, + { + "epoch": 1.01, + "learning_rate": 0.0002235180549107191, + "loss": 1.6097, + "step": 12847 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022350728125569106, + "loss": 1.5079, + "step": 12848 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022349650710158913, + "loss": 1.5432, + "step": 12849 + }, + { + "epoch": 1.01, + "learning_rate": 0.0002234857324484865, + "loss": 1.5512, + "step": 12850 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022347495729645628, + "loss": 1.5179, + "step": 12851 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022346418164557162, + "loss": 1.5642, + "step": 12852 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022345340549590576, + "loss": 1.6375, + "step": 12853 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022344262884753182, + "loss": 1.5717, + "step": 12854 + }, + { + "epoch": 1.01, + "learning_rate": 0.0002234318517005229, + "loss": 1.5243, + "step": 12855 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022342107405495226, + "loss": 1.5669, + "step": 12856 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022341029591089307, + "loss": 1.553, + "step": 12857 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022339951726841844, + "loss": 1.6142, + "step": 12858 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022338873812760164, + "loss": 1.5519, + "step": 12859 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022337795848851574, + "loss": 1.5165, + "step": 12860 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022336717835123407, + "loss": 1.5779, + "step": 12861 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022335639771582966, + "loss": 1.6213, + "step": 12862 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022334561658237585, + "loss": 1.6038, + "step": 12863 + }, + { + "epoch": 1.01, + "learning_rate": 0.0002233348349509458, + "loss": 1.5734, + "step": 12864 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022332405282161265, + "loss": 1.5347, + "step": 12865 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022331327019444963, + "loss": 1.5676, + "step": 12866 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022330248706953, + "loss": 1.606, + "step": 12867 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022329170344692688, + "loss": 1.5473, + "step": 12868 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022328091932671362, + "loss": 1.5691, + "step": 12869 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022327013470896333, + "loss": 1.6428, + "step": 12870 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022325934959374925, + "loss": 1.5478, + "step": 12871 + }, + { + "epoch": 1.01, + "learning_rate": 0.0002232485639811446, + "loss": 1.5801, + "step": 12872 + }, + { + "epoch": 1.01, + "learning_rate": 0.0002232377778712226, + "loss": 1.5864, + "step": 12873 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022322699126405658, + "loss": 1.5576, + "step": 12874 + }, + { + "epoch": 1.01, + "learning_rate": 0.0002232162041597197, + "loss": 1.5487, + "step": 12875 + }, + { + "epoch": 1.01, + "learning_rate": 0.0002232054165582851, + "loss": 1.5291, + "step": 12876 + }, + { + "epoch": 1.01, + "learning_rate": 0.0002231946284598262, + "loss": 1.5736, + "step": 12877 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022318383986441614, + "loss": 1.5259, + "step": 12878 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022317305077212816, + "loss": 1.5355, + "step": 12879 + }, + { + "epoch": 1.01, + "learning_rate": 0.0002231622611830356, + "loss": 1.5456, + "step": 12880 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022315147109721166, + "loss": 1.5803, + "step": 12881 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022314068051472956, + "loss": 1.5745, + "step": 12882 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022312988943566262, + "loss": 1.6124, + "step": 12883 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022311909786008408, + "loss": 1.6066, + "step": 12884 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022310830578806722, + "loss": 1.5796, + "step": 12885 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022309751321968532, + "loss": 1.6492, + "step": 12886 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022308672015501166, + "loss": 1.5245, + "step": 12887 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022307592659411945, + "loss": 1.532, + "step": 12888 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022306513253708208, + "loss": 1.5152, + "step": 12889 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022305433798397274, + "loss": 1.6107, + "step": 12890 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022304354293486482, + "loss": 1.5952, + "step": 12891 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022303274738983144, + "loss": 1.5696, + "step": 12892 + }, + { + "epoch": 1.01, + "learning_rate": 0.0002230219513489461, + "loss": 1.5699, + "step": 12893 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022301115481228195, + "loss": 1.5138, + "step": 12894 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022300035777991239, + "loss": 1.5703, + "step": 12895 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022298956025191072, + "loss": 1.6115, + "step": 12896 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022297876222835016, + "loss": 1.5839, + "step": 12897 + }, + { + "epoch": 1.01, + "learning_rate": 0.0002229679637093041, + "loss": 1.5145, + "step": 12898 + }, + { + "epoch": 1.01, + "learning_rate": 0.0002229571646948458, + "loss": 1.5895, + "step": 12899 + }, + { + "epoch": 1.01, + "learning_rate": 0.00022294636518504864, + "loss": 1.5815, + "step": 12900 + }, + { + "epoch": 1.02, + "learning_rate": 0.0002229355651799859, + "loss": 1.5524, + "step": 12901 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022292476467973094, + "loss": 1.6086, + "step": 12902 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022291396368435707, + "loss": 1.614, + "step": 12903 + }, + { + "epoch": 1.02, + "learning_rate": 0.0002229031621939376, + "loss": 1.5722, + "step": 12904 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022289236020854594, + "loss": 1.5736, + "step": 12905 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022288155772825534, + "loss": 1.5372, + "step": 12906 + }, + { + "epoch": 1.02, + "learning_rate": 0.0002228707547531392, + "loss": 1.5627, + "step": 12907 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022285995128327083, + "loss": 1.5067, + "step": 12908 + }, + { + "epoch": 1.02, + "learning_rate": 0.0002228491473187236, + "loss": 1.6282, + "step": 12909 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022283834285957086, + "loss": 1.5346, + "step": 12910 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022282753790588597, + "loss": 1.6062, + "step": 12911 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022281673245774227, + "loss": 1.5768, + "step": 12912 + }, + { + "epoch": 1.02, + "learning_rate": 0.0002228059265152132, + "loss": 1.5961, + "step": 12913 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022279512007837205, + "loss": 1.6004, + "step": 12914 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022278431314729215, + "loss": 1.6025, + "step": 12915 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022277350572204695, + "loss": 1.5462, + "step": 12916 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022276269780270987, + "loss": 1.5645, + "step": 12917 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022275188938935417, + "loss": 1.5028, + "step": 12918 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022274108048205325, + "loss": 1.5501, + "step": 12919 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022273027108088065, + "loss": 1.5388, + "step": 12920 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022271946118590955, + "loss": 1.5813, + "step": 12921 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022270865079721344, + "loss": 1.6022, + "step": 12922 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022269783991486574, + "loss": 1.6066, + "step": 12923 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022268702853893982, + "loss": 1.5844, + "step": 12924 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022267621666950912, + "loss": 1.5676, + "step": 12925 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022266540430664696, + "loss": 1.5804, + "step": 12926 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022265459145042686, + "loss": 1.5435, + "step": 12927 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022264377810092214, + "loss": 1.5871, + "step": 12928 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022263296425820627, + "loss": 1.5755, + "step": 12929 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022262214992235265, + "loss": 1.5691, + "step": 12930 + }, + { + "epoch": 1.02, + "learning_rate": 0.0002226113350934347, + "loss": 1.5873, + "step": 12931 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022260051977152586, + "loss": 1.5803, + "step": 12932 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022258970395669958, + "loss": 1.6099, + "step": 12933 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022257888764902925, + "loss": 1.6084, + "step": 12934 + }, + { + "epoch": 1.02, + "learning_rate": 0.0002225680708485883, + "loss": 1.573, + "step": 12935 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022255725355545023, + "loss": 1.5501, + "step": 12936 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022254643576968846, + "loss": 1.589, + "step": 12937 + }, + { + "epoch": 1.02, + "learning_rate": 0.0002225356174913764, + "loss": 1.557, + "step": 12938 + }, + { + "epoch": 1.02, + "learning_rate": 0.0002225247987205875, + "loss": 1.6282, + "step": 12939 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022251397945739526, + "loss": 1.5555, + "step": 12940 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022250315970187313, + "loss": 1.5573, + "step": 12941 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022249233945409458, + "loss": 1.5591, + "step": 12942 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022248151871413297, + "loss": 1.5818, + "step": 12943 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022247069748206194, + "loss": 1.5731, + "step": 12944 + }, + { + "epoch": 1.02, + "learning_rate": 0.0002224598757579548, + "loss": 1.5645, + "step": 12945 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022244905354188512, + "loss": 1.6237, + "step": 12946 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022243823083392631, + "loss": 1.569, + "step": 12947 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022242740763415194, + "loss": 1.5595, + "step": 12948 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022241658394263542, + "loss": 1.555, + "step": 12949 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022240575975945024, + "loss": 1.5565, + "step": 12950 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022239493508466993, + "loss": 1.6198, + "step": 12951 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022238410991836798, + "loss": 1.6036, + "step": 12952 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022237328426061783, + "loss": 1.5187, + "step": 12953 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022236245811149303, + "loss": 1.5594, + "step": 12954 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022235163147106706, + "loss": 1.5909, + "step": 12955 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022234080433941348, + "loss": 1.5982, + "step": 12956 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022232997671660574, + "loss": 1.584, + "step": 12957 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022231914860271733, + "loss": 1.542, + "step": 12958 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022230831999782186, + "loss": 1.6387, + "step": 12959 + }, + { + "epoch": 1.02, + "learning_rate": 0.0002222974909019928, + "loss": 1.6186, + "step": 12960 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022228666131530366, + "loss": 1.5631, + "step": 12961 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022227583123782794, + "loss": 1.5677, + "step": 12962 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022226500066963926, + "loss": 1.5856, + "step": 12963 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022225416961081112, + "loss": 1.5581, + "step": 12964 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022224333806141703, + "loss": 1.5023, + "step": 12965 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022223250602153055, + "loss": 1.5463, + "step": 12966 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022222167349122518, + "loss": 1.5329, + "step": 12967 + }, + { + "epoch": 1.02, + "learning_rate": 0.0002222108404705745, + "loss": 1.5496, + "step": 12968 + }, + { + "epoch": 1.02, + "learning_rate": 0.0002222000069596521, + "loss": 1.5387, + "step": 12969 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022218917295853145, + "loss": 1.5037, + "step": 12970 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022217833846728622, + "loss": 1.5783, + "step": 12971 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022216750348598983, + "loss": 1.65, + "step": 12972 + }, + { + "epoch": 1.02, + "learning_rate": 0.000222156668014716, + "loss": 1.6246, + "step": 12973 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022214583205353814, + "loss": 1.5719, + "step": 12974 + }, + { + "epoch": 1.02, + "learning_rate": 0.0002221349956025299, + "loss": 1.5717, + "step": 12975 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022212415866176488, + "loss": 1.5632, + "step": 12976 + }, + { + "epoch": 1.02, + "learning_rate": 0.0002221133212313166, + "loss": 1.5807, + "step": 12977 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022210248331125867, + "loss": 1.5827, + "step": 12978 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022209164490166465, + "loss": 1.5819, + "step": 12979 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022208080600260815, + "loss": 1.5274, + "step": 12980 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022206996661416282, + "loss": 1.5935, + "step": 12981 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022205912673640212, + "loss": 1.5686, + "step": 12982 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022204828636939976, + "loss": 1.5366, + "step": 12983 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022203744551322922, + "loss": 1.5499, + "step": 12984 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022202660416796425, + "loss": 1.5735, + "step": 12985 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022201576233367833, + "loss": 1.5675, + "step": 12986 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022200492001044517, + "loss": 1.5769, + "step": 12987 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022199407719833831, + "loss": 1.6106, + "step": 12988 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022198323389743143, + "loss": 1.6385, + "step": 12989 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022197239010779808, + "loss": 1.6015, + "step": 12990 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022196154582951194, + "loss": 1.5195, + "step": 12991 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022195070106264663, + "loss": 1.5573, + "step": 12992 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022193985580727576, + "loss": 1.6263, + "step": 12993 + }, + { + "epoch": 1.02, + "learning_rate": 0.0002219290100634729, + "loss": 1.5938, + "step": 12994 + }, + { + "epoch": 1.02, + "learning_rate": 0.0002219181638313118, + "loss": 1.5931, + "step": 12995 + }, + { + "epoch": 1.02, + "learning_rate": 0.0002219073171108661, + "loss": 1.5371, + "step": 12996 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022189646990220934, + "loss": 1.625, + "step": 12997 + }, + { + "epoch": 1.02, + "learning_rate": 0.0002218856222054153, + "loss": 1.5833, + "step": 12998 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022187477402055747, + "loss": 1.594, + "step": 12999 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022186392534770963, + "loss": 1.6006, + "step": 13000 + }, + { + "epoch": 1.02, + "learning_rate": 0.0002218530761869454, + "loss": 1.6179, + "step": 13001 + }, + { + "epoch": 1.02, + "learning_rate": 0.0002218422265383384, + "loss": 1.5422, + "step": 13002 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022183137640196233, + "loss": 1.5836, + "step": 13003 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022182052577789088, + "loss": 1.5648, + "step": 13004 + }, + { + "epoch": 1.02, + "learning_rate": 0.0002218096746661977, + "loss": 1.6029, + "step": 13005 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022179882306695643, + "loss": 1.57, + "step": 13006 + }, + { + "epoch": 1.02, + "learning_rate": 0.0002217879709802408, + "loss": 1.5806, + "step": 13007 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022177711840612447, + "loss": 1.585, + "step": 13008 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022176626534468107, + "loss": 1.5812, + "step": 13009 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022175541179598435, + "loss": 1.5386, + "step": 13010 + }, + { + "epoch": 1.02, + "learning_rate": 0.000221744557760108, + "loss": 1.5731, + "step": 13011 + }, + { + "epoch": 1.02, + "learning_rate": 0.0002217337032371257, + "loss": 1.563, + "step": 13012 + }, + { + "epoch": 1.02, + "learning_rate": 0.0002217228482271111, + "loss": 1.5541, + "step": 13013 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022171199273013798, + "loss": 1.5158, + "step": 13014 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022170113674627997, + "loss": 1.5674, + "step": 13015 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022169028027561085, + "loss": 1.5621, + "step": 13016 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022167942331820426, + "loss": 1.5241, + "step": 13017 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022166856587413396, + "loss": 1.558, + "step": 13018 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022165770794347361, + "loss": 1.5289, + "step": 13019 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022164684952629703, + "loss": 1.5952, + "step": 13020 + }, + { + "epoch": 1.02, + "learning_rate": 0.0002216359906226778, + "loss": 1.5298, + "step": 13021 + }, + { + "epoch": 1.02, + "learning_rate": 0.0002216251312326898, + "loss": 1.6042, + "step": 13022 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022161427135640666, + "loss": 1.5422, + "step": 13023 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022160341099390212, + "loss": 1.5521, + "step": 13024 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022159255014524991, + "loss": 1.6151, + "step": 13025 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022158168881052386, + "loss": 1.5719, + "step": 13026 + }, + { + "epoch": 1.02, + "learning_rate": 0.00022157082698979761, + "loss": 1.5696, + "step": 13027 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022155996468314494, + "loss": 1.5272, + "step": 13028 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022154910189063962, + "loss": 1.5539, + "step": 13029 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022153823861235534, + "loss": 1.5456, + "step": 13030 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022152737484836595, + "loss": 1.5787, + "step": 13031 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022151651059874517, + "loss": 1.5683, + "step": 13032 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022150564586356664, + "loss": 1.55, + "step": 13033 + }, + { + "epoch": 1.03, + "learning_rate": 0.0002214947806429043, + "loss": 1.5298, + "step": 13034 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022148391493683188, + "loss": 1.5785, + "step": 13035 + }, + { + "epoch": 1.03, + "learning_rate": 0.0002214730487454231, + "loss": 1.6301, + "step": 13036 + }, + { + "epoch": 1.03, + "learning_rate": 0.0002214621820687518, + "loss": 1.5962, + "step": 13037 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022145131490689164, + "loss": 1.5122, + "step": 13038 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022144044725991654, + "loss": 1.5746, + "step": 13039 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022142957912790021, + "loss": 1.6018, + "step": 13040 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022141871051091646, + "loss": 1.5769, + "step": 13041 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022140784140903906, + "loss": 1.6113, + "step": 13042 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022139697182234184, + "loss": 1.5662, + "step": 13043 + }, + { + "epoch": 1.03, + "learning_rate": 0.0002213861017508986, + "loss": 1.5961, + "step": 13044 + }, + { + "epoch": 1.03, + "learning_rate": 0.0002213752311947831, + "loss": 1.5725, + "step": 13045 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022136436015406918, + "loss": 1.5518, + "step": 13046 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022135348862883063, + "loss": 1.5165, + "step": 13047 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022134261661914127, + "loss": 1.6185, + "step": 13048 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022133174412507488, + "loss": 1.5526, + "step": 13049 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022132087114670537, + "loss": 1.5696, + "step": 13050 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022130999768410646, + "loss": 1.5924, + "step": 13051 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022129912373735204, + "loss": 1.5269, + "step": 13052 + }, + { + "epoch": 1.03, + "learning_rate": 0.0002212882493065159, + "loss": 1.6137, + "step": 13053 + }, + { + "epoch": 1.03, + "learning_rate": 0.0002212773743916719, + "loss": 1.5659, + "step": 13054 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022126649899289387, + "loss": 1.555, + "step": 13055 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022125562311025565, + "loss": 1.5826, + "step": 13056 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022124474674383102, + "loss": 1.5928, + "step": 13057 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022123386989369393, + "loss": 1.5164, + "step": 13058 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022122299255991813, + "loss": 1.5189, + "step": 13059 + }, + { + "epoch": 1.03, + "learning_rate": 0.0002212121147425775, + "loss": 1.4595, + "step": 13060 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022120123644174598, + "loss": 1.5635, + "step": 13061 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022119035765749733, + "loss": 1.6173, + "step": 13062 + }, + { + "epoch": 1.03, + "learning_rate": 0.0002211794783899054, + "loss": 1.5862, + "step": 13063 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022116859863904412, + "loss": 1.5988, + "step": 13064 + }, + { + "epoch": 1.03, + "learning_rate": 0.0002211577184049873, + "loss": 1.5771, + "step": 13065 + }, + { + "epoch": 1.03, + "learning_rate": 0.0002211468376878089, + "loss": 1.5188, + "step": 13066 + }, + { + "epoch": 1.03, + "learning_rate": 0.0002211359564875827, + "loss": 1.5221, + "step": 13067 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022112507480438263, + "loss": 1.5356, + "step": 13068 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022111419263828253, + "loss": 1.6176, + "step": 13069 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022110330998935631, + "loss": 1.5327, + "step": 13070 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022109242685767786, + "loss": 1.6169, + "step": 13071 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022108154324332102, + "loss": 1.5447, + "step": 13072 + }, + { + "epoch": 1.03, + "learning_rate": 0.0002210706591463598, + "loss": 1.5192, + "step": 13073 + }, + { + "epoch": 1.03, + "learning_rate": 0.000221059774566868, + "loss": 1.556, + "step": 13074 + }, + { + "epoch": 1.03, + "learning_rate": 0.0002210488895049195, + "loss": 1.5468, + "step": 13075 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022103800396058832, + "loss": 1.5532, + "step": 13076 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022102711793394825, + "loss": 1.5709, + "step": 13077 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022101623142507326, + "loss": 1.5237, + "step": 13078 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022100534443403726, + "loss": 1.5336, + "step": 13079 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022099445696091411, + "loss": 1.6235, + "step": 13080 + }, + { + "epoch": 1.03, + "learning_rate": 0.0002209835690057778, + "loss": 1.6045, + "step": 13081 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022097268056870222, + "loss": 1.6023, + "step": 13082 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022096179164976136, + "loss": 1.5852, + "step": 13083 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022095090224902902, + "loss": 1.5824, + "step": 13084 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022094001236657926, + "loss": 1.6005, + "step": 13085 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022092912200248594, + "loss": 1.5858, + "step": 13086 + }, + { + "epoch": 1.03, + "learning_rate": 0.000220918231156823, + "loss": 1.5629, + "step": 13087 + }, + { + "epoch": 1.03, + "learning_rate": 0.0002209073398296644, + "loss": 1.6149, + "step": 13088 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022089644802108417, + "loss": 1.5474, + "step": 13089 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022088555573115612, + "loss": 1.6006, + "step": 13090 + }, + { + "epoch": 1.03, + "learning_rate": 0.0002208746629599543, + "loss": 1.548, + "step": 13091 + }, + { + "epoch": 1.03, + "learning_rate": 0.0002208637697075526, + "loss": 1.5448, + "step": 13092 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022085287597402504, + "loss": 1.6067, + "step": 13093 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022084198175944552, + "loss": 1.5731, + "step": 13094 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022083108706388808, + "loss": 1.5673, + "step": 13095 + }, + { + "epoch": 1.03, + "learning_rate": 0.0002208201918874266, + "loss": 1.5787, + "step": 13096 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022080929623013513, + "loss": 1.5829, + "step": 13097 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022079840009208755, + "loss": 1.5479, + "step": 13098 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022078750347335796, + "loss": 1.5671, + "step": 13099 + }, + { + "epoch": 1.03, + "learning_rate": 0.0002207766063740203, + "loss": 1.5946, + "step": 13100 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022076570879414853, + "loss": 1.5336, + "step": 13101 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022075481073381662, + "loss": 1.5719, + "step": 13102 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022074391219309861, + "loss": 1.6146, + "step": 13103 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022073301317206845, + "loss": 1.5436, + "step": 13104 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022072211367080025, + "loss": 1.5821, + "step": 13105 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022071121368936783, + "loss": 1.5666, + "step": 13106 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022070031322784535, + "loss": 1.5747, + "step": 13107 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022068941228630675, + "loss": 1.6303, + "step": 13108 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022067851086482603, + "loss": 1.5886, + "step": 13109 + }, + { + "epoch": 1.03, + "learning_rate": 0.0002206676089634772, + "loss": 1.5317, + "step": 13110 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022065670658233435, + "loss": 1.5128, + "step": 13111 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022064580372147143, + "loss": 1.5206, + "step": 13112 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022063490038096248, + "loss": 1.5921, + "step": 13113 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022062399656088156, + "loss": 1.6043, + "step": 13114 + }, + { + "epoch": 1.03, + "learning_rate": 0.0002206130922613027, + "loss": 1.5227, + "step": 13115 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022060218748229984, + "loss": 1.5594, + "step": 13116 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022059128222394716, + "loss": 1.5875, + "step": 13117 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022058037648631858, + "loss": 1.5, + "step": 13118 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022056947026948822, + "loss": 1.5429, + "step": 13119 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022055856357353006, + "loss": 1.5512, + "step": 13120 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022054765639851822, + "loss": 1.5143, + "step": 13121 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022053674874452677, + "loss": 1.5462, + "step": 13122 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022052584061162966, + "loss": 1.5916, + "step": 13123 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022051493199990103, + "loss": 1.543, + "step": 13124 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022050402290941493, + "loss": 1.6087, + "step": 13125 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022049311334024538, + "loss": 1.5231, + "step": 13126 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022048220329246655, + "loss": 1.6186, + "step": 13127 + }, + { + "epoch": 1.03, + "learning_rate": 0.0002204712927661524, + "loss": 1.5477, + "step": 13128 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022046038176137714, + "loss": 1.6007, + "step": 13129 + }, + { + "epoch": 1.03, + "learning_rate": 0.0002204494702782147, + "loss": 1.5725, + "step": 13130 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022043855831673924, + "loss": 1.6043, + "step": 13131 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022042764587702489, + "loss": 1.5431, + "step": 13132 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022041673295914563, + "loss": 1.5494, + "step": 13133 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022040581956317567, + "loss": 1.5427, + "step": 13134 + }, + { + "epoch": 1.03, + "learning_rate": 0.000220394905689189, + "loss": 1.5869, + "step": 13135 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022038399133725978, + "loss": 1.5472, + "step": 13136 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022037307650746212, + "loss": 1.5744, + "step": 13137 + }, + { + "epoch": 1.03, + "learning_rate": 0.0002203621611998701, + "loss": 1.5365, + "step": 13138 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022035124541455785, + "loss": 1.5206, + "step": 13139 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022034032915159942, + "loss": 1.5656, + "step": 13140 + }, + { + "epoch": 1.03, + "learning_rate": 0.000220329412411069, + "loss": 1.5653, + "step": 13141 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022031849519304068, + "loss": 1.5356, + "step": 13142 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022030757749758856, + "loss": 1.5565, + "step": 13143 + }, + { + "epoch": 1.03, + "learning_rate": 0.0002202966593247868, + "loss": 1.6126, + "step": 13144 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022028574067470952, + "loss": 1.5567, + "step": 13145 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022027482154743087, + "loss": 1.5106, + "step": 13146 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022026390194302493, + "loss": 1.5435, + "step": 13147 + }, + { + "epoch": 1.03, + "learning_rate": 0.0002202529818615659, + "loss": 1.5571, + "step": 13148 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022024206130312788, + "loss": 1.5958, + "step": 13149 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022023114026778503, + "loss": 1.5903, + "step": 13150 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022022021875561147, + "loss": 1.5188, + "step": 13151 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022020929676668137, + "loss": 1.5837, + "step": 13152 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022019837430106893, + "loss": 1.5436, + "step": 13153 + }, + { + "epoch": 1.03, + "learning_rate": 0.00022018745135884824, + "loss": 1.6005, + "step": 13154 + }, + { + "epoch": 1.04, + "learning_rate": 0.00022017652794009348, + "loss": 1.5811, + "step": 13155 + }, + { + "epoch": 1.04, + "learning_rate": 0.00022016560404487887, + "loss": 1.5656, + "step": 13156 + }, + { + "epoch": 1.04, + "learning_rate": 0.0002201546796732785, + "loss": 1.5265, + "step": 13157 + }, + { + "epoch": 1.04, + "learning_rate": 0.00022014375482536655, + "loss": 1.5292, + "step": 13158 + }, + { + "epoch": 1.04, + "learning_rate": 0.0002201328295012172, + "loss": 1.5694, + "step": 13159 + }, + { + "epoch": 1.04, + "learning_rate": 0.0002201219037009047, + "loss": 1.555, + "step": 13160 + }, + { + "epoch": 1.04, + "learning_rate": 0.00022011097742450316, + "loss": 1.5903, + "step": 13161 + }, + { + "epoch": 1.04, + "learning_rate": 0.0002201000506720867, + "loss": 1.5731, + "step": 13162 + }, + { + "epoch": 1.04, + "learning_rate": 0.00022008912344372968, + "loss": 1.6098, + "step": 13163 + }, + { + "epoch": 1.04, + "learning_rate": 0.00022007819573950614, + "loss": 1.5223, + "step": 13164 + }, + { + "epoch": 1.04, + "learning_rate": 0.00022006726755949033, + "loss": 1.5604, + "step": 13165 + }, + { + "epoch": 1.04, + "learning_rate": 0.00022005633890375645, + "loss": 1.4896, + "step": 13166 + }, + { + "epoch": 1.04, + "learning_rate": 0.00022004540977237867, + "loss": 1.5852, + "step": 13167 + }, + { + "epoch": 1.04, + "learning_rate": 0.0002200344801654312, + "loss": 1.5973, + "step": 13168 + }, + { + "epoch": 1.04, + "learning_rate": 0.00022002355008298826, + "loss": 1.517, + "step": 13169 + }, + { + "epoch": 1.04, + "learning_rate": 0.0002200126195251241, + "loss": 1.5914, + "step": 13170 + }, + { + "epoch": 1.04, + "learning_rate": 0.0002200016884919129, + "loss": 1.5571, + "step": 13171 + }, + { + "epoch": 1.04, + "learning_rate": 0.0002199907569834288, + "loss": 1.6102, + "step": 13172 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021997982499974612, + "loss": 1.5174, + "step": 13173 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021996889254093902, + "loss": 1.5694, + "step": 13174 + }, + { + "epoch": 1.04, + "learning_rate": 0.0002199579596070818, + "loss": 1.5672, + "step": 13175 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021994702619824858, + "loss": 1.6213, + "step": 13176 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021993609231451368, + "loss": 1.5697, + "step": 13177 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021992515795595132, + "loss": 1.5594, + "step": 13178 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021991422312263575, + "loss": 1.6254, + "step": 13179 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021990328781464115, + "loss": 1.6169, + "step": 13180 + }, + { + "epoch": 1.04, + "learning_rate": 0.0002198923520320418, + "loss": 1.5538, + "step": 13181 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021988141577491193, + "loss": 1.558, + "step": 13182 + }, + { + "epoch": 1.04, + "learning_rate": 0.0002198704790433258, + "loss": 1.6071, + "step": 13183 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021985954183735773, + "loss": 1.5684, + "step": 13184 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021984860415708192, + "loss": 1.5828, + "step": 13185 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021983766600257263, + "loss": 1.6016, + "step": 13186 + }, + { + "epoch": 1.04, + "learning_rate": 0.0002198267273739041, + "loss": 1.6679, + "step": 13187 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021981578827115063, + "loss": 1.6116, + "step": 13188 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021980484869438648, + "loss": 1.6306, + "step": 13189 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021979390864368593, + "loss": 1.5847, + "step": 13190 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021978296811912327, + "loss": 1.5809, + "step": 13191 + }, + { + "epoch": 1.04, + "learning_rate": 0.0002197720271207728, + "loss": 1.5469, + "step": 13192 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021976108564870873, + "loss": 1.5419, + "step": 13193 + }, + { + "epoch": 1.04, + "learning_rate": 0.0002197501437030054, + "loss": 1.5784, + "step": 13194 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021973920128373706, + "loss": 1.5654, + "step": 13195 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021972825839097803, + "loss": 1.625, + "step": 13196 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021971731502480265, + "loss": 1.5625, + "step": 13197 + }, + { + "epoch": 1.04, + "learning_rate": 0.0002197063711852851, + "loss": 1.5649, + "step": 13198 + }, + { + "epoch": 1.04, + "learning_rate": 0.0002196954268724998, + "loss": 1.5251, + "step": 13199 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021968448208652103, + "loss": 1.6216, + "step": 13200 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021967353682742305, + "loss": 1.5568, + "step": 13201 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021966259109528025, + "loss": 1.5873, + "step": 13202 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021965164489016684, + "loss": 1.5478, + "step": 13203 + }, + { + "epoch": 1.04, + "learning_rate": 0.0002196406982121572, + "loss": 1.567, + "step": 13204 + }, + { + "epoch": 1.04, + "learning_rate": 0.0002196297510613257, + "loss": 1.5459, + "step": 13205 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021961880343774657, + "loss": 1.5921, + "step": 13206 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021960785534149422, + "loss": 1.513, + "step": 13207 + }, + { + "epoch": 1.04, + "learning_rate": 0.0002195969067726429, + "loss": 1.5519, + "step": 13208 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021958595773126705, + "loss": 1.5647, + "step": 13209 + }, + { + "epoch": 1.04, + "learning_rate": 0.0002195750082174409, + "loss": 1.586, + "step": 13210 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021956405823123884, + "loss": 1.6158, + "step": 13211 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021955310777273528, + "loss": 1.5901, + "step": 13212 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021954215684200442, + "loss": 1.5541, + "step": 13213 + }, + { + "epoch": 1.04, + "learning_rate": 0.0002195312054391207, + "loss": 1.5339, + "step": 13214 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021952025356415848, + "loss": 1.6325, + "step": 13215 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021950930121719211, + "loss": 1.593, + "step": 13216 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021949834839829596, + "loss": 1.5262, + "step": 13217 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021948739510754435, + "loss": 1.5632, + "step": 13218 + }, + { + "epoch": 1.04, + "learning_rate": 0.0002194764413450117, + "loss": 1.5556, + "step": 13219 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021946548711077233, + "loss": 1.6297, + "step": 13220 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021945453240490066, + "loss": 1.5822, + "step": 13221 + }, + { + "epoch": 1.04, + "learning_rate": 0.000219443577227471, + "loss": 1.5225, + "step": 13222 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021943262157855776, + "loss": 1.5889, + "step": 13223 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021942166545823542, + "loss": 1.5825, + "step": 13224 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021941070886657824, + "loss": 1.591, + "step": 13225 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021939975180366064, + "loss": 1.572, + "step": 13226 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021938879426955705, + "loss": 1.5793, + "step": 13227 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021937783626434178, + "loss": 1.4996, + "step": 13228 + }, + { + "epoch": 1.04, + "learning_rate": 0.0002193668777880893, + "loss": 1.5794, + "step": 13229 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021935591884087404, + "loss": 1.5321, + "step": 13230 + }, + { + "epoch": 1.04, + "learning_rate": 0.0002193449594227704, + "loss": 1.5565, + "step": 13231 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021933399953385268, + "loss": 1.5516, + "step": 13232 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021932303917419538, + "loss": 1.5769, + "step": 13233 + }, + { + "epoch": 1.04, + "learning_rate": 0.0002193120783438729, + "loss": 1.5985, + "step": 13234 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021930111704295967, + "loss": 1.6331, + "step": 13235 + }, + { + "epoch": 1.04, + "learning_rate": 0.0002192901552715301, + "loss": 1.5775, + "step": 13236 + }, + { + "epoch": 1.04, + "learning_rate": 0.0002192791930296586, + "loss": 1.6029, + "step": 13237 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021926823031741962, + "loss": 1.5746, + "step": 13238 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021925726713488758, + "loss": 1.5051, + "step": 13239 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021924630348213692, + "loss": 1.5342, + "step": 13240 + }, + { + "epoch": 1.04, + "learning_rate": 0.0002192353393592421, + "loss": 1.5725, + "step": 13241 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021922437476627746, + "loss": 1.5601, + "step": 13242 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021921340970331755, + "loss": 1.5324, + "step": 13243 + }, + { + "epoch": 1.04, + "learning_rate": 0.0002192024441704368, + "loss": 1.5432, + "step": 13244 + }, + { + "epoch": 1.04, + "learning_rate": 0.0002191914781677096, + "loss": 1.6287, + "step": 13245 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021918051169521048, + "loss": 1.5272, + "step": 13246 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021916954475301387, + "loss": 1.6059, + "step": 13247 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021915857734119425, + "loss": 1.5795, + "step": 13248 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021914760945982603, + "loss": 1.6461, + "step": 13249 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021913664110898367, + "loss": 1.5372, + "step": 13250 + }, + { + "epoch": 1.04, + "learning_rate": 0.0002191256722887417, + "loss": 1.5909, + "step": 13251 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021911470299917454, + "loss": 1.6018, + "step": 13252 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021910373324035668, + "loss": 1.5998, + "step": 13253 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021909276301236262, + "loss": 1.5836, + "step": 13254 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021908179231526687, + "loss": 1.5514, + "step": 13255 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021907082114914383, + "loss": 1.541, + "step": 13256 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021905984951406802, + "loss": 1.5866, + "step": 13257 + }, + { + "epoch": 1.04, + "learning_rate": 0.000219048877410114, + "loss": 1.5844, + "step": 13258 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021903790483735613, + "loss": 1.5698, + "step": 13259 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021902693179586902, + "loss": 1.5387, + "step": 13260 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021901595828572711, + "loss": 1.5642, + "step": 13261 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021900498430700493, + "loss": 1.5829, + "step": 13262 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021899400985977705, + "loss": 1.5685, + "step": 13263 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021898303494411787, + "loss": 1.545, + "step": 13264 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021897205956010197, + "loss": 1.5406, + "step": 13265 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021896108370780384, + "loss": 1.5716, + "step": 13266 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021895010738729796, + "loss": 1.6312, + "step": 13267 + }, + { + "epoch": 1.04, + "learning_rate": 0.000218939130598659, + "loss": 1.5768, + "step": 13268 + }, + { + "epoch": 1.04, + "learning_rate": 0.0002189281533419613, + "loss": 1.5928, + "step": 13269 + }, + { + "epoch": 1.04, + "learning_rate": 0.0002189171756172795, + "loss": 1.5745, + "step": 13270 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021890619742468814, + "loss": 1.5196, + "step": 13271 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021889521876426165, + "loss": 1.6021, + "step": 13272 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021888423963607474, + "loss": 1.5822, + "step": 13273 + }, + { + "epoch": 1.04, + "learning_rate": 0.0002188732600402018, + "loss": 1.4956, + "step": 13274 + }, + { + "epoch": 1.04, + "learning_rate": 0.0002188622799767175, + "loss": 1.5373, + "step": 13275 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021885129944569623, + "loss": 1.5832, + "step": 13276 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021884031844721265, + "loss": 1.554, + "step": 13277 + }, + { + "epoch": 1.04, + "learning_rate": 0.0002188293369813413, + "loss": 1.5884, + "step": 13278 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021881835504815672, + "loss": 1.5647, + "step": 13279 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021880737264773356, + "loss": 1.5707, + "step": 13280 + }, + { + "epoch": 1.04, + "learning_rate": 0.00021879638978014625, + "loss": 1.5864, + "step": 13281 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021878540644546944, + "loss": 1.6006, + "step": 13282 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021877442264377767, + "loss": 1.5641, + "step": 13283 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021876343837514553, + "loss": 1.5283, + "step": 13284 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021875245363964758, + "loss": 1.5792, + "step": 13285 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021874146843735843, + "loss": 1.556, + "step": 13286 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021873048276835263, + "loss": 1.5541, + "step": 13287 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021871949663270477, + "loss": 1.6204, + "step": 13288 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021870851003048943, + "loss": 1.5504, + "step": 13289 + }, + { + "epoch": 1.05, + "learning_rate": 0.0002186975229617813, + "loss": 1.5363, + "step": 13290 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021868653542665484, + "loss": 1.6054, + "step": 13291 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021867554742518473, + "loss": 1.5454, + "step": 13292 + }, + { + "epoch": 1.05, + "learning_rate": 0.0002186645589574455, + "loss": 1.6188, + "step": 13293 + }, + { + "epoch": 1.05, + "learning_rate": 0.0002186535700235119, + "loss": 1.4926, + "step": 13294 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021864258062345837, + "loss": 1.5286, + "step": 13295 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021863159075735962, + "loss": 1.5761, + "step": 13296 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021862060042529026, + "loss": 1.5768, + "step": 13297 + }, + { + "epoch": 1.05, + "learning_rate": 0.0002186096096273249, + "loss": 1.5876, + "step": 13298 + }, + { + "epoch": 1.05, + "learning_rate": 0.0002185986183635381, + "loss": 1.5256, + "step": 13299 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021858762663400455, + "loss": 1.5221, + "step": 13300 + }, + { + "epoch": 1.05, + "learning_rate": 0.0002185766344387989, + "loss": 1.5777, + "step": 13301 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021856564177799573, + "loss": 1.5656, + "step": 13302 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021855464865166968, + "loss": 1.5568, + "step": 13303 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021854365505989543, + "loss": 1.58, + "step": 13304 + }, + { + "epoch": 1.05, + "learning_rate": 0.0002185326610027476, + "loss": 1.5449, + "step": 13305 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021852166648030075, + "loss": 1.5926, + "step": 13306 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021851067149262967, + "loss": 1.5555, + "step": 13307 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021849967603980883, + "loss": 1.5567, + "step": 13308 + }, + { + "epoch": 1.05, + "learning_rate": 0.0002184886801219131, + "loss": 1.5339, + "step": 13309 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021847768373901697, + "loss": 1.5611, + "step": 13310 + }, + { + "epoch": 1.05, + "learning_rate": 0.0002184666868911952, + "loss": 1.5655, + "step": 13311 + }, + { + "epoch": 1.05, + "learning_rate": 0.0002184556895785224, + "loss": 1.5727, + "step": 13312 + }, + { + "epoch": 1.05, + "learning_rate": 0.0002184446918010732, + "loss": 1.5384, + "step": 13313 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021843369355892234, + "loss": 1.5824, + "step": 13314 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021842269485214448, + "loss": 1.5781, + "step": 13315 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021841169568081426, + "loss": 1.5765, + "step": 13316 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021840069604500638, + "loss": 1.5588, + "step": 13317 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021838969594479554, + "loss": 1.5729, + "step": 13318 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021837869538025642, + "loss": 1.544, + "step": 13319 + }, + { + "epoch": 1.05, + "learning_rate": 0.0002183676943514636, + "loss": 1.5441, + "step": 13320 + }, + { + "epoch": 1.05, + "learning_rate": 0.000218356692858492, + "loss": 1.5514, + "step": 13321 + }, + { + "epoch": 1.05, + "learning_rate": 0.0002183456909014161, + "loss": 1.5609, + "step": 13322 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021833468848031067, + "loss": 1.6014, + "step": 13323 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021832368559525042, + "loss": 1.5917, + "step": 13324 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021831268224631006, + "loss": 1.6101, + "step": 13325 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021830167843356427, + "loss": 1.565, + "step": 13326 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021829067415708782, + "loss": 1.5762, + "step": 13327 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021827966941695531, + "loss": 1.614, + "step": 13328 + }, + { + "epoch": 1.05, + "learning_rate": 0.0002182686642132416, + "loss": 1.5847, + "step": 13329 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021825765854602128, + "loss": 1.5806, + "step": 13330 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021824665241536916, + "loss": 1.572, + "step": 13331 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021823564582135988, + "loss": 1.5846, + "step": 13332 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021822463876406827, + "loss": 1.5611, + "step": 13333 + }, + { + "epoch": 1.05, + "learning_rate": 0.000218213631243569, + "loss": 1.5591, + "step": 13334 + }, + { + "epoch": 1.05, + "learning_rate": 0.0002182026232599368, + "loss": 1.5637, + "step": 13335 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021819161481324644, + "loss": 1.5427, + "step": 13336 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021818060590357265, + "loss": 1.5351, + "step": 13337 + }, + { + "epoch": 1.05, + "learning_rate": 0.0002181695965309902, + "loss": 1.5392, + "step": 13338 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021815858669557372, + "loss": 1.5487, + "step": 13339 + }, + { + "epoch": 1.05, + "learning_rate": 0.0002181475763973981, + "loss": 1.5874, + "step": 13340 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021813656563653806, + "loss": 1.5303, + "step": 13341 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021812555441306833, + "loss": 1.5851, + "step": 13342 + }, + { + "epoch": 1.05, + "learning_rate": 0.0002181145427270637, + "loss": 1.5053, + "step": 13343 + }, + { + "epoch": 1.05, + "learning_rate": 0.0002181035305785989, + "loss": 1.553, + "step": 13344 + }, + { + "epoch": 1.05, + "learning_rate": 0.0002180925179677487, + "loss": 1.5625, + "step": 13345 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021808150489458788, + "loss": 1.5712, + "step": 13346 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021807049135919119, + "loss": 1.524, + "step": 13347 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021805947736163345, + "loss": 1.6045, + "step": 13348 + }, + { + "epoch": 1.05, + "learning_rate": 0.0002180484629019894, + "loss": 1.5201, + "step": 13349 + }, + { + "epoch": 1.05, + "learning_rate": 0.0002180374479803339, + "loss": 1.5794, + "step": 13350 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021802643259674162, + "loss": 1.5595, + "step": 13351 + }, + { + "epoch": 1.05, + "learning_rate": 0.0002180154167512874, + "loss": 1.5889, + "step": 13352 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021800440044404605, + "loss": 1.5374, + "step": 13353 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021799338367509236, + "loss": 1.564, + "step": 13354 + }, + { + "epoch": 1.05, + "learning_rate": 0.0002179823664445011, + "loss": 1.572, + "step": 13355 + }, + { + "epoch": 1.05, + "learning_rate": 0.0002179713487523471, + "loss": 1.5162, + "step": 13356 + }, + { + "epoch": 1.05, + "learning_rate": 0.0002179603305987051, + "loss": 1.5835, + "step": 13357 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021794931198365004, + "loss": 1.5896, + "step": 13358 + }, + { + "epoch": 1.05, + "learning_rate": 0.0002179382929072566, + "loss": 1.5905, + "step": 13359 + }, + { + "epoch": 1.05, + "learning_rate": 0.0002179272733695997, + "loss": 1.5631, + "step": 13360 + }, + { + "epoch": 1.05, + "learning_rate": 0.000217916253370754, + "loss": 1.5282, + "step": 13361 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021790523291079447, + "loss": 1.5595, + "step": 13362 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021789421198979591, + "loss": 1.5691, + "step": 13363 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021788319060783308, + "loss": 1.5781, + "step": 13364 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021787216876498086, + "loss": 1.592, + "step": 13365 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021786114646131404, + "loss": 1.6039, + "step": 13366 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021785012369690754, + "loss": 1.566, + "step": 13367 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021783910047183612, + "loss": 1.6002, + "step": 13368 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021782807678617466, + "loss": 1.5302, + "step": 13369 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021781705263999797, + "loss": 1.5444, + "step": 13370 + }, + { + "epoch": 1.05, + "learning_rate": 0.0002178060280333809, + "loss": 1.612, + "step": 13371 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021779500296639832, + "loss": 1.5042, + "step": 13372 + }, + { + "epoch": 1.05, + "learning_rate": 0.0002177839774391251, + "loss": 1.5382, + "step": 13373 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021777295145163607, + "loss": 1.5949, + "step": 13374 + }, + { + "epoch": 1.05, + "learning_rate": 0.0002177619250040061, + "loss": 1.6194, + "step": 13375 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021775089809631006, + "loss": 1.5711, + "step": 13376 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021773987072862285, + "loss": 1.5354, + "step": 13377 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021772884290101926, + "loss": 1.5308, + "step": 13378 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021771781461357416, + "loss": 1.5679, + "step": 13379 + }, + { + "epoch": 1.05, + "learning_rate": 0.0002177067858663625, + "loss": 1.5861, + "step": 13380 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021769575665945914, + "loss": 1.5861, + "step": 13381 + }, + { + "epoch": 1.05, + "learning_rate": 0.000217684726992939, + "loss": 1.5523, + "step": 13382 + }, + { + "epoch": 1.05, + "learning_rate": 0.0002176736968668768, + "loss": 1.5399, + "step": 13383 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021766266628134764, + "loss": 1.5932, + "step": 13384 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021765163523642628, + "loss": 1.5614, + "step": 13385 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021764060373218768, + "loss": 1.5585, + "step": 13386 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021762957176870663, + "loss": 1.5957, + "step": 13387 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021761853934605817, + "loss": 1.5572, + "step": 13388 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021760750646431716, + "loss": 1.5519, + "step": 13389 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021759647312355845, + "loss": 1.5961, + "step": 13390 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021758543932385698, + "loss": 1.4874, + "step": 13391 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021757440506528774, + "loss": 1.5365, + "step": 13392 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021756337034792552, + "loss": 1.5491, + "step": 13393 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021755233517184528, + "loss": 1.5697, + "step": 13394 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021754129953712202, + "loss": 1.585, + "step": 13395 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021753026344383057, + "loss": 1.5524, + "step": 13396 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021751922689204593, + "loss": 1.6348, + "step": 13397 + }, + { + "epoch": 1.05, + "learning_rate": 0.000217508189881843, + "loss": 1.5511, + "step": 13398 + }, + { + "epoch": 1.05, + "learning_rate": 0.0002174971524132967, + "loss": 1.544, + "step": 13399 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021748611448648198, + "loss": 1.5862, + "step": 13400 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021747507610147377, + "loss": 1.5559, + "step": 13401 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021746403725834705, + "loss": 1.5442, + "step": 13402 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021745299795717673, + "loss": 1.5757, + "step": 13403 + }, + { + "epoch": 1.05, + "learning_rate": 0.0002174419581980378, + "loss": 1.5337, + "step": 13404 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021743091798100516, + "loss": 1.562, + "step": 13405 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021741987730615386, + "loss": 1.5961, + "step": 13406 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021740883617355874, + "loss": 1.5624, + "step": 13407 + }, + { + "epoch": 1.05, + "learning_rate": 0.00021739779458329484, + "loss": 1.5305, + "step": 13408 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021738675253543712, + "loss": 1.6133, + "step": 13409 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021737571003006047, + "loss": 1.5707, + "step": 13410 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021736466706724002, + "loss": 1.5798, + "step": 13411 + }, + { + "epoch": 1.06, + "learning_rate": 0.0002173536236470506, + "loss": 1.5143, + "step": 13412 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021734257976956727, + "loss": 1.5801, + "step": 13413 + }, + { + "epoch": 1.06, + "learning_rate": 0.000217331535434865, + "loss": 1.5763, + "step": 13414 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021732049064301874, + "loss": 1.547, + "step": 13415 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021730944539410352, + "loss": 1.5452, + "step": 13416 + }, + { + "epoch": 1.06, + "learning_rate": 0.0002172983996881943, + "loss": 1.5773, + "step": 13417 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021728735352536605, + "loss": 1.5881, + "step": 13418 + }, + { + "epoch": 1.06, + "learning_rate": 0.0002172763069056938, + "loss": 1.576, + "step": 13419 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021726525982925258, + "loss": 1.555, + "step": 13420 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021725421229611738, + "loss": 1.5712, + "step": 13421 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021724316430636316, + "loss": 1.5317, + "step": 13422 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021723211586006501, + "loss": 1.5569, + "step": 13423 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021722106695729786, + "loss": 1.5439, + "step": 13424 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021721001759813675, + "loss": 1.5908, + "step": 13425 + }, + { + "epoch": 1.06, + "learning_rate": 0.0002171989677826567, + "loss": 1.5467, + "step": 13426 + }, + { + "epoch": 1.06, + "learning_rate": 0.0002171879175109328, + "loss": 1.5516, + "step": 13427 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021717686678304, + "loss": 1.5923, + "step": 13428 + }, + { + "epoch": 1.06, + "learning_rate": 0.0002171658155990533, + "loss": 1.5506, + "step": 13429 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021715476395904783, + "loss": 1.5773, + "step": 13430 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021714371186309857, + "loss": 1.5598, + "step": 13431 + }, + { + "epoch": 1.06, + "learning_rate": 0.0002171326593112805, + "loss": 1.5634, + "step": 13432 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021712160630366878, + "loss": 1.4876, + "step": 13433 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021711055284033835, + "loss": 1.5538, + "step": 13434 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021709949892136432, + "loss": 1.5383, + "step": 13435 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021708844454682174, + "loss": 1.5631, + "step": 13436 + }, + { + "epoch": 1.06, + "learning_rate": 0.0002170773897167856, + "loss": 1.6015, + "step": 13437 + }, + { + "epoch": 1.06, + "learning_rate": 0.0002170663344313311, + "loss": 1.5734, + "step": 13438 + }, + { + "epoch": 1.06, + "learning_rate": 0.0002170552786905331, + "loss": 1.5585, + "step": 13439 + }, + { + "epoch": 1.06, + "learning_rate": 0.0002170442224944668, + "loss": 1.5027, + "step": 13440 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021703316584320722, + "loss": 1.5386, + "step": 13441 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021702210873682942, + "loss": 1.588, + "step": 13442 + }, + { + "epoch": 1.06, + "learning_rate": 0.0002170110511754085, + "loss": 1.5593, + "step": 13443 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021699999315901952, + "loss": 1.4894, + "step": 13444 + }, + { + "epoch": 1.06, + "learning_rate": 0.0002169889346877376, + "loss": 1.6082, + "step": 13445 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021697787576163772, + "loss": 1.5714, + "step": 13446 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021696681638079505, + "loss": 1.6282, + "step": 13447 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021695575654528466, + "loss": 1.5871, + "step": 13448 + }, + { + "epoch": 1.06, + "learning_rate": 0.0002169446962551816, + "loss": 1.5966, + "step": 13449 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021693363551056102, + "loss": 1.6374, + "step": 13450 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021692257431149797, + "loss": 1.5588, + "step": 13451 + }, + { + "epoch": 1.06, + "learning_rate": 0.0002169115126580676, + "loss": 1.57, + "step": 13452 + }, + { + "epoch": 1.06, + "learning_rate": 0.000216900450550345, + "loss": 1.5624, + "step": 13453 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021688938798840524, + "loss": 1.5738, + "step": 13454 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021687832497232346, + "loss": 1.5316, + "step": 13455 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021686726150217474, + "loss": 1.5383, + "step": 13456 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021685619757803423, + "loss": 1.5823, + "step": 13457 + }, + { + "epoch": 1.06, + "learning_rate": 0.000216845133199977, + "loss": 1.5235, + "step": 13458 + }, + { + "epoch": 1.06, + "learning_rate": 0.0002168340683680782, + "loss": 1.5068, + "step": 13459 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021682300308241304, + "loss": 1.5826, + "step": 13460 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021681193734305647, + "loss": 1.5906, + "step": 13461 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021680087115008378, + "loss": 1.4911, + "step": 13462 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021678980450357002, + "loss": 1.4993, + "step": 13463 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021677873740359033, + "loss": 1.5869, + "step": 13464 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021676766985021987, + "loss": 1.5511, + "step": 13465 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021675660184353375, + "loss": 1.5967, + "step": 13466 + }, + { + "epoch": 1.06, + "learning_rate": 0.0002167455333836072, + "loss": 1.5375, + "step": 13467 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021673446447051527, + "loss": 1.5719, + "step": 13468 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021672339510433317, + "loss": 1.6014, + "step": 13469 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021671232528513607, + "loss": 1.5249, + "step": 13470 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021670125501299902, + "loss": 1.5504, + "step": 13471 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021669018428799734, + "loss": 1.5619, + "step": 13472 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021667911311020602, + "loss": 1.5998, + "step": 13473 + }, + { + "epoch": 1.06, + "learning_rate": 0.0002166680414797004, + "loss": 1.582, + "step": 13474 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021665696939655553, + "loss": 1.5754, + "step": 13475 + }, + { + "epoch": 1.06, + "learning_rate": 0.0002166458968608466, + "loss": 1.5622, + "step": 13476 + }, + { + "epoch": 1.06, + "learning_rate": 0.0002166348238726489, + "loss": 1.555, + "step": 13477 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021662375043203744, + "loss": 1.6117, + "step": 13478 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021661267653908748, + "loss": 1.558, + "step": 13479 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021660160219387424, + "loss": 1.5635, + "step": 13480 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021659052739647283, + "loss": 1.5426, + "step": 13481 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021657945214695852, + "loss": 1.4794, + "step": 13482 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021656837644540647, + "loss": 1.5531, + "step": 13483 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021655730029189192, + "loss": 1.556, + "step": 13484 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021654622368648995, + "loss": 1.544, + "step": 13485 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021653514662927587, + "loss": 1.5406, + "step": 13486 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021652406912032492, + "loss": 1.6195, + "step": 13487 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021651299115971217, + "loss": 1.5094, + "step": 13488 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021650191274751295, + "loss": 1.6377, + "step": 13489 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021649083388380243, + "loss": 1.5773, + "step": 13490 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021647975456865588, + "loss": 1.5862, + "step": 13491 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021646867480214845, + "loss": 1.5992, + "step": 13492 + }, + { + "epoch": 1.06, + "learning_rate": 0.0002164575945843554, + "loss": 1.5655, + "step": 13493 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021644651391535197, + "loss": 1.6099, + "step": 13494 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021643543279521336, + "loss": 1.5384, + "step": 13495 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021642435122401482, + "loss": 1.5684, + "step": 13496 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021641326920183158, + "loss": 1.531, + "step": 13497 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021640218672873892, + "loss": 1.5498, + "step": 13498 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021639110380481207, + "loss": 1.5835, + "step": 13499 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021638002043012622, + "loss": 1.5331, + "step": 13500 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021636893660475674, + "loss": 1.5658, + "step": 13501 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021635785232877874, + "loss": 1.5123, + "step": 13502 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021634676760226752, + "loss": 1.5602, + "step": 13503 + }, + { + "epoch": 1.06, + "learning_rate": 0.0002163356824252984, + "loss": 1.589, + "step": 13504 + }, + { + "epoch": 1.06, + "learning_rate": 0.0002163245967979466, + "loss": 1.5982, + "step": 13505 + }, + { + "epoch": 1.06, + "learning_rate": 0.0002163135107202874, + "loss": 1.5877, + "step": 13506 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021630242419239603, + "loss": 1.5279, + "step": 13507 + }, + { + "epoch": 1.06, + "learning_rate": 0.0002162913372143478, + "loss": 1.5544, + "step": 13508 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021628024978621798, + "loss": 1.5629, + "step": 13509 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021626916190808186, + "loss": 1.5647, + "step": 13510 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021625807358001468, + "loss": 1.5456, + "step": 13511 + }, + { + "epoch": 1.06, + "learning_rate": 0.0002162469848020917, + "loss": 1.5871, + "step": 13512 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021623589557438834, + "loss": 1.5973, + "step": 13513 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021622480589697973, + "loss": 1.5785, + "step": 13514 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021621371576994124, + "loss": 1.5033, + "step": 13515 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021620262519334818, + "loss": 1.5628, + "step": 13516 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021619153416727583, + "loss": 1.6004, + "step": 13517 + }, + { + "epoch": 1.06, + "learning_rate": 0.0002161804426917995, + "loss": 1.5369, + "step": 13518 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021616935076699447, + "loss": 1.5904, + "step": 13519 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021615825839293605, + "loss": 1.5283, + "step": 13520 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021614716556969958, + "loss": 1.5917, + "step": 13521 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021613607229736036, + "loss": 1.6127, + "step": 13522 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021612497857599372, + "loss": 1.571, + "step": 13523 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021611388440567495, + "loss": 1.5297, + "step": 13524 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021610278978647938, + "loss": 1.5308, + "step": 13525 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021609169471848238, + "loss": 1.5928, + "step": 13526 + }, + { + "epoch": 1.06, + "learning_rate": 0.0002160805992017592, + "loss": 1.5682, + "step": 13527 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021606950323638526, + "loss": 1.5742, + "step": 13528 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021605840682243583, + "loss": 1.5596, + "step": 13529 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021604730995998628, + "loss": 1.5287, + "step": 13530 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021603621264911193, + "loss": 1.5751, + "step": 13531 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021602511488988814, + "loss": 1.5343, + "step": 13532 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021601401668239027, + "loss": 1.5977, + "step": 13533 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021600291802669364, + "loss": 1.6154, + "step": 13534 + }, + { + "epoch": 1.06, + "learning_rate": 0.00021599181892287362, + "loss": 1.555, + "step": 13535 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021598071937100558, + "loss": 1.5636, + "step": 13536 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021596961937116486, + "loss": 1.5717, + "step": 13537 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021595851892342686, + "loss": 1.5739, + "step": 13538 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021594741802786685, + "loss": 1.5599, + "step": 13539 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021593631668456032, + "loss": 1.5987, + "step": 13540 + }, + { + "epoch": 1.07, + "learning_rate": 0.0002159252148935826, + "loss": 1.5399, + "step": 13541 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021591411265500899, + "loss": 1.564, + "step": 13542 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021590300996891497, + "loss": 1.5214, + "step": 13543 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021589190683537584, + "loss": 1.5477, + "step": 13544 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021588080325446706, + "loss": 1.5356, + "step": 13545 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021586969922626398, + "loss": 1.5882, + "step": 13546 + }, + { + "epoch": 1.07, + "learning_rate": 0.000215858594750842, + "loss": 1.6175, + "step": 13547 + }, + { + "epoch": 1.07, + "learning_rate": 0.0002158474898282765, + "loss": 1.5434, + "step": 13548 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021583638445864286, + "loss": 1.5902, + "step": 13549 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021582527864201653, + "loss": 1.5542, + "step": 13550 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021581417237847284, + "loss": 1.6015, + "step": 13551 + }, + { + "epoch": 1.07, + "learning_rate": 0.0002158030656680873, + "loss": 1.536, + "step": 13552 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021579195851093518, + "loss": 1.5795, + "step": 13553 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021578085090709202, + "loss": 1.6138, + "step": 13554 + }, + { + "epoch": 1.07, + "learning_rate": 0.0002157697428566332, + "loss": 1.663, + "step": 13555 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021575863435963408, + "loss": 1.5657, + "step": 13556 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021574752541617015, + "loss": 1.5395, + "step": 13557 + }, + { + "epoch": 1.07, + "learning_rate": 0.0002157364160263168, + "loss": 1.5864, + "step": 13558 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021572530619014946, + "loss": 1.5683, + "step": 13559 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021571419590774352, + "loss": 1.6056, + "step": 13560 + }, + { + "epoch": 1.07, + "learning_rate": 0.0002157030851791745, + "loss": 1.5661, + "step": 13561 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021569197400451778, + "loss": 1.5532, + "step": 13562 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021568086238384882, + "loss": 1.532, + "step": 13563 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021566975031724303, + "loss": 1.5192, + "step": 13564 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021565863780477593, + "loss": 1.5692, + "step": 13565 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021564752484652284, + "loss": 1.5393, + "step": 13566 + }, + { + "epoch": 1.07, + "learning_rate": 0.0002156364114425593, + "loss": 1.5636, + "step": 13567 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021562529759296077, + "loss": 1.5194, + "step": 13568 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021561418329780268, + "loss": 1.5819, + "step": 13569 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021560306855716044, + "loss": 1.5863, + "step": 13570 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021559195337110963, + "loss": 1.5575, + "step": 13571 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021558083773972567, + "loss": 1.5522, + "step": 13572 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021556972166308398, + "loss": 1.5577, + "step": 13573 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021555860514126007, + "loss": 1.5885, + "step": 13574 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021554748817432937, + "loss": 1.5757, + "step": 13575 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021553637076236743, + "loss": 1.5617, + "step": 13576 + }, + { + "epoch": 1.07, + "learning_rate": 0.0002155252529054497, + "loss": 1.5224, + "step": 13577 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021551413460365164, + "loss": 1.5858, + "step": 13578 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021550301585704883, + "loss": 1.5724, + "step": 13579 + }, + { + "epoch": 1.07, + "learning_rate": 0.0002154918966657166, + "loss": 1.5666, + "step": 13580 + }, + { + "epoch": 1.07, + "learning_rate": 0.0002154807770297306, + "loss": 1.6197, + "step": 13581 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021546965694916622, + "loss": 1.5932, + "step": 13582 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021545853642409898, + "loss": 1.5456, + "step": 13583 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021544741545460446, + "loss": 1.6024, + "step": 13584 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021543629404075808, + "loss": 1.5765, + "step": 13585 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021542517218263538, + "loss": 1.5975, + "step": 13586 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021541404988031186, + "loss": 1.5559, + "step": 13587 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021540292713386305, + "loss": 1.5685, + "step": 13588 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021539180394336446, + "loss": 1.5679, + "step": 13589 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021538068030889157, + "loss": 1.5979, + "step": 13590 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021536955623051995, + "loss": 1.5585, + "step": 13591 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021535843170832511, + "loss": 1.591, + "step": 13592 + }, + { + "epoch": 1.07, + "learning_rate": 0.0002153473067423826, + "loss": 1.5245, + "step": 13593 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021533618133276795, + "loss": 1.6036, + "step": 13594 + }, + { + "epoch": 1.07, + "learning_rate": 0.0002153250554795567, + "loss": 1.5567, + "step": 13595 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021531392918282434, + "loss": 1.5703, + "step": 13596 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021530280244264646, + "loss": 1.5635, + "step": 13597 + }, + { + "epoch": 1.07, + "learning_rate": 0.0002152916752590986, + "loss": 1.5332, + "step": 13598 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021528054763225626, + "loss": 1.5939, + "step": 13599 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021526941956219505, + "loss": 1.5698, + "step": 13600 + }, + { + "epoch": 1.07, + "learning_rate": 0.0002152582910489905, + "loss": 1.56, + "step": 13601 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021524716209271816, + "loss": 1.5505, + "step": 13602 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021523603269345365, + "loss": 1.5326, + "step": 13603 + }, + { + "epoch": 1.07, + "learning_rate": 0.0002152249028512724, + "loss": 1.5725, + "step": 13604 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021521377256625006, + "loss": 1.5391, + "step": 13605 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021520264183846227, + "loss": 1.5635, + "step": 13606 + }, + { + "epoch": 1.07, + "learning_rate": 0.0002151915106679844, + "loss": 1.5572, + "step": 13607 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021518037905489225, + "loss": 1.5579, + "step": 13608 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021516924699926124, + "loss": 1.5992, + "step": 13609 + }, + { + "epoch": 1.07, + "learning_rate": 0.000215158114501167, + "loss": 1.5697, + "step": 13610 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021514698156068518, + "loss": 1.5652, + "step": 13611 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021513584817789126, + "loss": 1.5474, + "step": 13612 + }, + { + "epoch": 1.07, + "learning_rate": 0.0002151247143528609, + "loss": 1.5957, + "step": 13613 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021511358008566962, + "loss": 1.6077, + "step": 13614 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021510244537639313, + "loss": 1.5703, + "step": 13615 + }, + { + "epoch": 1.07, + "learning_rate": 0.0002150913102251069, + "loss": 1.5638, + "step": 13616 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021508017463188662, + "loss": 1.5838, + "step": 13617 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021506903859680793, + "loss": 1.5684, + "step": 13618 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021505790211994631, + "loss": 1.5954, + "step": 13619 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021504676520137746, + "loss": 1.4958, + "step": 13620 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021503562784117697, + "loss": 1.6329, + "step": 13621 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021502449003942039, + "loss": 1.5669, + "step": 13622 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021501335179618348, + "loss": 1.55, + "step": 13623 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021500221311154179, + "loss": 1.5926, + "step": 13624 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021499107398557094, + "loss": 1.5325, + "step": 13625 + }, + { + "epoch": 1.07, + "learning_rate": 0.0002149799344183465, + "loss": 1.6094, + "step": 13626 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021496879440994425, + "loss": 1.5272, + "step": 13627 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021495765396043967, + "loss": 1.617, + "step": 13628 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021494651306990848, + "loss": 1.5665, + "step": 13629 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021493537173842634, + "loss": 1.5169, + "step": 13630 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021492422996606883, + "loss": 1.5593, + "step": 13631 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021491308775291166, + "loss": 1.5681, + "step": 13632 + }, + { + "epoch": 1.07, + "learning_rate": 0.0002149019450990304, + "loss": 1.6085, + "step": 13633 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021489080200450079, + "loss": 1.5672, + "step": 13634 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021487965846939843, + "loss": 1.6229, + "step": 13635 + }, + { + "epoch": 1.07, + "learning_rate": 0.000214868514493799, + "loss": 1.6037, + "step": 13636 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021485737007777815, + "loss": 1.6078, + "step": 13637 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021484622522141152, + "loss": 1.5564, + "step": 13638 + }, + { + "epoch": 1.07, + "learning_rate": 0.0002148350799247748, + "loss": 1.5393, + "step": 13639 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021482393418794372, + "loss": 1.5516, + "step": 13640 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021481278801099388, + "loss": 1.5633, + "step": 13641 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021480164139400099, + "loss": 1.5463, + "step": 13642 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021479049433704067, + "loss": 1.5657, + "step": 13643 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021477934684018866, + "loss": 1.544, + "step": 13644 + }, + { + "epoch": 1.07, + "learning_rate": 0.0002147681989035207, + "loss": 1.5763, + "step": 13645 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021475705052711232, + "loss": 1.5053, + "step": 13646 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021474590171103935, + "loss": 1.5659, + "step": 13647 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021473475245537742, + "loss": 1.5452, + "step": 13648 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021472360276020226, + "loss": 1.6075, + "step": 13649 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021471245262558953, + "loss": 1.5396, + "step": 13650 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021470130205161498, + "loss": 1.5804, + "step": 13651 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021469015103835434, + "loss": 1.5491, + "step": 13652 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021467899958588322, + "loss": 1.6211, + "step": 13653 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021466784769427733, + "loss": 1.5605, + "step": 13654 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021465669536361253, + "loss": 1.6249, + "step": 13655 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021464554259396438, + "loss": 1.5329, + "step": 13656 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021463438938540874, + "loss": 1.6086, + "step": 13657 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021462323573802125, + "loss": 1.5538, + "step": 13658 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021461208165187763, + "loss": 1.5266, + "step": 13659 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021460092712705366, + "loss": 1.5925, + "step": 13660 + }, + { + "epoch": 1.07, + "learning_rate": 0.000214589772163625, + "loss": 1.6184, + "step": 13661 + }, + { + "epoch": 1.07, + "learning_rate": 0.00021457861676166742, + "loss": 1.5373, + "step": 13662 + }, + { + "epoch": 1.08, + "learning_rate": 0.0002145674609212567, + "loss": 1.5784, + "step": 13663 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021455630464246856, + "loss": 1.588, + "step": 13664 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021454514792537875, + "loss": 1.5689, + "step": 13665 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021453399077006296, + "loss": 1.5336, + "step": 13666 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021452283317659703, + "loss": 1.5689, + "step": 13667 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021451167514505663, + "loss": 1.5837, + "step": 13668 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021450051667551757, + "loss": 1.5869, + "step": 13669 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021448935776805558, + "loss": 1.5962, + "step": 13670 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021447819842274648, + "loss": 1.6095, + "step": 13671 + }, + { + "epoch": 1.08, + "learning_rate": 0.000214467038639666, + "loss": 1.5895, + "step": 13672 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021445587841888988, + "loss": 1.5934, + "step": 13673 + }, + { + "epoch": 1.08, + "learning_rate": 0.0002144447177604939, + "loss": 1.564, + "step": 13674 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021443355666455387, + "loss": 1.5369, + "step": 13675 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021442239513114552, + "loss": 1.5239, + "step": 13676 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021441123316034467, + "loss": 1.5475, + "step": 13677 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021440007075222708, + "loss": 1.5008, + "step": 13678 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021438890790686862, + "loss": 1.5663, + "step": 13679 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021437774462434496, + "loss": 1.5748, + "step": 13680 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021436658090473194, + "loss": 1.5864, + "step": 13681 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021435541674810535, + "loss": 1.5801, + "step": 13682 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021434425215454097, + "loss": 1.5184, + "step": 13683 + }, + { + "epoch": 1.08, + "learning_rate": 0.0002143330871241147, + "loss": 1.5668, + "step": 13684 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021432192165690217, + "loss": 1.5414, + "step": 13685 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021431075575297935, + "loss": 1.5696, + "step": 13686 + }, + { + "epoch": 1.08, + "learning_rate": 0.000214299589412422, + "loss": 1.6006, + "step": 13687 + }, + { + "epoch": 1.08, + "learning_rate": 0.0002142884226353059, + "loss": 1.5411, + "step": 13688 + }, + { + "epoch": 1.08, + "learning_rate": 0.0002142772554217069, + "loss": 1.569, + "step": 13689 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021426608777170078, + "loss": 1.576, + "step": 13690 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021425491968536341, + "loss": 1.558, + "step": 13691 + }, + { + "epoch": 1.08, + "learning_rate": 0.0002142437511627706, + "loss": 1.54, + "step": 13692 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021423258220399816, + "loss": 1.5963, + "step": 13693 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021422141280912194, + "loss": 1.6287, + "step": 13694 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021421024297821773, + "loss": 1.5534, + "step": 13695 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021419907271136147, + "loss": 1.5886, + "step": 13696 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021418790200862888, + "loss": 1.5539, + "step": 13697 + }, + { + "epoch": 1.08, + "learning_rate": 0.0002141767308700959, + "loss": 1.5612, + "step": 13698 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021416555929583831, + "loss": 1.5863, + "step": 13699 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021415438728593196, + "loss": 1.6106, + "step": 13700 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021414321484045275, + "loss": 1.5618, + "step": 13701 + }, + { + "epoch": 1.08, + "learning_rate": 0.0002141320419594765, + "loss": 1.5289, + "step": 13702 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021412086864307911, + "loss": 1.513, + "step": 13703 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021410969489133635, + "loss": 1.5279, + "step": 13704 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021409852070432416, + "loss": 1.5774, + "step": 13705 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021408734608211843, + "loss": 1.5874, + "step": 13706 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021407617102479494, + "loss": 1.6025, + "step": 13707 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021406499553242963, + "loss": 1.5554, + "step": 13708 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021405381960509833, + "loss": 1.5917, + "step": 13709 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021404264324287697, + "loss": 1.5381, + "step": 13710 + }, + { + "epoch": 1.08, + "learning_rate": 0.0002140314664458414, + "loss": 1.5163, + "step": 13711 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021402028921406745, + "loss": 1.5724, + "step": 13712 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021400911154763116, + "loss": 1.5897, + "step": 13713 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021399793344660826, + "loss": 1.5977, + "step": 13714 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021398675491107475, + "loss": 1.5494, + "step": 13715 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021397557594110648, + "loss": 1.5493, + "step": 13716 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021396439653677927, + "loss": 1.5714, + "step": 13717 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021395321669816922, + "loss": 1.5732, + "step": 13718 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021394203642535205, + "loss": 1.5318, + "step": 13719 + }, + { + "epoch": 1.08, + "learning_rate": 0.0002139308557184038, + "loss": 1.629, + "step": 13720 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021391967457740026, + "loss": 1.5534, + "step": 13721 + }, + { + "epoch": 1.08, + "learning_rate": 0.0002139084930024174, + "loss": 1.5681, + "step": 13722 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021389731099353122, + "loss": 1.5454, + "step": 13723 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021388612855081747, + "loss": 1.5267, + "step": 13724 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021387494567435221, + "loss": 1.616, + "step": 13725 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021386376236421132, + "loss": 1.5868, + "step": 13726 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021385257862047074, + "loss": 1.573, + "step": 13727 + }, + { + "epoch": 1.08, + "learning_rate": 0.0002138413944432063, + "loss": 1.5653, + "step": 13728 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021383020983249413, + "loss": 1.5359, + "step": 13729 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021381902478841, + "loss": 1.5714, + "step": 13730 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021380783931102993, + "loss": 1.6057, + "step": 13731 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021379665340042983, + "loss": 1.56, + "step": 13732 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021378546705668564, + "loss": 1.621, + "step": 13733 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021377428027987336, + "loss": 1.5337, + "step": 13734 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021376309307006894, + "loss": 1.5875, + "step": 13735 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021375190542734826, + "loss": 1.5301, + "step": 13736 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021374071735178737, + "loss": 1.6265, + "step": 13737 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021372952884346212, + "loss": 1.5243, + "step": 13738 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021371833990244856, + "loss": 1.5229, + "step": 13739 + }, + { + "epoch": 1.08, + "learning_rate": 0.0002137071505288226, + "loss": 1.5682, + "step": 13740 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021369596072266033, + "loss": 1.5871, + "step": 13741 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021368477048403758, + "loss": 1.5526, + "step": 13742 + }, + { + "epoch": 1.08, + "learning_rate": 0.0002136735798130304, + "loss": 1.5245, + "step": 13743 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021366238870971477, + "loss": 1.5797, + "step": 13744 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021365119717416662, + "loss": 1.541, + "step": 13745 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021364000520646196, + "loss": 1.5175, + "step": 13746 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021362881280667683, + "loss": 1.5445, + "step": 13747 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021361761997488711, + "loss": 1.6199, + "step": 13748 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021360642671116892, + "loss": 1.6328, + "step": 13749 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021359523301559815, + "loss": 1.5415, + "step": 13750 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021358403888825086, + "loss": 1.567, + "step": 13751 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021357284432920305, + "loss": 1.58, + "step": 13752 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021356164933853067, + "loss": 1.4754, + "step": 13753 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021355045391630983, + "loss": 1.5454, + "step": 13754 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021353925806261642, + "loss": 1.5632, + "step": 13755 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021352806177752653, + "loss": 1.5678, + "step": 13756 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021351686506111613, + "loss": 1.5549, + "step": 13757 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021350566791346128, + "loss": 1.5182, + "step": 13758 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021349447033463804, + "loss": 1.5279, + "step": 13759 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021348327232472233, + "loss": 1.5534, + "step": 13760 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021347207388379026, + "loss": 1.5814, + "step": 13761 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021346087501191785, + "loss": 1.5881, + "step": 13762 + }, + { + "epoch": 1.08, + "learning_rate": 0.0002134496757091811, + "loss": 1.6034, + "step": 13763 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021343847597565604, + "loss": 1.5585, + "step": 13764 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021342727581141874, + "loss": 1.5602, + "step": 13765 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021341607521654528, + "loss": 1.5517, + "step": 13766 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021340487419111166, + "loss": 1.5326, + "step": 13767 + }, + { + "epoch": 1.08, + "learning_rate": 0.0002133936727351939, + "loss": 1.6128, + "step": 13768 + }, + { + "epoch": 1.08, + "learning_rate": 0.0002133824708488681, + "loss": 1.5648, + "step": 13769 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021337126853221034, + "loss": 1.5633, + "step": 13770 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021336006578529662, + "loss": 1.5098, + "step": 13771 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021334886260820294, + "loss": 1.5765, + "step": 13772 + }, + { + "epoch": 1.08, + "learning_rate": 0.0002133376590010055, + "loss": 1.5852, + "step": 13773 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021332645496378034, + "loss": 1.534, + "step": 13774 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021331525049660347, + "loss": 1.562, + "step": 13775 + }, + { + "epoch": 1.08, + "learning_rate": 0.000213304045599551, + "loss": 1.5563, + "step": 13776 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021329284027269899, + "loss": 1.5877, + "step": 13777 + }, + { + "epoch": 1.08, + "learning_rate": 0.0002132816345161235, + "loss": 1.5688, + "step": 13778 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021327042832990062, + "loss": 1.5748, + "step": 13779 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021325922171410648, + "loss": 1.558, + "step": 13780 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021324801466881716, + "loss": 1.5238, + "step": 13781 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021323680719410868, + "loss": 1.5598, + "step": 13782 + }, + { + "epoch": 1.08, + "learning_rate": 0.0002132255992900572, + "loss": 1.5432, + "step": 13783 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021321439095673875, + "loss": 1.5414, + "step": 13784 + }, + { + "epoch": 1.08, + "learning_rate": 0.0002132031821942295, + "loss": 1.5405, + "step": 13785 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021319197300260554, + "loss": 1.5485, + "step": 13786 + }, + { + "epoch": 1.08, + "learning_rate": 0.0002131807633819429, + "loss": 1.5231, + "step": 13787 + }, + { + "epoch": 1.08, + "learning_rate": 0.00021316955333231782, + "loss": 1.5259, + "step": 13788 + }, + { + "epoch": 1.08, + "learning_rate": 0.0002131583428538063, + "loss": 1.5796, + "step": 13789 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021314713194648443, + "loss": 1.5942, + "step": 13790 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021313592061042848, + "loss": 1.5776, + "step": 13791 + }, + { + "epoch": 1.09, + "learning_rate": 0.0002131247088457144, + "loss": 1.5367, + "step": 13792 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021311349665241843, + "loss": 1.5359, + "step": 13793 + }, + { + "epoch": 1.09, + "learning_rate": 0.0002131022840306166, + "loss": 1.6022, + "step": 13794 + }, + { + "epoch": 1.09, + "learning_rate": 0.0002130910709803851, + "loss": 1.5774, + "step": 13795 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021307985750180006, + "loss": 1.5854, + "step": 13796 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021306864359493756, + "loss": 1.5436, + "step": 13797 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021305742925987382, + "loss": 1.5997, + "step": 13798 + }, + { + "epoch": 1.09, + "learning_rate": 0.0002130462144966849, + "loss": 1.5488, + "step": 13799 + }, + { + "epoch": 1.09, + "learning_rate": 0.000213034999305447, + "loss": 1.5624, + "step": 13800 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021302378368623622, + "loss": 1.5119, + "step": 13801 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021301256763912876, + "loss": 1.5029, + "step": 13802 + }, + { + "epoch": 1.09, + "learning_rate": 0.0002130013511642007, + "loss": 1.5923, + "step": 13803 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021299013426152822, + "loss": 1.5796, + "step": 13804 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021297891693118753, + "loss": 1.5327, + "step": 13805 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021296769917325474, + "loss": 1.5372, + "step": 13806 + }, + { + "epoch": 1.09, + "learning_rate": 0.000212956480987806, + "loss": 1.5349, + "step": 13807 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021294526237491753, + "loss": 1.5378, + "step": 13808 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021293404333466546, + "loss": 1.5757, + "step": 13809 + }, + { + "epoch": 1.09, + "learning_rate": 0.000212922823867126, + "loss": 1.6138, + "step": 13810 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021291160397237516, + "loss": 1.5499, + "step": 13811 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021290038365048936, + "loss": 1.5468, + "step": 13812 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021288916290154462, + "loss": 1.5764, + "step": 13813 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021287794172561718, + "loss": 1.5457, + "step": 13814 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021286672012278327, + "loss": 1.5613, + "step": 13815 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021285549809311894, + "loss": 1.5826, + "step": 13816 + }, + { + "epoch": 1.09, + "learning_rate": 0.0002128442756367005, + "loss": 1.5504, + "step": 13817 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021283305275360414, + "loss": 1.5389, + "step": 13818 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021282182944390595, + "loss": 1.5738, + "step": 13819 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021281060570768227, + "loss": 1.547, + "step": 13820 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021279938154500922, + "loss": 1.5189, + "step": 13821 + }, + { + "epoch": 1.09, + "learning_rate": 0.000212788156955963, + "loss": 1.5524, + "step": 13822 + }, + { + "epoch": 1.09, + "learning_rate": 0.0002127769319406199, + "loss": 1.5781, + "step": 13823 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021276570649905602, + "loss": 1.5751, + "step": 13824 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021275448063134769, + "loss": 1.5833, + "step": 13825 + }, + { + "epoch": 1.09, + "learning_rate": 0.000212743254337571, + "loss": 1.4912, + "step": 13826 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021273202761780226, + "loss": 1.5541, + "step": 13827 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021272080047211766, + "loss": 1.5889, + "step": 13828 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021270957290059342, + "loss": 1.5226, + "step": 13829 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021269834490330588, + "loss": 1.6056, + "step": 13830 + }, + { + "epoch": 1.09, + "learning_rate": 0.0002126871164803311, + "loss": 1.6168, + "step": 13831 + }, + { + "epoch": 1.09, + "learning_rate": 0.0002126758876317454, + "loss": 1.5931, + "step": 13832 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021266465835762506, + "loss": 1.6113, + "step": 13833 + }, + { + "epoch": 1.09, + "learning_rate": 0.0002126534286580462, + "loss": 1.5632, + "step": 13834 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021264219853308516, + "loss": 1.5415, + "step": 13835 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021263096798281814, + "loss": 1.5912, + "step": 13836 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021261973700732148, + "loss": 1.4958, + "step": 13837 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021260850560667128, + "loss": 1.6392, + "step": 13838 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021259727378094399, + "loss": 1.5886, + "step": 13839 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021258604153021567, + "loss": 1.5307, + "step": 13840 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021257480885456263, + "loss": 1.5303, + "step": 13841 + }, + { + "epoch": 1.09, + "learning_rate": 0.0002125635757540612, + "loss": 1.5402, + "step": 13842 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021255234222878765, + "loss": 1.6114, + "step": 13843 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021254110827881821, + "loss": 1.5783, + "step": 13844 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021252987390422913, + "loss": 1.5468, + "step": 13845 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021251863910509673, + "loss": 1.514, + "step": 13846 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021250740388149727, + "loss": 1.5657, + "step": 13847 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021249616823350705, + "loss": 1.5558, + "step": 13848 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021248493216120235, + "loss": 1.5708, + "step": 13849 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021247369566465937, + "loss": 1.575, + "step": 13850 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021246245874395454, + "loss": 1.5768, + "step": 13851 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021245122139916403, + "loss": 1.5978, + "step": 13852 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021243998363036423, + "loss": 1.5075, + "step": 13853 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021242874543763137, + "loss": 1.5598, + "step": 13854 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021241750682104182, + "loss": 1.557, + "step": 13855 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021240626778067177, + "loss": 1.5863, + "step": 13856 + }, + { + "epoch": 1.09, + "learning_rate": 0.0002123950283165977, + "loss": 1.6094, + "step": 13857 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021238378842889573, + "loss": 1.4625, + "step": 13858 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021237254811764232, + "loss": 1.5202, + "step": 13859 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021236130738291371, + "loss": 1.5625, + "step": 13860 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021235006622478627, + "loss": 1.5865, + "step": 13861 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021233882464333624, + "loss": 1.5648, + "step": 13862 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021232758263864, + "loss": 1.5965, + "step": 13863 + }, + { + "epoch": 1.09, + "learning_rate": 0.0002123163402107739, + "loss": 1.5483, + "step": 13864 + }, + { + "epoch": 1.09, + "learning_rate": 0.0002123050973598142, + "loss": 1.5996, + "step": 13865 + }, + { + "epoch": 1.09, + "learning_rate": 0.0002122938540858373, + "loss": 1.571, + "step": 13866 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021228261038891947, + "loss": 1.5488, + "step": 13867 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021227136626913713, + "loss": 1.5791, + "step": 13868 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021226012172656655, + "loss": 1.5525, + "step": 13869 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021224887676128408, + "loss": 1.576, + "step": 13870 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021223763137336615, + "loss": 1.6368, + "step": 13871 + }, + { + "epoch": 1.09, + "learning_rate": 0.000212226385562889, + "loss": 1.5962, + "step": 13872 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021221513932992905, + "loss": 1.5591, + "step": 13873 + }, + { + "epoch": 1.09, + "learning_rate": 0.0002122038926745626, + "loss": 1.6336, + "step": 13874 + }, + { + "epoch": 1.09, + "learning_rate": 0.0002121926455968661, + "loss": 1.4603, + "step": 13875 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021218139809691587, + "loss": 1.5213, + "step": 13876 + }, + { + "epoch": 1.09, + "learning_rate": 0.0002121701501747882, + "loss": 1.532, + "step": 13877 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021215890183055958, + "loss": 1.5747, + "step": 13878 + }, + { + "epoch": 1.09, + "learning_rate": 0.0002121476530643063, + "loss": 1.5806, + "step": 13879 + }, + { + "epoch": 1.09, + "learning_rate": 0.0002121364038761047, + "loss": 1.5852, + "step": 13880 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021212515426603128, + "loss": 1.5849, + "step": 13881 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021211390423416226, + "loss": 1.5362, + "step": 13882 + }, + { + "epoch": 1.09, + "learning_rate": 0.0002121026537805742, + "loss": 1.6358, + "step": 13883 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021209140290534334, + "loss": 1.5562, + "step": 13884 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021208015160854613, + "loss": 1.5261, + "step": 13885 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021206889989025898, + "loss": 1.6102, + "step": 13886 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021205764775055817, + "loss": 1.5631, + "step": 13887 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021204639518952026, + "loss": 1.5715, + "step": 13888 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021203514220722154, + "loss": 1.5953, + "step": 13889 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021202388880373844, + "loss": 1.5464, + "step": 13890 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021201263497914734, + "loss": 1.5522, + "step": 13891 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021200138073352467, + "loss": 1.5674, + "step": 13892 + }, + { + "epoch": 1.09, + "learning_rate": 0.0002119901260669469, + "loss": 1.5636, + "step": 13893 + }, + { + "epoch": 1.09, + "learning_rate": 0.0002119788709794903, + "loss": 1.5445, + "step": 13894 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021196761547123143, + "loss": 1.5261, + "step": 13895 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021195635954224663, + "loss": 1.5577, + "step": 13896 + }, + { + "epoch": 1.09, + "learning_rate": 0.0002119451031926123, + "loss": 1.5505, + "step": 13897 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021193384642240494, + "loss": 1.5723, + "step": 13898 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021192258923170094, + "loss": 1.4838, + "step": 13899 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021191133162057677, + "loss": 1.5808, + "step": 13900 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021190007358910877, + "loss": 1.5297, + "step": 13901 + }, + { + "epoch": 1.09, + "learning_rate": 0.0002118888151373734, + "loss": 1.5353, + "step": 13902 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021187755626544722, + "loss": 1.5883, + "step": 13903 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021186629697340654, + "loss": 1.5986, + "step": 13904 + }, + { + "epoch": 1.09, + "learning_rate": 0.0002118550372613278, + "loss": 1.5825, + "step": 13905 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021184377712928754, + "loss": 1.6134, + "step": 13906 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021183251657736217, + "loss": 1.5559, + "step": 13907 + }, + { + "epoch": 1.09, + "learning_rate": 0.0002118212556056281, + "loss": 1.5542, + "step": 13908 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021180999421416182, + "loss": 1.5922, + "step": 13909 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021179873240303985, + "loss": 1.5638, + "step": 13910 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021178747017233852, + "loss": 1.6037, + "step": 13911 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021177620752213435, + "loss": 1.5903, + "step": 13912 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021176494445250386, + "loss": 1.5214, + "step": 13913 + }, + { + "epoch": 1.09, + "learning_rate": 0.0002117536809635235, + "loss": 1.5264, + "step": 13914 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021174241705526972, + "loss": 1.541, + "step": 13915 + }, + { + "epoch": 1.09, + "learning_rate": 0.00021173115272781897, + "loss": 1.5394, + "step": 13916 + }, + { + "epoch": 1.1, + "learning_rate": 0.0002117198879812478, + "loss": 1.6199, + "step": 13917 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021170862281563263, + "loss": 1.5475, + "step": 13918 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021169735723104995, + "loss": 1.5519, + "step": 13919 + }, + { + "epoch": 1.1, + "learning_rate": 0.0002116860912275763, + "loss": 1.5394, + "step": 13920 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021167482480528805, + "loss": 1.5534, + "step": 13921 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021166355796426185, + "loss": 1.5479, + "step": 13922 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021165229070457407, + "loss": 1.585, + "step": 13923 + }, + { + "epoch": 1.1, + "learning_rate": 0.0002116410230263013, + "loss": 1.5436, + "step": 13924 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021162975492952, + "loss": 1.5332, + "step": 13925 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021161848641430668, + "loss": 1.5104, + "step": 13926 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021160721748073781, + "loss": 1.5574, + "step": 13927 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021159594812888996, + "loss": 1.5953, + "step": 13928 + }, + { + "epoch": 1.1, + "learning_rate": 0.0002115846783588396, + "loss": 1.5845, + "step": 13929 + }, + { + "epoch": 1.1, + "learning_rate": 0.0002115734081706632, + "loss": 1.5458, + "step": 13930 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021156213756443743, + "loss": 1.5597, + "step": 13931 + }, + { + "epoch": 1.1, + "learning_rate": 0.0002115508665402387, + "loss": 1.5792, + "step": 13932 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021153959509814351, + "loss": 1.5594, + "step": 13933 + }, + { + "epoch": 1.1, + "learning_rate": 0.0002115283232382285, + "loss": 1.5197, + "step": 13934 + }, + { + "epoch": 1.1, + "learning_rate": 0.0002115170509605701, + "loss": 1.5555, + "step": 13935 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021150577826524483, + "loss": 1.588, + "step": 13936 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021149450515232926, + "loss": 1.558, + "step": 13937 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021148323162189996, + "loss": 1.5737, + "step": 13938 + }, + { + "epoch": 1.1, + "learning_rate": 0.0002114719576740335, + "loss": 1.56, + "step": 13939 + }, + { + "epoch": 1.1, + "learning_rate": 0.0002114606833088063, + "loss": 1.5487, + "step": 13940 + }, + { + "epoch": 1.1, + "learning_rate": 0.000211449408526295, + "loss": 1.5598, + "step": 13941 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021143813332657614, + "loss": 1.5791, + "step": 13942 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021142685770972623, + "loss": 1.5914, + "step": 13943 + }, + { + "epoch": 1.1, + "learning_rate": 0.0002114155816758219, + "loss": 1.6038, + "step": 13944 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021140430522493964, + "loss": 1.5565, + "step": 13945 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021139302835715602, + "loss": 1.5584, + "step": 13946 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021138175107254762, + "loss": 1.5309, + "step": 13947 + }, + { + "epoch": 1.1, + "learning_rate": 0.000211370473371191, + "loss": 1.5467, + "step": 13948 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021135919525316278, + "loss": 1.5472, + "step": 13949 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021134791671853942, + "loss": 1.4963, + "step": 13950 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021133663776739763, + "loss": 1.6412, + "step": 13951 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021132535839981381, + "loss": 1.5985, + "step": 13952 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021131407861586473, + "loss": 1.5974, + "step": 13953 + }, + { + "epoch": 1.1, + "learning_rate": 0.0002113027984156269, + "loss": 1.5475, + "step": 13954 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021129151779917683, + "loss": 1.5343, + "step": 13955 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021128023676659125, + "loss": 1.5411, + "step": 13956 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021126895531794665, + "loss": 1.5841, + "step": 13957 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021125767345331965, + "loss": 1.5409, + "step": 13958 + }, + { + "epoch": 1.1, + "learning_rate": 0.0002112463911727869, + "loss": 1.5481, + "step": 13959 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021123510847642483, + "loss": 1.615, + "step": 13960 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021122382536431028, + "loss": 1.582, + "step": 13961 + }, + { + "epoch": 1.1, + "learning_rate": 0.0002112125418365197, + "loss": 1.5786, + "step": 13962 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021120125789312978, + "loss": 1.5595, + "step": 13963 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021118997353421708, + "loss": 1.6043, + "step": 13964 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021117868875985816, + "loss": 1.5613, + "step": 13965 + }, + { + "epoch": 1.1, + "learning_rate": 0.0002111674035701298, + "loss": 1.4604, + "step": 13966 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021115611796510846, + "loss": 1.5411, + "step": 13967 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021114483194487082, + "loss": 1.5268, + "step": 13968 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021113354550949355, + "loss": 1.525, + "step": 13969 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021112225865905324, + "loss": 1.5501, + "step": 13970 + }, + { + "epoch": 1.1, + "learning_rate": 0.0002111109713936265, + "loss": 1.5782, + "step": 13971 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021109968371329002, + "loss": 1.5854, + "step": 13972 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021108839561812039, + "loss": 1.581, + "step": 13973 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021107710710819427, + "loss": 1.5723, + "step": 13974 + }, + { + "epoch": 1.1, + "learning_rate": 0.0002110658181835883, + "loss": 1.5653, + "step": 13975 + }, + { + "epoch": 1.1, + "learning_rate": 0.0002110545288443791, + "loss": 1.571, + "step": 13976 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021104323909064337, + "loss": 1.5209, + "step": 13977 + }, + { + "epoch": 1.1, + "learning_rate": 0.0002110319489224577, + "loss": 1.571, + "step": 13978 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021102065833989879, + "loss": 1.5689, + "step": 13979 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021100936734304334, + "loss": 1.5882, + "step": 13980 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021099807593196788, + "loss": 1.5008, + "step": 13981 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021098678410674915, + "loss": 1.5002, + "step": 13982 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021097549186746385, + "loss": 1.6167, + "step": 13983 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021096419921418856, + "loss": 1.5256, + "step": 13984 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021095290614700005, + "loss": 1.5665, + "step": 13985 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021094161266597492, + "loss": 1.5334, + "step": 13986 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021093031877118988, + "loss": 1.5243, + "step": 13987 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021091902446272162, + "loss": 1.5613, + "step": 13988 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021090772974064677, + "loss": 1.5416, + "step": 13989 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021089643460504205, + "loss": 1.5574, + "step": 13990 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021088513905598416, + "loss": 1.5301, + "step": 13991 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021087384309354974, + "loss": 1.575, + "step": 13992 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021086254671781555, + "loss": 1.5762, + "step": 13993 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021085124992885823, + "loss": 1.5349, + "step": 13994 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021083995272675452, + "loss": 1.4543, + "step": 13995 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021082865511158112, + "loss": 1.5655, + "step": 13996 + }, + { + "epoch": 1.1, + "learning_rate": 0.0002108173570834147, + "loss": 1.5856, + "step": 13997 + }, + { + "epoch": 1.1, + "learning_rate": 0.000210806058642332, + "loss": 1.5953, + "step": 13998 + }, + { + "epoch": 1.1, + "learning_rate": 0.0002107947597884097, + "loss": 1.5683, + "step": 13999 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021078346052172452, + "loss": 1.5182, + "step": 14000 + }, + { + "epoch": 1.1, + "learning_rate": 0.0002107721608423532, + "loss": 1.5809, + "step": 14001 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021076086075037248, + "loss": 1.4959, + "step": 14002 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021074956024585902, + "loss": 1.6144, + "step": 14003 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021073825932888953, + "loss": 1.5414, + "step": 14004 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021072695799954086, + "loss": 1.5278, + "step": 14005 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021071565625788957, + "loss": 1.5965, + "step": 14006 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021070435410401253, + "loss": 1.5578, + "step": 14007 + }, + { + "epoch": 1.1, + "learning_rate": 0.0002106930515379864, + "loss": 1.5797, + "step": 14008 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021068174855988798, + "loss": 1.5231, + "step": 14009 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021067044516979395, + "loss": 1.5467, + "step": 14010 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021065914136778106, + "loss": 1.5759, + "step": 14011 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021064783715392613, + "loss": 1.5199, + "step": 14012 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021063653252830582, + "loss": 1.596, + "step": 14013 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021062522749099692, + "loss": 1.5897, + "step": 14014 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021061392204207614, + "loss": 1.5442, + "step": 14015 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021060261618162032, + "loss": 1.5129, + "step": 14016 + }, + { + "epoch": 1.1, + "learning_rate": 0.0002105913099097062, + "loss": 1.5503, + "step": 14017 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021058000322641046, + "loss": 1.5646, + "step": 14018 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021056869613181003, + "loss": 1.5562, + "step": 14019 + }, + { + "epoch": 1.1, + "learning_rate": 0.0002105573886259815, + "loss": 1.5391, + "step": 14020 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021054608070900172, + "loss": 1.5843, + "step": 14021 + }, + { + "epoch": 1.1, + "learning_rate": 0.0002105347723809475, + "loss": 1.5607, + "step": 14022 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021052346364189555, + "loss": 1.5326, + "step": 14023 + }, + { + "epoch": 1.1, + "learning_rate": 0.0002105121544919227, + "loss": 1.5503, + "step": 14024 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021050084493110565, + "loss": 1.5426, + "step": 14025 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021048953495952133, + "loss": 1.5291, + "step": 14026 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021047822457724645, + "loss": 1.5636, + "step": 14027 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021046691378435772, + "loss": 1.5614, + "step": 14028 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021045560258093214, + "loss": 1.5779, + "step": 14029 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021044429096704628, + "loss": 1.641, + "step": 14030 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021043297894277708, + "loss": 1.5975, + "step": 14031 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021042166650820125, + "loss": 1.5402, + "step": 14032 + }, + { + "epoch": 1.1, + "learning_rate": 0.0002104103536633957, + "loss": 1.5411, + "step": 14033 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021039904040843718, + "loss": 1.5675, + "step": 14034 + }, + { + "epoch": 1.1, + "learning_rate": 0.0002103877267434025, + "loss": 1.5845, + "step": 14035 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021037641266836852, + "loss": 1.5508, + "step": 14036 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021036509818341196, + "loss": 1.5363, + "step": 14037 + }, + { + "epoch": 1.1, + "learning_rate": 0.0002103537832886097, + "loss": 1.5639, + "step": 14038 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021034246798403857, + "loss": 1.5491, + "step": 14039 + }, + { + "epoch": 1.1, + "learning_rate": 0.0002103311522697754, + "loss": 1.5932, + "step": 14040 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021031983614589698, + "loss": 1.5851, + "step": 14041 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021030851961248017, + "loss": 1.5819, + "step": 14042 + }, + { + "epoch": 1.1, + "learning_rate": 0.00021029720266960175, + "loss": 1.4933, + "step": 14043 + }, + { + "epoch": 1.11, + "learning_rate": 0.00021028588531733867, + "loss": 1.5601, + "step": 14044 + }, + { + "epoch": 1.11, + "learning_rate": 0.00021027456755576764, + "loss": 1.5612, + "step": 14045 + }, + { + "epoch": 1.11, + "learning_rate": 0.00021026324938496562, + "loss": 1.5005, + "step": 14046 + }, + { + "epoch": 1.11, + "learning_rate": 0.00021025193080500933, + "loss": 1.5618, + "step": 14047 + }, + { + "epoch": 1.11, + "learning_rate": 0.0002102406118159757, + "loss": 1.5106, + "step": 14048 + }, + { + "epoch": 1.11, + "learning_rate": 0.00021022929241794154, + "loss": 1.5267, + "step": 14049 + }, + { + "epoch": 1.11, + "learning_rate": 0.00021021797261098373, + "loss": 1.5172, + "step": 14050 + }, + { + "epoch": 1.11, + "learning_rate": 0.00021020665239517917, + "loss": 1.5936, + "step": 14051 + }, + { + "epoch": 1.11, + "learning_rate": 0.0002101953317706046, + "loss": 1.5525, + "step": 14052 + }, + { + "epoch": 1.11, + "learning_rate": 0.000210184010737337, + "loss": 1.5053, + "step": 14053 + }, + { + "epoch": 1.11, + "learning_rate": 0.00021017268929545313, + "loss": 1.5676, + "step": 14054 + }, + { + "epoch": 1.11, + "learning_rate": 0.00021016136744502988, + "loss": 1.5684, + "step": 14055 + }, + { + "epoch": 1.11, + "learning_rate": 0.00021015004518614425, + "loss": 1.547, + "step": 14056 + }, + { + "epoch": 1.11, + "learning_rate": 0.00021013872251887295, + "loss": 1.5217, + "step": 14057 + }, + { + "epoch": 1.11, + "learning_rate": 0.0002101273994432929, + "loss": 1.6049, + "step": 14058 + }, + { + "epoch": 1.11, + "learning_rate": 0.000210116075959481, + "loss": 1.5761, + "step": 14059 + }, + { + "epoch": 1.11, + "learning_rate": 0.0002101047520675141, + "loss": 1.6092, + "step": 14060 + }, + { + "epoch": 1.11, + "learning_rate": 0.00021009342776746916, + "loss": 1.5839, + "step": 14061 + }, + { + "epoch": 1.11, + "learning_rate": 0.0002100821030594229, + "loss": 1.5396, + "step": 14062 + }, + { + "epoch": 1.11, + "learning_rate": 0.00021007077794345241, + "loss": 1.6007, + "step": 14063 + }, + { + "epoch": 1.11, + "learning_rate": 0.00021005945241963443, + "loss": 1.6015, + "step": 14064 + }, + { + "epoch": 1.11, + "learning_rate": 0.00021004812648804598, + "loss": 1.5017, + "step": 14065 + }, + { + "epoch": 1.11, + "learning_rate": 0.00021003680014876385, + "loss": 1.5242, + "step": 14066 + }, + { + "epoch": 1.11, + "learning_rate": 0.000210025473401865, + "loss": 1.5939, + "step": 14067 + }, + { + "epoch": 1.11, + "learning_rate": 0.0002100141462474263, + "loss": 1.5711, + "step": 14068 + }, + { + "epoch": 1.11, + "learning_rate": 0.00021000281868552463, + "loss": 1.5783, + "step": 14069 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020999149071623696, + "loss": 1.5689, + "step": 14070 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020998016233964018, + "loss": 1.5515, + "step": 14071 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020996883355581117, + "loss": 1.5521, + "step": 14072 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020995750436482688, + "loss": 1.6229, + "step": 14073 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020994617476676424, + "loss": 1.558, + "step": 14074 + }, + { + "epoch": 1.11, + "learning_rate": 0.0002099348447617002, + "loss": 1.5694, + "step": 14075 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020992351434971155, + "loss": 1.6166, + "step": 14076 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020991218353087534, + "loss": 1.5689, + "step": 14077 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020990085230526847, + "loss": 1.5551, + "step": 14078 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020988952067296784, + "loss": 1.5417, + "step": 14079 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020987818863405048, + "loss": 1.5546, + "step": 14080 + }, + { + "epoch": 1.11, + "learning_rate": 0.0002098668561885932, + "loss": 1.5367, + "step": 14081 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020985552333667304, + "loss": 1.5438, + "step": 14082 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020984419007836694, + "loss": 1.5822, + "step": 14083 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020983285641375176, + "loss": 1.5821, + "step": 14084 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020982152234290453, + "loss": 1.5807, + "step": 14085 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020981018786590211, + "loss": 1.5581, + "step": 14086 + }, + { + "epoch": 1.11, + "learning_rate": 0.0002097988529828216, + "loss": 1.5619, + "step": 14087 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020978751769373983, + "loss": 1.555, + "step": 14088 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020977618199873385, + "loss": 1.5862, + "step": 14089 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020976484589788056, + "loss": 1.5497, + "step": 14090 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020975350939125695, + "loss": 1.6064, + "step": 14091 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020974217247894, + "loss": 1.5764, + "step": 14092 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020973083516100666, + "loss": 1.5851, + "step": 14093 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020971949743753385, + "loss": 1.5234, + "step": 14094 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020970815930859867, + "loss": 1.5808, + "step": 14095 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020969682077427802, + "loss": 1.5662, + "step": 14096 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020968548183464896, + "loss": 1.5689, + "step": 14097 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020967414248978833, + "loss": 1.5077, + "step": 14098 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020966280273977323, + "loss": 1.5671, + "step": 14099 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020965146258468065, + "loss": 1.6022, + "step": 14100 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020964012202458754, + "loss": 1.545, + "step": 14101 + }, + { + "epoch": 1.11, + "learning_rate": 0.0002096287810595709, + "loss": 1.5582, + "step": 14102 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020961743968970773, + "loss": 1.573, + "step": 14103 + }, + { + "epoch": 1.11, + "learning_rate": 0.0002096060979150751, + "loss": 1.524, + "step": 14104 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020959475573574993, + "loss": 1.5784, + "step": 14105 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020958341315180923, + "loss": 1.5673, + "step": 14106 + }, + { + "epoch": 1.11, + "learning_rate": 0.0002095720701633301, + "loss": 1.5608, + "step": 14107 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020956072677038941, + "loss": 1.5375, + "step": 14108 + }, + { + "epoch": 1.11, + "learning_rate": 0.0002095493829730643, + "loss": 1.5894, + "step": 14109 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020953803877143173, + "loss": 1.5543, + "step": 14110 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020952669416556872, + "loss": 1.5085, + "step": 14111 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020951534915555233, + "loss": 1.5625, + "step": 14112 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020950400374145957, + "loss": 1.5538, + "step": 14113 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020949265792336746, + "loss": 1.6039, + "step": 14114 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020948131170135298, + "loss": 1.5406, + "step": 14115 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020946996507549328, + "loss": 1.5875, + "step": 14116 + }, + { + "epoch": 1.11, + "learning_rate": 0.0002094586180458653, + "loss": 1.5798, + "step": 14117 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020944727061254613, + "loss": 1.5826, + "step": 14118 + }, + { + "epoch": 1.11, + "learning_rate": 0.0002094359227756128, + "loss": 1.5351, + "step": 14119 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020942457453514235, + "loss": 1.5593, + "step": 14120 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020941322589121186, + "loss": 1.5655, + "step": 14121 + }, + { + "epoch": 1.11, + "learning_rate": 0.0002094018768438983, + "loss": 1.5599, + "step": 14122 + }, + { + "epoch": 1.11, + "learning_rate": 0.0002093905273932788, + "loss": 1.5984, + "step": 14123 + }, + { + "epoch": 1.11, + "learning_rate": 0.0002093791775394304, + "loss": 1.5573, + "step": 14124 + }, + { + "epoch": 1.11, + "learning_rate": 0.0002093678272824301, + "loss": 1.5151, + "step": 14125 + }, + { + "epoch": 1.11, + "learning_rate": 0.0002093564766223551, + "loss": 1.546, + "step": 14126 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020934512555928234, + "loss": 1.5618, + "step": 14127 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020933377409328892, + "loss": 1.6309, + "step": 14128 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020932242222445195, + "loss": 1.5973, + "step": 14129 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020931106995284842, + "loss": 1.5747, + "step": 14130 + }, + { + "epoch": 1.11, + "learning_rate": 0.0002092997172785555, + "loss": 1.5441, + "step": 14131 + }, + { + "epoch": 1.11, + "learning_rate": 0.0002092883642016502, + "loss": 1.5799, + "step": 14132 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020927701072220961, + "loss": 1.5311, + "step": 14133 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020926565684031086, + "loss": 1.5518, + "step": 14134 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020925430255603098, + "loss": 1.5769, + "step": 14135 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020924294786944713, + "loss": 1.5832, + "step": 14136 + }, + { + "epoch": 1.11, + "learning_rate": 0.0002092315927806363, + "loss": 1.5792, + "step": 14137 + }, + { + "epoch": 1.11, + "learning_rate": 0.0002092202372896757, + "loss": 1.5756, + "step": 14138 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020920888139664234, + "loss": 1.57, + "step": 14139 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020919752510161334, + "loss": 1.5803, + "step": 14140 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020918616840466582, + "loss": 1.5246, + "step": 14141 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020917481130587682, + "loss": 1.5561, + "step": 14142 + }, + { + "epoch": 1.11, + "learning_rate": 0.0002091634538053236, + "loss": 1.5225, + "step": 14143 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020915209590308316, + "loss": 1.5596, + "step": 14144 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020914073759923258, + "loss": 1.526, + "step": 14145 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020912937889384909, + "loss": 1.5868, + "step": 14146 + }, + { + "epoch": 1.11, + "learning_rate": 0.0002091180197870097, + "loss": 1.5535, + "step": 14147 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020910666027879166, + "loss": 1.5867, + "step": 14148 + }, + { + "epoch": 1.11, + "learning_rate": 0.0002090953003692719, + "loss": 1.5907, + "step": 14149 + }, + { + "epoch": 1.11, + "learning_rate": 0.0002090839400585277, + "loss": 1.5322, + "step": 14150 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020907257934663618, + "loss": 1.5537, + "step": 14151 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020906121823367445, + "loss": 1.5624, + "step": 14152 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020904985671971963, + "loss": 1.5604, + "step": 14153 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020903849480484885, + "loss": 1.5446, + "step": 14154 + }, + { + "epoch": 1.11, + "learning_rate": 0.0002090271324891393, + "loss": 1.5466, + "step": 14155 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020901576977266808, + "loss": 1.5699, + "step": 14156 + }, + { + "epoch": 1.11, + "learning_rate": 0.0002090044066555123, + "loss": 1.5679, + "step": 14157 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020899304313774924, + "loss": 1.5274, + "step": 14158 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020898167921945594, + "loss": 1.5488, + "step": 14159 + }, + { + "epoch": 1.11, + "learning_rate": 0.0002089703149007096, + "loss": 1.5401, + "step": 14160 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020895895018158736, + "loss": 1.5092, + "step": 14161 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020894758506216635, + "loss": 1.5412, + "step": 14162 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020893621954252382, + "loss": 1.5187, + "step": 14163 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020892485362273685, + "loss": 1.5455, + "step": 14164 + }, + { + "epoch": 1.11, + "learning_rate": 0.0002089134873028826, + "loss": 1.5305, + "step": 14165 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020890212058303836, + "loss": 1.5918, + "step": 14166 + }, + { + "epoch": 1.11, + "learning_rate": 0.0002088907534632812, + "loss": 1.5512, + "step": 14167 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020887938594368833, + "loss": 1.6142, + "step": 14168 + }, + { + "epoch": 1.11, + "learning_rate": 0.0002088680180243369, + "loss": 1.5171, + "step": 14169 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020885664970530414, + "loss": 1.5836, + "step": 14170 + }, + { + "epoch": 1.11, + "learning_rate": 0.00020884528098666719, + "loss": 1.5951, + "step": 14171 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020883391186850324, + "loss": 1.5551, + "step": 14172 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020882254235088951, + "loss": 1.5678, + "step": 14173 + }, + { + "epoch": 1.12, + "learning_rate": 0.0002088111724339032, + "loss": 1.5216, + "step": 14174 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020879980211762147, + "loss": 1.6171, + "step": 14175 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020878843140212153, + "loss": 1.5851, + "step": 14176 + }, + { + "epoch": 1.12, + "learning_rate": 0.0002087770602874806, + "loss": 1.4874, + "step": 14177 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020876568877377583, + "loss": 1.5775, + "step": 14178 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020875431686108448, + "loss": 1.5532, + "step": 14179 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020874294454948373, + "loss": 1.578, + "step": 14180 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020873157183905078, + "loss": 1.4725, + "step": 14181 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020872019872986294, + "loss": 1.5869, + "step": 14182 + }, + { + "epoch": 1.12, + "learning_rate": 0.0002087088252219973, + "loss": 1.612, + "step": 14183 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020869745131553118, + "loss": 1.5933, + "step": 14184 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020868607701054174, + "loss": 1.5696, + "step": 14185 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020867470230710622, + "loss": 1.6297, + "step": 14186 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020866332720530185, + "loss": 1.5825, + "step": 14187 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020865195170520585, + "loss": 1.5653, + "step": 14188 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020864057580689544, + "loss": 1.552, + "step": 14189 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020862919951044795, + "loss": 1.5456, + "step": 14190 + }, + { + "epoch": 1.12, + "learning_rate": 0.0002086178228159405, + "loss": 1.5655, + "step": 14191 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020860644572345038, + "loss": 1.5712, + "step": 14192 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020859506823305482, + "loss": 1.5846, + "step": 14193 + }, + { + "epoch": 1.12, + "learning_rate": 0.0002085836903448311, + "loss": 1.5467, + "step": 14194 + }, + { + "epoch": 1.12, + "learning_rate": 0.0002085723120588565, + "loss": 1.5991, + "step": 14195 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020856093337520815, + "loss": 1.5762, + "step": 14196 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020854955429396344, + "loss": 1.5453, + "step": 14197 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020853817481519954, + "loss": 1.5632, + "step": 14198 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020852679493899376, + "loss": 1.6024, + "step": 14199 + }, + { + "epoch": 1.12, + "learning_rate": 0.0002085154146654233, + "loss": 1.5557, + "step": 14200 + }, + { + "epoch": 1.12, + "learning_rate": 0.0002085040339945655, + "loss": 1.5576, + "step": 14201 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020849265292649757, + "loss": 1.5882, + "step": 14202 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020848127146129683, + "loss": 1.5929, + "step": 14203 + }, + { + "epoch": 1.12, + "learning_rate": 0.0002084698895990405, + "loss": 1.5091, + "step": 14204 + }, + { + "epoch": 1.12, + "learning_rate": 0.0002084585073398059, + "loss": 1.5361, + "step": 14205 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020844712468367027, + "loss": 1.5679, + "step": 14206 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020843574163071095, + "loss": 1.5711, + "step": 14207 + }, + { + "epoch": 1.12, + "learning_rate": 0.0002084243581810052, + "loss": 1.5248, + "step": 14208 + }, + { + "epoch": 1.12, + "learning_rate": 0.0002084129743346303, + "loss": 1.5382, + "step": 14209 + }, + { + "epoch": 1.12, + "learning_rate": 0.0002084015900916635, + "loss": 1.5548, + "step": 14210 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020839020545218215, + "loss": 1.6118, + "step": 14211 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020837882041626352, + "loss": 1.5438, + "step": 14212 + }, + { + "epoch": 1.12, + "learning_rate": 0.0002083674349839849, + "loss": 1.5891, + "step": 14213 + }, + { + "epoch": 1.12, + "learning_rate": 0.0002083560491554237, + "loss": 1.586, + "step": 14214 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020834466293065705, + "loss": 1.5301, + "step": 14215 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020833327630976237, + "loss": 1.5828, + "step": 14216 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020832188929281688, + "loss": 1.5634, + "step": 14217 + }, + { + "epoch": 1.12, + "learning_rate": 0.000208310501879898, + "loss": 1.5976, + "step": 14218 + }, + { + "epoch": 1.12, + "learning_rate": 0.000208299114071083, + "loss": 1.5612, + "step": 14219 + }, + { + "epoch": 1.12, + "learning_rate": 0.0002082877258664491, + "loss": 1.5702, + "step": 14220 + }, + { + "epoch": 1.12, + "learning_rate": 0.0002082763372660738, + "loss": 1.5349, + "step": 14221 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020826494827003427, + "loss": 1.602, + "step": 14222 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020825355887840792, + "loss": 1.5905, + "step": 14223 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020824216909127205, + "loss": 1.5802, + "step": 14224 + }, + { + "epoch": 1.12, + "learning_rate": 0.000208230778908704, + "loss": 1.5204, + "step": 14225 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020821938833078113, + "loss": 1.5833, + "step": 14226 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020820799735758066, + "loss": 1.5975, + "step": 14227 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020819660598918004, + "loss": 1.5918, + "step": 14228 + }, + { + "epoch": 1.12, + "learning_rate": 0.0002081852142256566, + "loss": 1.5732, + "step": 14229 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020817382206708766, + "loss": 1.58, + "step": 14230 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020816242951355058, + "loss": 1.6128, + "step": 14231 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020815103656512268, + "loss": 1.6127, + "step": 14232 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020813964322188134, + "loss": 1.5895, + "step": 14233 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020812824948390394, + "loss": 1.6027, + "step": 14234 + }, + { + "epoch": 1.12, + "learning_rate": 0.0002081168553512677, + "loss": 1.5199, + "step": 14235 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020810546082405018, + "loss": 1.547, + "step": 14236 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020809406590232863, + "loss": 1.5548, + "step": 14237 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020808267058618045, + "loss": 1.5575, + "step": 14238 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020807127487568295, + "loss": 1.5372, + "step": 14239 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020805987877091354, + "loss": 1.5822, + "step": 14240 + }, + { + "epoch": 1.12, + "learning_rate": 0.0002080484822719496, + "loss": 1.5094, + "step": 14241 + }, + { + "epoch": 1.12, + "learning_rate": 0.0002080370853788685, + "loss": 1.6101, + "step": 14242 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020802568809174764, + "loss": 1.5215, + "step": 14243 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020801429041066434, + "loss": 1.5469, + "step": 14244 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020800289233569608, + "loss": 1.5, + "step": 14245 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020799149386692013, + "loss": 1.5535, + "step": 14246 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020798009500441395, + "loss": 1.5396, + "step": 14247 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020796869574825496, + "loss": 1.5777, + "step": 14248 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020795729609852047, + "loss": 1.5296, + "step": 14249 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020794589605528793, + "loss": 1.5724, + "step": 14250 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020793449561863476, + "loss": 1.5531, + "step": 14251 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020792309478863828, + "loss": 1.4807, + "step": 14252 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020791169356537602, + "loss": 1.5591, + "step": 14253 + }, + { + "epoch": 1.12, + "learning_rate": 0.0002079002919489253, + "loss": 1.5227, + "step": 14254 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020788888993936356, + "loss": 1.5413, + "step": 14255 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020787748753676817, + "loss": 1.5395, + "step": 14256 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020786608474121659, + "loss": 1.5476, + "step": 14257 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020785468155278623, + "loss": 1.5761, + "step": 14258 + }, + { + "epoch": 1.12, + "learning_rate": 0.0002078432779715545, + "loss": 1.575, + "step": 14259 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020783187399759883, + "loss": 1.5238, + "step": 14260 + }, + { + "epoch": 1.12, + "learning_rate": 0.0002078204696309967, + "loss": 1.5769, + "step": 14261 + }, + { + "epoch": 1.12, + "learning_rate": 0.0002078090648718254, + "loss": 1.5676, + "step": 14262 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020779765972016255, + "loss": 1.55, + "step": 14263 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020778625417608543, + "loss": 1.5506, + "step": 14264 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020777484823967154, + "loss": 1.549, + "step": 14265 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020776344191099832, + "loss": 1.5385, + "step": 14266 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020775203519014318, + "loss": 1.6073, + "step": 14267 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020774062807718362, + "loss": 1.6087, + "step": 14268 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020772922057219707, + "loss": 1.5628, + "step": 14269 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020771781267526097, + "loss": 1.5644, + "step": 14270 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020770640438645273, + "loss": 1.565, + "step": 14271 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020769499570584988, + "loss": 1.5743, + "step": 14272 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020768358663352988, + "loss": 1.5265, + "step": 14273 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020767217716957008, + "loss": 1.5092, + "step": 14274 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020766076731404805, + "loss": 1.5631, + "step": 14275 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020764935706704123, + "loss": 1.5967, + "step": 14276 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020763794642862714, + "loss": 1.5578, + "step": 14277 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020762653539888317, + "loss": 1.5124, + "step": 14278 + }, + { + "epoch": 1.12, + "learning_rate": 0.0002076151239778868, + "loss": 1.5642, + "step": 14279 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020760371216571558, + "loss": 1.6092, + "step": 14280 + }, + { + "epoch": 1.12, + "learning_rate": 0.0002075922999624469, + "loss": 1.5421, + "step": 14281 + }, + { + "epoch": 1.12, + "learning_rate": 0.0002075808873681583, + "loss": 1.5477, + "step": 14282 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020756947438292723, + "loss": 1.5358, + "step": 14283 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020755806100683125, + "loss": 1.5136, + "step": 14284 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020754664723994775, + "loss": 1.5384, + "step": 14285 + }, + { + "epoch": 1.12, + "learning_rate": 0.0002075352330823543, + "loss": 1.5564, + "step": 14286 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020752381853412837, + "loss": 1.5123, + "step": 14287 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020751240359534744, + "loss": 1.5553, + "step": 14288 + }, + { + "epoch": 1.12, + "learning_rate": 0.000207500988266089, + "loss": 1.5203, + "step": 14289 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020748957254643061, + "loss": 1.5947, + "step": 14290 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020747815643644977, + "loss": 1.5764, + "step": 14291 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020746673993622395, + "loss": 1.5315, + "step": 14292 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020745532304583067, + "loss": 1.4287, + "step": 14293 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020744390576534746, + "loss": 1.565, + "step": 14294 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020743248809485182, + "loss": 1.5466, + "step": 14295 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020742107003442133, + "loss": 1.5157, + "step": 14296 + }, + { + "epoch": 1.12, + "learning_rate": 0.00020740965158413344, + "loss": 1.5826, + "step": 14297 + }, + { + "epoch": 1.12, + "learning_rate": 0.0002073982327440656, + "loss": 1.5141, + "step": 14298 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020738681351429556, + "loss": 1.5434, + "step": 14299 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020737539389490065, + "loss": 1.6036, + "step": 14300 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020736397388595854, + "loss": 1.6009, + "step": 14301 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020735255348754668, + "loss": 1.5404, + "step": 14302 + }, + { + "epoch": 1.13, + "learning_rate": 0.0002073411326997426, + "loss": 1.5675, + "step": 14303 + }, + { + "epoch": 1.13, + "learning_rate": 0.0002073297115226239, + "loss": 1.5867, + "step": 14304 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020731828995626807, + "loss": 1.5289, + "step": 14305 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020730686800075272, + "loss": 1.5168, + "step": 14306 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020729544565615534, + "loss": 1.533, + "step": 14307 + }, + { + "epoch": 1.13, + "learning_rate": 0.0002072840229225535, + "loss": 1.5603, + "step": 14308 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020727259980002477, + "loss": 1.4877, + "step": 14309 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020726117628864666, + "loss": 1.5948, + "step": 14310 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020724975238849684, + "loss": 1.535, + "step": 14311 + }, + { + "epoch": 1.13, + "learning_rate": 0.0002072383280996527, + "loss": 1.5463, + "step": 14312 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020722690342219193, + "loss": 1.5861, + "step": 14313 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020721547835619207, + "loss": 1.5362, + "step": 14314 + }, + { + "epoch": 1.13, + "learning_rate": 0.0002072040529017307, + "loss": 1.5834, + "step": 14315 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020719262705888537, + "loss": 1.5628, + "step": 14316 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020718120082773367, + "loss": 1.5439, + "step": 14317 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020716977420835316, + "loss": 1.5061, + "step": 14318 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020715834720082146, + "loss": 1.4814, + "step": 14319 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020714691980521608, + "loss": 1.5309, + "step": 14320 + }, + { + "epoch": 1.13, + "learning_rate": 0.0002071354920216147, + "loss": 1.5161, + "step": 14321 + }, + { + "epoch": 1.13, + "learning_rate": 0.0002071240638500948, + "loss": 1.5294, + "step": 14322 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020711263529073407, + "loss": 1.5654, + "step": 14323 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020710120634361007, + "loss": 1.5601, + "step": 14324 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020708977700880035, + "loss": 1.556, + "step": 14325 + }, + { + "epoch": 1.13, + "learning_rate": 0.0002070783472863826, + "loss": 1.557, + "step": 14326 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020706691717643433, + "loss": 1.5257, + "step": 14327 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020705548667903324, + "loss": 1.5382, + "step": 14328 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020704405579425683, + "loss": 1.5226, + "step": 14329 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020703262452218275, + "loss": 1.5727, + "step": 14330 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020702119286288863, + "loss": 1.6115, + "step": 14331 + }, + { + "epoch": 1.13, + "learning_rate": 0.0002070097608164521, + "loss": 1.5604, + "step": 14332 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020699832838295078, + "loss": 1.5373, + "step": 14333 + }, + { + "epoch": 1.13, + "learning_rate": 0.0002069868955624622, + "loss": 1.6019, + "step": 14334 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020697546235506407, + "loss": 1.5751, + "step": 14335 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020696402876083404, + "loss": 1.527, + "step": 14336 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020695259477984963, + "loss": 1.5525, + "step": 14337 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020694116041218853, + "loss": 1.5534, + "step": 14338 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020692972565792842, + "loss": 1.5374, + "step": 14339 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020691829051714688, + "loss": 1.5195, + "step": 14340 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020690685498992155, + "loss": 1.566, + "step": 14341 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020689541907633005, + "loss": 1.5075, + "step": 14342 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020688398277645008, + "loss": 1.5677, + "step": 14343 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020687254609035925, + "loss": 1.5852, + "step": 14344 + }, + { + "epoch": 1.13, + "learning_rate": 0.0002068611090181352, + "loss": 1.5905, + "step": 14345 + }, + { + "epoch": 1.13, + "learning_rate": 0.0002068496715598556, + "loss": 1.6193, + "step": 14346 + }, + { + "epoch": 1.13, + "learning_rate": 0.0002068382337155981, + "loss": 1.5077, + "step": 14347 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020682679548544042, + "loss": 1.5871, + "step": 14348 + }, + { + "epoch": 1.13, + "learning_rate": 0.0002068153568694601, + "loss": 1.5442, + "step": 14349 + }, + { + "epoch": 1.13, + "learning_rate": 0.0002068039178677349, + "loss": 1.5439, + "step": 14350 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020679247848034242, + "loss": 1.55, + "step": 14351 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020678103870736033, + "loss": 1.5095, + "step": 14352 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020676959854886633, + "loss": 1.5191, + "step": 14353 + }, + { + "epoch": 1.13, + "learning_rate": 0.0002067581580049381, + "loss": 1.5933, + "step": 14354 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020674671707565333, + "loss": 1.5696, + "step": 14355 + }, + { + "epoch": 1.13, + "learning_rate": 0.0002067352757610896, + "loss": 1.5431, + "step": 14356 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020672383406132472, + "loss": 1.567, + "step": 14357 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020671239197643626, + "loss": 1.5631, + "step": 14358 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020670094950650194, + "loss": 1.6025, + "step": 14359 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020668950665159953, + "loss": 1.528, + "step": 14360 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020667806341180658, + "loss": 1.5426, + "step": 14361 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020666661978720093, + "loss": 1.5392, + "step": 14362 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020665517577786018, + "loss": 1.5593, + "step": 14363 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020664373138386204, + "loss": 1.5992, + "step": 14364 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020663228660528423, + "loss": 1.5317, + "step": 14365 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020662084144220443, + "loss": 1.6087, + "step": 14366 + }, + { + "epoch": 1.13, + "learning_rate": 0.0002066093958947004, + "loss": 1.5361, + "step": 14367 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020659794996284977, + "loss": 1.5642, + "step": 14368 + }, + { + "epoch": 1.13, + "learning_rate": 0.0002065865036467303, + "loss": 1.5178, + "step": 14369 + }, + { + "epoch": 1.13, + "learning_rate": 0.0002065750569464197, + "loss": 1.5648, + "step": 14370 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020656360986199567, + "loss": 1.5135, + "step": 14371 + }, + { + "epoch": 1.13, + "learning_rate": 0.000206552162393536, + "loss": 1.558, + "step": 14372 + }, + { + "epoch": 1.13, + "learning_rate": 0.0002065407145411183, + "loss": 1.5597, + "step": 14373 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020652926630482035, + "loss": 1.5782, + "step": 14374 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020651781768471993, + "loss": 1.4993, + "step": 14375 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020650636868089467, + "loss": 1.5416, + "step": 14376 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020649491929342236, + "loss": 1.5124, + "step": 14377 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020648346952238073, + "loss": 1.5843, + "step": 14378 + }, + { + "epoch": 1.13, + "learning_rate": 0.0002064720193678475, + "loss": 1.5904, + "step": 14379 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020646056882990042, + "loss": 1.5491, + "step": 14380 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020644911790861727, + "loss": 1.5729, + "step": 14381 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020643766660407575, + "loss": 1.6006, + "step": 14382 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020642621491635357, + "loss": 1.5493, + "step": 14383 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020641476284552861, + "loss": 1.5444, + "step": 14384 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020640331039167845, + "loss": 1.5296, + "step": 14385 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020639185755488103, + "loss": 1.599, + "step": 14386 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020638040433521395, + "loss": 1.559, + "step": 14387 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020636895073275501, + "loss": 1.5453, + "step": 14388 + }, + { + "epoch": 1.13, + "learning_rate": 0.0002063574967475821, + "loss": 1.5668, + "step": 14389 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020634604237977283, + "loss": 1.5308, + "step": 14390 + }, + { + "epoch": 1.13, + "learning_rate": 0.000206334587629405, + "loss": 1.5806, + "step": 14391 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020632313249655646, + "loss": 1.5623, + "step": 14392 + }, + { + "epoch": 1.13, + "learning_rate": 0.0002063116769813049, + "loss": 1.5953, + "step": 14393 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020630022108372817, + "loss": 1.5306, + "step": 14394 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020628876480390396, + "loss": 1.5218, + "step": 14395 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020627730814191014, + "loss": 1.498, + "step": 14396 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020626585109782442, + "loss": 1.5399, + "step": 14397 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020625439367172465, + "loss": 1.6219, + "step": 14398 + }, + { + "epoch": 1.13, + "learning_rate": 0.0002062429358636886, + "loss": 1.5434, + "step": 14399 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020623147767379396, + "loss": 1.5971, + "step": 14400 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020622001910211875, + "loss": 1.5177, + "step": 14401 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020620856014874056, + "loss": 1.5602, + "step": 14402 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020619710081373727, + "loss": 1.5386, + "step": 14403 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020618564109718668, + "loss": 1.5777, + "step": 14404 + }, + { + "epoch": 1.13, + "learning_rate": 0.0002061741809991666, + "loss": 1.5636, + "step": 14405 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020616272051975486, + "loss": 1.5046, + "step": 14406 + }, + { + "epoch": 1.13, + "learning_rate": 0.0002061512596590292, + "loss": 1.5948, + "step": 14407 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020613979841706747, + "loss": 1.5409, + "step": 14408 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020612833679394752, + "loss": 1.4702, + "step": 14409 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020611687478974707, + "loss": 1.5121, + "step": 14410 + }, + { + "epoch": 1.13, + "learning_rate": 0.0002061054124045441, + "loss": 1.5672, + "step": 14411 + }, + { + "epoch": 1.13, + "learning_rate": 0.0002060939496384163, + "loss": 1.5222, + "step": 14412 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020608248649144154, + "loss": 1.5755, + "step": 14413 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020607102296369765, + "loss": 1.536, + "step": 14414 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020605955905526242, + "loss": 1.5129, + "step": 14415 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020604809476621375, + "loss": 1.6037, + "step": 14416 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020603663009662946, + "loss": 1.5333, + "step": 14417 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020602516504658738, + "loss": 1.5609, + "step": 14418 + }, + { + "epoch": 1.13, + "learning_rate": 0.0002060136996161653, + "loss": 1.552, + "step": 14419 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020600223380544112, + "loss": 1.5372, + "step": 14420 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020599076761449272, + "loss": 1.531, + "step": 14421 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020597930104339788, + "loss": 1.5693, + "step": 14422 + }, + { + "epoch": 1.13, + "learning_rate": 0.0002059678340922345, + "loss": 1.515, + "step": 14423 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020595636676108036, + "loss": 1.5519, + "step": 14424 + }, + { + "epoch": 1.13, + "learning_rate": 0.00020594489905001342, + "loss": 1.5639, + "step": 14425 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020593343095911144, + "loss": 1.5585, + "step": 14426 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020592196248845235, + "loss": 1.5275, + "step": 14427 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020591049363811404, + "loss": 1.5384, + "step": 14428 + }, + { + "epoch": 1.14, + "learning_rate": 0.0002058990244081743, + "loss": 1.5446, + "step": 14429 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020588755479871102, + "loss": 1.5573, + "step": 14430 + }, + { + "epoch": 1.14, + "learning_rate": 0.0002058760848098021, + "loss": 1.5607, + "step": 14431 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020586461444152535, + "loss": 1.5961, + "step": 14432 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020585314369395879, + "loss": 1.5117, + "step": 14433 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020584167256718013, + "loss": 1.5166, + "step": 14434 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020583020106126735, + "loss": 1.6384, + "step": 14435 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020581872917629834, + "loss": 1.5829, + "step": 14436 + }, + { + "epoch": 1.14, + "learning_rate": 0.0002058072569123509, + "loss": 1.5924, + "step": 14437 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020579578426950306, + "loss": 1.5681, + "step": 14438 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020578431124783255, + "loss": 1.6036, + "step": 14439 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020577283784741743, + "loss": 1.5142, + "step": 14440 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020576136406833545, + "loss": 1.5, + "step": 14441 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020574988991066466, + "loss": 1.5611, + "step": 14442 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020573841537448284, + "loss": 1.5582, + "step": 14443 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020572694045986793, + "loss": 1.5112, + "step": 14444 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020571546516689787, + "loss": 1.5827, + "step": 14445 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020570398949565054, + "loss": 1.5456, + "step": 14446 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020569251344620384, + "loss": 1.5457, + "step": 14447 + }, + { + "epoch": 1.14, + "learning_rate": 0.0002056810370186357, + "loss": 1.5567, + "step": 14448 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020566956021302407, + "loss": 1.5831, + "step": 14449 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020565808302944687, + "loss": 1.5754, + "step": 14450 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020564660546798196, + "loss": 1.5635, + "step": 14451 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020563512752870734, + "loss": 1.5098, + "step": 14452 + }, + { + "epoch": 1.14, + "learning_rate": 0.0002056236492117009, + "loss": 1.5661, + "step": 14453 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020561217051704055, + "loss": 1.5407, + "step": 14454 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020560069144480425, + "loss": 1.5846, + "step": 14455 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020558921199506994, + "loss": 1.5942, + "step": 14456 + }, + { + "epoch": 1.14, + "learning_rate": 0.0002055777321679156, + "loss": 1.5755, + "step": 14457 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020556625196341909, + "loss": 1.5363, + "step": 14458 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020555477138165844, + "loss": 1.539, + "step": 14459 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020554329042271152, + "loss": 1.5369, + "step": 14460 + }, + { + "epoch": 1.14, + "learning_rate": 0.0002055318090866563, + "loss": 1.5228, + "step": 14461 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020552032737357077, + "loss": 1.6003, + "step": 14462 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020550884528353278, + "loss": 1.5493, + "step": 14463 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020549736281662046, + "loss": 1.5293, + "step": 14464 + }, + { + "epoch": 1.14, + "learning_rate": 0.0002054858799729116, + "loss": 1.5711, + "step": 14465 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020547439675248425, + "loss": 1.5592, + "step": 14466 + }, + { + "epoch": 1.14, + "learning_rate": 0.0002054629131554164, + "loss": 1.5545, + "step": 14467 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020545142918178594, + "loss": 1.5931, + "step": 14468 + }, + { + "epoch": 1.14, + "learning_rate": 0.0002054399448316709, + "loss": 1.5425, + "step": 14469 + }, + { + "epoch": 1.14, + "learning_rate": 0.0002054284601051492, + "loss": 1.5858, + "step": 14470 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020541697500229885, + "loss": 1.5406, + "step": 14471 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020540548952319783, + "loss": 1.5691, + "step": 14472 + }, + { + "epoch": 1.14, + "learning_rate": 0.0002053940036679241, + "loss": 1.5976, + "step": 14473 + }, + { + "epoch": 1.14, + "learning_rate": 0.0002053825174365557, + "loss": 1.5159, + "step": 14474 + }, + { + "epoch": 1.14, + "learning_rate": 0.0002053710308291705, + "loss": 1.5417, + "step": 14475 + }, + { + "epoch": 1.14, + "learning_rate": 0.0002053595438458466, + "loss": 1.5338, + "step": 14476 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020534805648666195, + "loss": 1.5803, + "step": 14477 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020533656875169453, + "loss": 1.5544, + "step": 14478 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020532508064102233, + "loss": 1.5379, + "step": 14479 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020531359215472336, + "loss": 1.6044, + "step": 14480 + }, + { + "epoch": 1.14, + "learning_rate": 0.0002053021032928757, + "loss": 1.5323, + "step": 14481 + }, + { + "epoch": 1.14, + "learning_rate": 0.0002052906140555572, + "loss": 1.5943, + "step": 14482 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020527912444284595, + "loss": 1.5412, + "step": 14483 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020526763445481998, + "loss": 1.5492, + "step": 14484 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020525614409155722, + "loss": 1.5539, + "step": 14485 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020524465335313577, + "loss": 1.5179, + "step": 14486 + }, + { + "epoch": 1.14, + "learning_rate": 0.0002052331622396336, + "loss": 1.5376, + "step": 14487 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020522167075112874, + "loss": 1.6135, + "step": 14488 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020521017888769922, + "loss": 1.5174, + "step": 14489 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020519868664942308, + "loss": 1.5658, + "step": 14490 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020518719403637829, + "loss": 1.5562, + "step": 14491 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020517570104864287, + "loss": 1.5651, + "step": 14492 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020516420768629492, + "loss": 1.5831, + "step": 14493 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020515271394941248, + "loss": 1.5491, + "step": 14494 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020514121983807347, + "loss": 1.5692, + "step": 14495 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020512972535235608, + "loss": 1.5642, + "step": 14496 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020511823049233825, + "loss": 1.5595, + "step": 14497 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020510673525809804, + "loss": 1.5232, + "step": 14498 + }, + { + "epoch": 1.14, + "learning_rate": 0.0002050952396497135, + "loss": 1.5176, + "step": 14499 + }, + { + "epoch": 1.14, + "learning_rate": 0.0002050837436672627, + "loss": 1.5333, + "step": 14500 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020507224731082372, + "loss": 1.5772, + "step": 14501 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020506075058047447, + "loss": 1.5367, + "step": 14502 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020504925347629319, + "loss": 1.5238, + "step": 14503 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020503775599835784, + "loss": 1.5069, + "step": 14504 + }, + { + "epoch": 1.14, + "learning_rate": 0.0002050262581467465, + "loss": 1.53, + "step": 14505 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020501475992153724, + "loss": 1.5734, + "step": 14506 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020500326132280814, + "loss": 1.5378, + "step": 14507 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020499176235063722, + "loss": 1.5709, + "step": 14508 + }, + { + "epoch": 1.14, + "learning_rate": 0.0002049802630051026, + "loss": 1.5305, + "step": 14509 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020496876328628228, + "loss": 1.5341, + "step": 14510 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020495726319425442, + "loss": 1.6043, + "step": 14511 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020494576272909708, + "loss": 1.5114, + "step": 14512 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020493426189088833, + "loss": 1.583, + "step": 14513 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020492276067970628, + "loss": 1.6263, + "step": 14514 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020491125909562896, + "loss": 1.5463, + "step": 14515 + }, + { + "epoch": 1.14, + "learning_rate": 0.0002048997571387345, + "loss": 1.609, + "step": 14516 + }, + { + "epoch": 1.14, + "learning_rate": 0.000204888254809101, + "loss": 1.5287, + "step": 14517 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020487675210680652, + "loss": 1.4799, + "step": 14518 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020486524903192918, + "loss": 1.5688, + "step": 14519 + }, + { + "epoch": 1.14, + "learning_rate": 0.0002048537455845471, + "loss": 1.5571, + "step": 14520 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020484224176473836, + "loss": 1.5463, + "step": 14521 + }, + { + "epoch": 1.14, + "learning_rate": 0.000204830737572581, + "loss": 1.5329, + "step": 14522 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020481923300815326, + "loss": 1.5437, + "step": 14523 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020480772807153315, + "loss": 1.595, + "step": 14524 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020479622276279886, + "loss": 1.5827, + "step": 14525 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020478471708202837, + "loss": 1.5723, + "step": 14526 + }, + { + "epoch": 1.14, + "learning_rate": 0.0002047732110292999, + "loss": 1.5361, + "step": 14527 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020476170460469162, + "loss": 1.5595, + "step": 14528 + }, + { + "epoch": 1.14, + "learning_rate": 0.0002047501978082815, + "loss": 1.5428, + "step": 14529 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020473869064014784, + "loss": 1.5962, + "step": 14530 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020472718310036864, + "loss": 1.568, + "step": 14531 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020471567518902205, + "loss": 1.5679, + "step": 14532 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020470416690618624, + "loss": 1.5544, + "step": 14533 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020469265825193926, + "loss": 1.5487, + "step": 14534 + }, + { + "epoch": 1.14, + "learning_rate": 0.0002046811492263594, + "loss": 1.5238, + "step": 14535 + }, + { + "epoch": 1.14, + "learning_rate": 0.0002046696398295247, + "loss": 1.5682, + "step": 14536 + }, + { + "epoch": 1.14, + "learning_rate": 0.0002046581300615133, + "loss": 1.565, + "step": 14537 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020464661992240335, + "loss": 1.5669, + "step": 14538 + }, + { + "epoch": 1.14, + "learning_rate": 0.000204635109412273, + "loss": 1.5666, + "step": 14539 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020462359853120045, + "loss": 1.5509, + "step": 14540 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020461208727926377, + "loss": 1.5784, + "step": 14541 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020460057565654114, + "loss": 1.5457, + "step": 14542 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020458906366311073, + "loss": 1.5907, + "step": 14543 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020457755129905077, + "loss": 1.5853, + "step": 14544 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020456603856443931, + "loss": 1.547, + "step": 14545 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020455452545935457, + "loss": 1.5661, + "step": 14546 + }, + { + "epoch": 1.14, + "learning_rate": 0.0002045430119838747, + "loss": 1.5135, + "step": 14547 + }, + { + "epoch": 1.14, + "learning_rate": 0.0002045314981380779, + "loss": 1.5719, + "step": 14548 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020451998392204227, + "loss": 1.5167, + "step": 14549 + }, + { + "epoch": 1.14, + "learning_rate": 0.0002045084693358461, + "loss": 1.5946, + "step": 14550 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020449695437956743, + "loss": 1.5479, + "step": 14551 + }, + { + "epoch": 1.14, + "learning_rate": 0.00020448543905328458, + "loss": 1.5284, + "step": 14552 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020447392335707563, + "loss": 1.5441, + "step": 14553 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020446240729101885, + "loss": 1.5141, + "step": 14554 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020445089085519233, + "loss": 1.497, + "step": 14555 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020443937404967426, + "loss": 1.5628, + "step": 14556 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020442785687454295, + "loss": 1.552, + "step": 14557 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020441633932987652, + "loss": 1.499, + "step": 14558 + }, + { + "epoch": 1.15, + "learning_rate": 0.0002044048214157532, + "loss": 1.5853, + "step": 14559 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020439330313225113, + "loss": 1.5032, + "step": 14560 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020438178447944856, + "loss": 1.5757, + "step": 14561 + }, + { + "epoch": 1.15, + "learning_rate": 0.0002043702654574237, + "loss": 1.559, + "step": 14562 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020435874606625473, + "loss": 1.5359, + "step": 14563 + }, + { + "epoch": 1.15, + "learning_rate": 0.0002043472263060199, + "loss": 1.4927, + "step": 14564 + }, + { + "epoch": 1.15, + "learning_rate": 0.0002043357061767973, + "loss": 1.5515, + "step": 14565 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020432418567866532, + "loss": 1.5246, + "step": 14566 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020431266481170209, + "loss": 1.5239, + "step": 14567 + }, + { + "epoch": 1.15, + "learning_rate": 0.0002043011435759858, + "loss": 1.5756, + "step": 14568 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020428962197159475, + "loss": 1.5746, + "step": 14569 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020427809999860712, + "loss": 1.5295, + "step": 14570 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020426657765710112, + "loss": 1.5099, + "step": 14571 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020425505494715506, + "loss": 1.5485, + "step": 14572 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020424353186884706, + "loss": 1.5548, + "step": 14573 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020423200842225545, + "loss": 1.56, + "step": 14574 + }, + { + "epoch": 1.15, + "learning_rate": 0.0002042204846074584, + "loss": 1.5289, + "step": 14575 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020420896042453422, + "loss": 1.5634, + "step": 14576 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020419743587356108, + "loss": 1.4872, + "step": 14577 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020418591095461725, + "loss": 1.5121, + "step": 14578 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020417438566778102, + "loss": 1.5648, + "step": 14579 + }, + { + "epoch": 1.15, + "learning_rate": 0.0002041628600131306, + "loss": 1.5436, + "step": 14580 + }, + { + "epoch": 1.15, + "learning_rate": 0.0002041513339907442, + "loss": 1.526, + "step": 14581 + }, + { + "epoch": 1.15, + "learning_rate": 0.0002041398076007002, + "loss": 1.4753, + "step": 14582 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020412828084307672, + "loss": 1.5619, + "step": 14583 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020411675371795215, + "loss": 1.5424, + "step": 14584 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020410522622540462, + "loss": 1.5148, + "step": 14585 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020409369836551253, + "loss": 1.538, + "step": 14586 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020408217013835405, + "loss": 1.5477, + "step": 14587 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020407064154400744, + "loss": 1.5603, + "step": 14588 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020405911258255103, + "loss": 1.5654, + "step": 14589 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020404758325406308, + "loss": 1.5328, + "step": 14590 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020403605355862192, + "loss": 1.5792, + "step": 14591 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020402452349630574, + "loss": 1.5513, + "step": 14592 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020401299306719285, + "loss": 1.5482, + "step": 14593 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020400146227136153, + "loss": 1.5297, + "step": 14594 + }, + { + "epoch": 1.15, + "learning_rate": 0.0002039899311088901, + "loss": 1.4981, + "step": 14595 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020397839957985686, + "loss": 1.5866, + "step": 14596 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020396686768434, + "loss": 1.534, + "step": 14597 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020395533542241794, + "loss": 1.4891, + "step": 14598 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020394380279416892, + "loss": 1.5765, + "step": 14599 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020393226979967125, + "loss": 1.5165, + "step": 14600 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020392073643900324, + "loss": 1.5136, + "step": 14601 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020390920271224315, + "loss": 1.5723, + "step": 14602 + }, + { + "epoch": 1.15, + "learning_rate": 0.0002038976686194694, + "loss": 1.5471, + "step": 14603 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020388613416076016, + "loss": 1.5292, + "step": 14604 + }, + { + "epoch": 1.15, + "learning_rate": 0.0002038745993361938, + "loss": 1.5924, + "step": 14605 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020386306414584864, + "loss": 1.5856, + "step": 14606 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020385152858980302, + "loss": 1.5533, + "step": 14607 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020383999266813526, + "loss": 1.5577, + "step": 14608 + }, + { + "epoch": 1.15, + "learning_rate": 0.0002038284563809236, + "loss": 1.5818, + "step": 14609 + }, + { + "epoch": 1.15, + "learning_rate": 0.0002038169197282465, + "loss": 1.5683, + "step": 14610 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020380538271018217, + "loss": 1.4751, + "step": 14611 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020379384532680895, + "loss": 1.5719, + "step": 14612 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020378230757820526, + "loss": 1.5951, + "step": 14613 + }, + { + "epoch": 1.15, + "learning_rate": 0.0002037707694644494, + "loss": 1.5342, + "step": 14614 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020375923098561965, + "loss": 1.5825, + "step": 14615 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020374769214179437, + "loss": 1.5924, + "step": 14616 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020373615293305195, + "loss": 1.5866, + "step": 14617 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020372461335947073, + "loss": 1.5842, + "step": 14618 + }, + { + "epoch": 1.15, + "learning_rate": 0.000203713073421129, + "loss": 1.5601, + "step": 14619 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020370153311810514, + "loss": 1.5212, + "step": 14620 + }, + { + "epoch": 1.15, + "learning_rate": 0.0002036899924504775, + "loss": 1.5721, + "step": 14621 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020367845141832448, + "loss": 1.5391, + "step": 14622 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020366691002172434, + "loss": 1.5562, + "step": 14623 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020365536826075554, + "loss": 1.5317, + "step": 14624 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020364382613549637, + "loss": 1.5385, + "step": 14625 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020363228364602526, + "loss": 1.5932, + "step": 14626 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020362074079242047, + "loss": 1.5171, + "step": 14627 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020360919757476047, + "loss": 1.482, + "step": 14628 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020359765399312365, + "loss": 1.5211, + "step": 14629 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020358611004758832, + "loss": 1.5565, + "step": 14630 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020357456573823286, + "loss": 1.5008, + "step": 14631 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020356302106513567, + "loss": 1.5224, + "step": 14632 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020355147602837514, + "loss": 1.5813, + "step": 14633 + }, + { + "epoch": 1.15, + "learning_rate": 0.0002035399306280296, + "loss": 1.5441, + "step": 14634 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020352838486417752, + "loss": 1.5483, + "step": 14635 + }, + { + "epoch": 1.15, + "learning_rate": 0.0002035168387368972, + "loss": 1.574, + "step": 14636 + }, + { + "epoch": 1.15, + "learning_rate": 0.0002035052922462671, + "loss": 1.5228, + "step": 14637 + }, + { + "epoch": 1.15, + "learning_rate": 0.0002034937453923656, + "loss": 1.4952, + "step": 14638 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020348219817527106, + "loss": 1.5558, + "step": 14639 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020347065059506198, + "loss": 1.5652, + "step": 14640 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020345910265181662, + "loss": 1.5505, + "step": 14641 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020344755434561349, + "loss": 1.6149, + "step": 14642 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020343600567653095, + "loss": 1.5319, + "step": 14643 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020342445664464742, + "loss": 1.529, + "step": 14644 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020341290725004127, + "loss": 1.6191, + "step": 14645 + }, + { + "epoch": 1.15, + "learning_rate": 0.000203401357492791, + "loss": 1.5582, + "step": 14646 + }, + { + "epoch": 1.15, + "learning_rate": 0.000203389807372975, + "loss": 1.5517, + "step": 14647 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020337825689067162, + "loss": 1.5506, + "step": 14648 + }, + { + "epoch": 1.15, + "learning_rate": 0.0002033667060459594, + "loss": 1.5928, + "step": 14649 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020335515483891662, + "loss": 1.474, + "step": 14650 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020334360326962185, + "loss": 1.5459, + "step": 14651 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020333205133815337, + "loss": 1.5455, + "step": 14652 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020332049904458975, + "loss": 1.5064, + "step": 14653 + }, + { + "epoch": 1.15, + "learning_rate": 0.0002033089463890094, + "loss": 1.5072, + "step": 14654 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020329739337149067, + "loss": 1.5704, + "step": 14655 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020328583999211204, + "loss": 1.5651, + "step": 14656 + }, + { + "epoch": 1.15, + "learning_rate": 0.000203274286250952, + "loss": 1.5288, + "step": 14657 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020326273214808893, + "loss": 1.6144, + "step": 14658 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020325117768360136, + "loss": 1.5691, + "step": 14659 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020323962285756758, + "loss": 1.5603, + "step": 14660 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020322806767006618, + "loss": 1.5502, + "step": 14661 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020321651212117559, + "loss": 1.5687, + "step": 14662 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020320495621097424, + "loss": 1.4882, + "step": 14663 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020319339993954064, + "loss": 1.5422, + "step": 14664 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020318184330695314, + "loss": 1.5496, + "step": 14665 + }, + { + "epoch": 1.15, + "learning_rate": 0.0002031702863132903, + "loss": 1.5871, + "step": 14666 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020315872895863057, + "loss": 1.5374, + "step": 14667 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020314717124305238, + "loss": 1.5916, + "step": 14668 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020313561316663426, + "loss": 1.5374, + "step": 14669 + }, + { + "epoch": 1.15, + "learning_rate": 0.0002031240547294546, + "loss": 1.5299, + "step": 14670 + }, + { + "epoch": 1.15, + "learning_rate": 0.000203112495931592, + "loss": 1.5709, + "step": 14671 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020310093677312481, + "loss": 1.5724, + "step": 14672 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020308937725413155, + "loss": 1.5585, + "step": 14673 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020307781737469077, + "loss": 1.5137, + "step": 14674 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020306625713488084, + "loss": 1.6098, + "step": 14675 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020305469653478036, + "loss": 1.582, + "step": 14676 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020304313557446775, + "loss": 1.5919, + "step": 14677 + }, + { + "epoch": 1.15, + "learning_rate": 0.0002030315742540215, + "loss": 1.5556, + "step": 14678 + }, + { + "epoch": 1.15, + "learning_rate": 0.00020302001257352015, + "loss": 1.6076, + "step": 14679 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020300845053304215, + "loss": 1.5628, + "step": 14680 + }, + { + "epoch": 1.16, + "learning_rate": 0.0002029968881326661, + "loss": 1.5804, + "step": 14681 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020298532537247035, + "loss": 1.5316, + "step": 14682 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020297376225253345, + "loss": 1.5722, + "step": 14683 + }, + { + "epoch": 1.16, + "learning_rate": 0.000202962198772934, + "loss": 1.6335, + "step": 14684 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020295063493375043, + "loss": 1.5216, + "step": 14685 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020293907073506127, + "loss": 1.6007, + "step": 14686 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020292750617694502, + "loss": 1.5381, + "step": 14687 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020291594125948026, + "loss": 1.5442, + "step": 14688 + }, + { + "epoch": 1.16, + "learning_rate": 0.0002029043759827454, + "loss": 1.5463, + "step": 14689 + }, + { + "epoch": 1.16, + "learning_rate": 0.0002028928103468191, + "loss": 1.5181, + "step": 14690 + }, + { + "epoch": 1.16, + "learning_rate": 0.0002028812443517797, + "loss": 1.5405, + "step": 14691 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020286967799770588, + "loss": 1.5657, + "step": 14692 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020285811128467615, + "loss": 1.5463, + "step": 14693 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020284654421276897, + "loss": 1.5997, + "step": 14694 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020283497678206297, + "loss": 1.5269, + "step": 14695 + }, + { + "epoch": 1.16, + "learning_rate": 0.0002028234089926366, + "loss": 1.5346, + "step": 14696 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020281184084456843, + "loss": 1.5217, + "step": 14697 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020280027233793706, + "loss": 1.5805, + "step": 14698 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020278870347282087, + "loss": 1.5264, + "step": 14699 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020277713424929862, + "loss": 1.5386, + "step": 14700 + }, + { + "epoch": 1.16, + "learning_rate": 0.0002027655646674487, + "loss": 1.6007, + "step": 14701 + }, + { + "epoch": 1.16, + "learning_rate": 0.0002027539947273497, + "loss": 1.5726, + "step": 14702 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020274242442908026, + "loss": 1.4688, + "step": 14703 + }, + { + "epoch": 1.16, + "learning_rate": 0.0002027308537727188, + "loss": 1.5376, + "step": 14704 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020271928275834397, + "loss": 1.5483, + "step": 14705 + }, + { + "epoch": 1.16, + "learning_rate": 0.0002027077113860343, + "loss": 1.5083, + "step": 14706 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020269613965586832, + "loss": 1.5353, + "step": 14707 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020268456756792466, + "loss": 1.5598, + "step": 14708 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020267299512228185, + "loss": 1.5665, + "step": 14709 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020266142231901852, + "loss": 1.5285, + "step": 14710 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020264984915821312, + "loss": 1.5768, + "step": 14711 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020263827563994435, + "loss": 1.5236, + "step": 14712 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020262670176429074, + "loss": 1.5497, + "step": 14713 + }, + { + "epoch": 1.16, + "learning_rate": 0.0002026151275313308, + "loss": 1.5252, + "step": 14714 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020260355294114324, + "loss": 1.5874, + "step": 14715 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020259197799380656, + "loss": 1.5845, + "step": 14716 + }, + { + "epoch": 1.16, + "learning_rate": 0.0002025804026893994, + "loss": 1.4976, + "step": 14717 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020256882702800028, + "loss": 1.5212, + "step": 14718 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020255725100968788, + "loss": 1.5178, + "step": 14719 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020254567463454072, + "loss": 1.5556, + "step": 14720 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020253409790263745, + "loss": 1.5565, + "step": 14721 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020252252081405663, + "loss": 1.6056, + "step": 14722 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020251094336887684, + "loss": 1.5879, + "step": 14723 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020249936556717676, + "loss": 1.5907, + "step": 14724 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020248778740903498, + "loss": 1.516, + "step": 14725 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020247620889453006, + "loss": 1.5659, + "step": 14726 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020246463002374066, + "loss": 1.5869, + "step": 14727 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020245305079674537, + "loss": 1.5381, + "step": 14728 + }, + { + "epoch": 1.16, + "learning_rate": 0.0002024414712136228, + "loss": 1.5659, + "step": 14729 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020242989127445158, + "loss": 1.5798, + "step": 14730 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020241831097931028, + "loss": 1.5154, + "step": 14731 + }, + { + "epoch": 1.16, + "learning_rate": 0.0002024067303282777, + "loss": 1.5378, + "step": 14732 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020239514932143227, + "loss": 1.5464, + "step": 14733 + }, + { + "epoch": 1.16, + "learning_rate": 0.0002023835679588527, + "loss": 1.567, + "step": 14734 + }, + { + "epoch": 1.16, + "learning_rate": 0.0002023719862406176, + "loss": 1.5498, + "step": 14735 + }, + { + "epoch": 1.16, + "learning_rate": 0.0002023604041668056, + "loss": 1.5794, + "step": 14736 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020234882173749539, + "loss": 1.5393, + "step": 14737 + }, + { + "epoch": 1.16, + "learning_rate": 0.0002023372389527655, + "loss": 1.5395, + "step": 14738 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020232565581269473, + "loss": 1.5525, + "step": 14739 + }, + { + "epoch": 1.16, + "learning_rate": 0.0002023140723173616, + "loss": 1.5826, + "step": 14740 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020230248846684473, + "loss": 1.5497, + "step": 14741 + }, + { + "epoch": 1.16, + "learning_rate": 0.0002022909042612229, + "loss": 1.5407, + "step": 14742 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020227931970057467, + "loss": 1.5309, + "step": 14743 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020226773478497872, + "loss": 1.5075, + "step": 14744 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020225614951451367, + "loss": 1.5777, + "step": 14745 + }, + { + "epoch": 1.16, + "learning_rate": 0.0002022445638892582, + "loss": 1.5025, + "step": 14746 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020223297790929095, + "loss": 1.5504, + "step": 14747 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020222139157469063, + "loss": 1.5517, + "step": 14748 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020220980488553592, + "loss": 1.581, + "step": 14749 + }, + { + "epoch": 1.16, + "learning_rate": 0.0002021982178419054, + "loss": 1.5754, + "step": 14750 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020218663044387777, + "loss": 1.5564, + "step": 14751 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020217504269153178, + "loss": 1.5642, + "step": 14752 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020216345458494602, + "loss": 1.5638, + "step": 14753 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020215186612419913, + "loss": 1.5371, + "step": 14754 + }, + { + "epoch": 1.16, + "learning_rate": 0.0002021402773093699, + "loss": 1.527, + "step": 14755 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020212868814053697, + "loss": 1.6033, + "step": 14756 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020211709861777899, + "loss": 1.5139, + "step": 14757 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020210550874117465, + "loss": 1.5785, + "step": 14758 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020209391851080274, + "loss": 1.5443, + "step": 14759 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020208232792674183, + "loss": 1.5456, + "step": 14760 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020207073698907065, + "loss": 1.5755, + "step": 14761 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020205914569786787, + "loss": 1.5339, + "step": 14762 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020204755405321226, + "loss": 1.5351, + "step": 14763 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020203596205518247, + "loss": 1.5919, + "step": 14764 + }, + { + "epoch": 1.16, + "learning_rate": 0.0002020243697038572, + "loss": 1.5963, + "step": 14765 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020201277699931518, + "loss": 1.536, + "step": 14766 + }, + { + "epoch": 1.16, + "learning_rate": 0.0002020011839416351, + "loss": 1.5433, + "step": 14767 + }, + { + "epoch": 1.16, + "learning_rate": 0.0002019895905308957, + "loss": 1.5868, + "step": 14768 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020197799676717566, + "loss": 1.5595, + "step": 14769 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020196640265055367, + "loss": 1.5617, + "step": 14770 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020195480818110853, + "loss": 1.5395, + "step": 14771 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020194321335891889, + "loss": 1.5928, + "step": 14772 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020193161818406354, + "loss": 1.5845, + "step": 14773 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020192002265662112, + "loss": 1.549, + "step": 14774 + }, + { + "epoch": 1.16, + "learning_rate": 0.0002019084267766704, + "loss": 1.5151, + "step": 14775 + }, + { + "epoch": 1.16, + "learning_rate": 0.0002018968305442901, + "loss": 1.5163, + "step": 14776 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020188523395955896, + "loss": 1.5491, + "step": 14777 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020187363702255573, + "loss": 1.5473, + "step": 14778 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020186203973335913, + "loss": 1.5338, + "step": 14779 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020185044209204787, + "loss": 1.5385, + "step": 14780 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020183884409870077, + "loss": 1.5487, + "step": 14781 + }, + { + "epoch": 1.16, + "learning_rate": 0.0002018272457533965, + "loss": 1.5084, + "step": 14782 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020181564705621386, + "loss": 1.5114, + "step": 14783 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020180404800723153, + "loss": 1.4976, + "step": 14784 + }, + { + "epoch": 1.16, + "learning_rate": 0.0002017924486065283, + "loss": 1.5851, + "step": 14785 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020178084885418292, + "loss": 1.5363, + "step": 14786 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020176924875027418, + "loss": 1.5774, + "step": 14787 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020175764829488083, + "loss": 1.5812, + "step": 14788 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020174604748808154, + "loss": 1.5417, + "step": 14789 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020173444632995524, + "loss": 1.5528, + "step": 14790 + }, + { + "epoch": 1.16, + "learning_rate": 0.0002017228448205805, + "loss": 1.5234, + "step": 14791 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020171124296003624, + "loss": 1.5112, + "step": 14792 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020169964074840118, + "loss": 1.5467, + "step": 14793 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020168803818575406, + "loss": 1.5401, + "step": 14794 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020167643527217374, + "loss": 1.5875, + "step": 14795 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020166483200773888, + "loss": 1.5776, + "step": 14796 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020165322839252832, + "loss": 1.5203, + "step": 14797 + }, + { + "epoch": 1.16, + "learning_rate": 0.0002016416244266209, + "loss": 1.5547, + "step": 14798 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020163002011009534, + "loss": 1.5525, + "step": 14799 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020161841544303043, + "loss": 1.5536, + "step": 14800 + }, + { + "epoch": 1.16, + "learning_rate": 0.0002016068104255049, + "loss": 1.5867, + "step": 14801 + }, + { + "epoch": 1.16, + "learning_rate": 0.0002015952050575977, + "loss": 1.521, + "step": 14802 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020158359933938744, + "loss": 1.5936, + "step": 14803 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020157199327095306, + "loss": 1.5668, + "step": 14804 + }, + { + "epoch": 1.16, + "learning_rate": 0.0002015603868523733, + "loss": 1.5778, + "step": 14805 + }, + { + "epoch": 1.16, + "learning_rate": 0.00020154878008372696, + "loss": 1.6052, + "step": 14806 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020153717296509286, + "loss": 1.5361, + "step": 14807 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020152556549654982, + "loss": 1.549, + "step": 14808 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020151395767817654, + "loss": 1.559, + "step": 14809 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020150234951005203, + "loss": 1.545, + "step": 14810 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020149074099225488, + "loss": 1.5672, + "step": 14811 + }, + { + "epoch": 1.17, + "learning_rate": 0.0002014791321248641, + "loss": 1.5207, + "step": 14812 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020146752290795835, + "loss": 1.5614, + "step": 14813 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020145591334161655, + "loss": 1.5117, + "step": 14814 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020144430342591753, + "loss": 1.5713, + "step": 14815 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020143269316094003, + "loss": 1.5605, + "step": 14816 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020142108254676296, + "loss": 1.5727, + "step": 14817 + }, + { + "epoch": 1.17, + "learning_rate": 0.0002014094715834651, + "loss": 1.5471, + "step": 14818 + }, + { + "epoch": 1.17, + "learning_rate": 0.0002013978602711253, + "loss": 1.5476, + "step": 14819 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020138624860982238, + "loss": 1.4714, + "step": 14820 + }, + { + "epoch": 1.17, + "learning_rate": 0.0002013746365996352, + "loss": 1.5565, + "step": 14821 + }, + { + "epoch": 1.17, + "learning_rate": 0.0002013630242406426, + "loss": 1.5253, + "step": 14822 + }, + { + "epoch": 1.17, + "learning_rate": 0.0002013514115329234, + "loss": 1.5142, + "step": 14823 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020133979847655642, + "loss": 1.5387, + "step": 14824 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020132818507162057, + "loss": 1.5293, + "step": 14825 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020131657131819465, + "loss": 1.513, + "step": 14826 + }, + { + "epoch": 1.17, + "learning_rate": 0.0002013049572163576, + "loss": 1.5747, + "step": 14827 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020129334276618814, + "loss": 1.5856, + "step": 14828 + }, + { + "epoch": 1.17, + "learning_rate": 0.0002012817279677652, + "loss": 1.5796, + "step": 14829 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020127011282116764, + "loss": 1.5458, + "step": 14830 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020125849732647428, + "loss": 1.5454, + "step": 14831 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020124688148376402, + "loss": 1.5315, + "step": 14832 + }, + { + "epoch": 1.17, + "learning_rate": 0.0002012352652931157, + "loss": 1.5269, + "step": 14833 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020122364875460827, + "loss": 1.533, + "step": 14834 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020121203186832047, + "loss": 1.5931, + "step": 14835 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020120041463433125, + "loss": 1.5714, + "step": 14836 + }, + { + "epoch": 1.17, + "learning_rate": 0.0002011887970527195, + "loss": 1.5201, + "step": 14837 + }, + { + "epoch": 1.17, + "learning_rate": 0.000201177179123564, + "loss": 1.5252, + "step": 14838 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020116556084694376, + "loss": 1.5444, + "step": 14839 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020115394222293753, + "loss": 1.6306, + "step": 14840 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020114232325162433, + "loss": 1.5699, + "step": 14841 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020113070393308293, + "loss": 1.5552, + "step": 14842 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020111908426739228, + "loss": 1.5328, + "step": 14843 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020110746425463128, + "loss": 1.5323, + "step": 14844 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020109584389487877, + "loss": 1.5051, + "step": 14845 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020108422318821373, + "loss": 1.5107, + "step": 14846 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020107260213471495, + "loss": 1.5769, + "step": 14847 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020106098073446136, + "loss": 1.5591, + "step": 14848 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020104935898753194, + "loss": 1.5003, + "step": 14849 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020103773689400555, + "loss": 1.5339, + "step": 14850 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020102611445396108, + "loss": 1.5181, + "step": 14851 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020101449166747744, + "loss": 1.5542, + "step": 14852 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020100286853463355, + "loss": 1.5119, + "step": 14853 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020099124505550836, + "loss": 1.5094, + "step": 14854 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020097962123018072, + "loss": 1.5504, + "step": 14855 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020096799705872958, + "loss": 1.5466, + "step": 14856 + }, + { + "epoch": 1.17, + "learning_rate": 0.0002009563725412339, + "loss": 1.5844, + "step": 14857 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020094474767777255, + "loss": 1.529, + "step": 14858 + }, + { + "epoch": 1.17, + "learning_rate": 0.0002009331224684245, + "loss": 1.5405, + "step": 14859 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020092149691326865, + "loss": 1.5552, + "step": 14860 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020090987101238392, + "loss": 1.575, + "step": 14861 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020089824476584927, + "loss": 1.529, + "step": 14862 + }, + { + "epoch": 1.17, + "learning_rate": 0.0002008866181737436, + "loss": 1.5695, + "step": 14863 + }, + { + "epoch": 1.17, + "learning_rate": 0.0002008749912361459, + "loss": 1.5962, + "step": 14864 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020086336395313506, + "loss": 1.525, + "step": 14865 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020085173632479009, + "loss": 1.5515, + "step": 14866 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020084010835118987, + "loss": 1.5824, + "step": 14867 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020082848003241338, + "loss": 1.5512, + "step": 14868 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020081685136853956, + "loss": 1.4863, + "step": 14869 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020080522235964735, + "loss": 1.5709, + "step": 14870 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020079359300581573, + "loss": 1.5397, + "step": 14871 + }, + { + "epoch": 1.17, + "learning_rate": 0.0002007819633071236, + "loss": 1.5804, + "step": 14872 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020077033326364998, + "loss": 1.5459, + "step": 14873 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020075870287547385, + "loss": 1.5148, + "step": 14874 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020074707214267414, + "loss": 1.5637, + "step": 14875 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020073544106532978, + "loss": 1.5873, + "step": 14876 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020072380964351977, + "loss": 1.5166, + "step": 14877 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020071217787732314, + "loss": 1.5387, + "step": 14878 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020070054576681875, + "loss": 1.5389, + "step": 14879 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020068891331208566, + "loss": 1.564, + "step": 14880 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020067728051320277, + "loss": 1.6148, + "step": 14881 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020066564737024917, + "loss": 1.5884, + "step": 14882 + }, + { + "epoch": 1.17, + "learning_rate": 0.0002006540138833038, + "loss": 1.5261, + "step": 14883 + }, + { + "epoch": 1.17, + "learning_rate": 0.0002006423800524456, + "loss": 1.5482, + "step": 14884 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020063074587775359, + "loss": 1.5589, + "step": 14885 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020061911135930673, + "loss": 1.6026, + "step": 14886 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020060747649718405, + "loss": 1.5523, + "step": 14887 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020059584129146453, + "loss": 1.5497, + "step": 14888 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020058420574222714, + "loss": 1.5489, + "step": 14889 + }, + { + "epoch": 1.17, + "learning_rate": 0.000200572569849551, + "loss": 1.5432, + "step": 14890 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020056093361351497, + "loss": 1.5275, + "step": 14891 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020054929703419808, + "loss": 1.5759, + "step": 14892 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020053766011167938, + "loss": 1.5592, + "step": 14893 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020052602284603786, + "loss": 1.5129, + "step": 14894 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020051438523735251, + "loss": 1.5439, + "step": 14895 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020050274728570234, + "loss": 1.6067, + "step": 14896 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020049110899116645, + "loss": 1.5165, + "step": 14897 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020047947035382378, + "loss": 1.5567, + "step": 14898 + }, + { + "epoch": 1.17, + "learning_rate": 0.0002004678313737533, + "loss": 1.5046, + "step": 14899 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020045619205103418, + "loss": 1.5188, + "step": 14900 + }, + { + "epoch": 1.17, + "learning_rate": 0.0002004445523857453, + "loss": 1.4878, + "step": 14901 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020043291237796578, + "loss": 1.5835, + "step": 14902 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020042127202777457, + "loss": 1.5147, + "step": 14903 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020040963133525076, + "loss": 1.5929, + "step": 14904 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020039799030047343, + "loss": 1.5245, + "step": 14905 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020038634892352152, + "loss": 1.557, + "step": 14906 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020037470720447412, + "loss": 1.5266, + "step": 14907 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020036306514341023, + "loss": 1.5465, + "step": 14908 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020035142274040893, + "loss": 1.5323, + "step": 14909 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020033977999554928, + "loss": 1.5395, + "step": 14910 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020032813690891023, + "loss": 1.5867, + "step": 14911 + }, + { + "epoch": 1.17, + "learning_rate": 0.000200316493480571, + "loss": 1.5376, + "step": 14912 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020030484971061047, + "loss": 1.5901, + "step": 14913 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020029320559910782, + "loss": 1.6383, + "step": 14914 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020028156114614202, + "loss": 1.6228, + "step": 14915 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020026991635179218, + "loss": 1.6023, + "step": 14916 + }, + { + "epoch": 1.17, + "learning_rate": 0.0002002582712161374, + "loss": 1.565, + "step": 14917 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020024662573925664, + "loss": 1.5326, + "step": 14918 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020023497992122902, + "loss": 1.5025, + "step": 14919 + }, + { + "epoch": 1.17, + "learning_rate": 0.0002002233337621336, + "loss": 1.5684, + "step": 14920 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020021168726204946, + "loss": 1.5261, + "step": 14921 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020020004042105573, + "loss": 1.5787, + "step": 14922 + }, + { + "epoch": 1.17, + "learning_rate": 0.0002001883932392314, + "loss": 1.5355, + "step": 14923 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020017674571665554, + "loss": 1.5146, + "step": 14924 + }, + { + "epoch": 1.17, + "learning_rate": 0.0002001650978534073, + "loss": 1.5514, + "step": 14925 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020015344964956572, + "loss": 1.5647, + "step": 14926 + }, + { + "epoch": 1.17, + "learning_rate": 0.0002001418011052099, + "loss": 1.5621, + "step": 14927 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020013015222041888, + "loss": 1.5433, + "step": 14928 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020011850299527184, + "loss": 1.5437, + "step": 14929 + }, + { + "epoch": 1.17, + "learning_rate": 0.0002001068534298478, + "loss": 1.6097, + "step": 14930 + }, + { + "epoch": 1.17, + "learning_rate": 0.0002000952035242259, + "loss": 1.5176, + "step": 14931 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020008355327848522, + "loss": 1.5434, + "step": 14932 + }, + { + "epoch": 1.17, + "learning_rate": 0.00020007190269270478, + "loss": 1.499, + "step": 14933 + }, + { + "epoch": 1.18, + "learning_rate": 0.00020006025176696384, + "loss": 1.5835, + "step": 14934 + }, + { + "epoch": 1.18, + "learning_rate": 0.00020004860050134134, + "loss": 1.6121, + "step": 14935 + }, + { + "epoch": 1.18, + "learning_rate": 0.00020003694889591652, + "loss": 1.5574, + "step": 14936 + }, + { + "epoch": 1.18, + "learning_rate": 0.00020002529695076841, + "loss": 1.5755, + "step": 14937 + }, + { + "epoch": 1.18, + "learning_rate": 0.00020001364466597612, + "loss": 1.6119, + "step": 14938 + }, + { + "epoch": 1.18, + "learning_rate": 0.00020000199204161883, + "loss": 1.6063, + "step": 14939 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019999033907777556, + "loss": 1.5351, + "step": 14940 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019997868577452553, + "loss": 1.581, + "step": 14941 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019996703213194772, + "loss": 1.5515, + "step": 14942 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019995537815012138, + "loss": 1.5363, + "step": 14943 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001999437238291256, + "loss": 1.5937, + "step": 14944 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001999320691690395, + "loss": 1.5329, + "step": 14945 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019992041416994224, + "loss": 1.5084, + "step": 14946 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019990875883191283, + "loss": 1.5428, + "step": 14947 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001998971031550305, + "loss": 1.5711, + "step": 14948 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019988544713937445, + "loss": 1.5345, + "step": 14949 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019987379078502363, + "loss": 1.5537, + "step": 14950 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019986213409205742, + "loss": 1.5461, + "step": 14951 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019985047706055475, + "loss": 1.5037, + "step": 14952 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019983881969059492, + "loss": 1.5135, + "step": 14953 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019982716198225695, + "loss": 1.5276, + "step": 14954 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019981550393562006, + "loss": 1.5506, + "step": 14955 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019980384555076338, + "loss": 1.5072, + "step": 14956 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001997921868277661, + "loss": 1.5108, + "step": 14957 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019978052776670733, + "loss": 1.5703, + "step": 14958 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019976886836766623, + "loss": 1.5915, + "step": 14959 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019975720863072197, + "loss": 1.5005, + "step": 14960 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001997455485559538, + "loss": 1.5735, + "step": 14961 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019973388814344074, + "loss": 1.5448, + "step": 14962 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019972222739326207, + "loss": 1.549, + "step": 14963 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019971056630549688, + "loss": 1.5414, + "step": 14964 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019969890488022438, + "loss": 1.5995, + "step": 14965 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019968724311752374, + "loss": 1.5571, + "step": 14966 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019967558101747414, + "loss": 1.5718, + "step": 14967 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019966391858015477, + "loss": 1.5665, + "step": 14968 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001996522558056448, + "loss": 1.5301, + "step": 14969 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019964059269402345, + "loss": 1.5298, + "step": 14970 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019962892924536979, + "loss": 1.5152, + "step": 14971 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019961726545976314, + "loss": 1.5253, + "step": 14972 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019960560133728262, + "loss": 1.5733, + "step": 14973 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001995939368780074, + "loss": 1.5185, + "step": 14974 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001995822720820168, + "loss": 1.5078, + "step": 14975 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019957060694938988, + "loss": 1.548, + "step": 14976 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001995589414802059, + "loss": 1.5486, + "step": 14977 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001995472756745441, + "loss": 1.547, + "step": 14978 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019953560953248357, + "loss": 1.5207, + "step": 14979 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019952394305410365, + "loss": 1.5483, + "step": 14980 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019951227623948346, + "loss": 1.5167, + "step": 14981 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019950060908870224, + "loss": 1.5662, + "step": 14982 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019948894160183917, + "loss": 1.5614, + "step": 14983 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019947727377897355, + "loss": 1.5322, + "step": 14984 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019946560562018452, + "loss": 1.5207, + "step": 14985 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001994539371255513, + "loss": 1.5642, + "step": 14986 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019944226829515316, + "loss": 1.5255, + "step": 14987 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019943059912906936, + "loss": 1.561, + "step": 14988 + }, + { + "epoch": 1.18, + "learning_rate": 0.000199418929627379, + "loss": 1.5568, + "step": 14989 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019940725979016136, + "loss": 1.5306, + "step": 14990 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019939558961749572, + "loss": 1.5937, + "step": 14991 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019938391910946133, + "loss": 1.5663, + "step": 14992 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019937224826613735, + "loss": 1.5663, + "step": 14993 + }, + { + "epoch": 1.18, + "learning_rate": 0.000199360577087603, + "loss": 1.5557, + "step": 14994 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019934890557393766, + "loss": 1.5369, + "step": 14995 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019933723372522044, + "loss": 1.6417, + "step": 14996 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019932556154153062, + "loss": 1.5543, + "step": 14997 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019931388902294747, + "loss": 1.4782, + "step": 14998 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019930221616955022, + "loss": 1.519, + "step": 14999 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001992905429814181, + "loss": 1.5899, + "step": 15000 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019927886945863044, + "loss": 1.5209, + "step": 15001 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019926719560126645, + "loss": 1.5586, + "step": 15002 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019925552140940536, + "loss": 1.512, + "step": 15003 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001992438468831265, + "loss": 1.5065, + "step": 15004 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019923217202250906, + "loss": 1.5733, + "step": 15005 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019922049682763232, + "loss": 1.5378, + "step": 15006 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019920882129857562, + "loss": 1.4742, + "step": 15007 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019919714543541818, + "loss": 1.5635, + "step": 15008 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019918546923823927, + "loss": 1.5344, + "step": 15009 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019917379270711813, + "loss": 1.5229, + "step": 15010 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001991621158421341, + "loss": 1.5355, + "step": 15011 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019915043864336646, + "loss": 1.5502, + "step": 15012 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001991387611108944, + "loss": 1.5902, + "step": 15013 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001991270832447973, + "loss": 1.5504, + "step": 15014 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001991154050451544, + "loss": 1.5747, + "step": 15015 + }, + { + "epoch": 1.18, + "learning_rate": 0.000199103726512045, + "loss": 1.5748, + "step": 15016 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019909204764554845, + "loss": 1.5629, + "step": 15017 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019908036844574396, + "loss": 1.5496, + "step": 15018 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019906868891271084, + "loss": 1.5105, + "step": 15019 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001990570090465284, + "loss": 1.4935, + "step": 15020 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019904532884727595, + "loss": 1.5371, + "step": 15021 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019903364831503278, + "loss": 1.5922, + "step": 15022 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001990219674498782, + "loss": 1.4516, + "step": 15023 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001990102862518915, + "loss": 1.5544, + "step": 15024 + }, + { + "epoch": 1.18, + "learning_rate": 0.000198998604721152, + "loss": 1.4893, + "step": 15025 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019898692285773905, + "loss": 1.5298, + "step": 15026 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001989752406617319, + "loss": 1.5757, + "step": 15027 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001989635581332099, + "loss": 1.5665, + "step": 15028 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019895187527225233, + "loss": 1.5765, + "step": 15029 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019894019207893857, + "loss": 1.5699, + "step": 15030 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019892850855334794, + "loss": 1.6082, + "step": 15031 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019891682469555966, + "loss": 1.5253, + "step": 15032 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001989051405056532, + "loss": 1.5763, + "step": 15033 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019889345598370783, + "loss": 1.5641, + "step": 15034 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019888177112980284, + "loss": 1.5061, + "step": 15035 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019887008594401763, + "loss": 1.5658, + "step": 15036 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019885840042643146, + "loss": 1.5756, + "step": 15037 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001988467145771238, + "loss": 1.5409, + "step": 15038 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019883502839617378, + "loss": 1.5851, + "step": 15039 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019882334188366094, + "loss": 1.6157, + "step": 15040 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019881165503966456, + "loss": 1.5541, + "step": 15041 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019879996786426393, + "loss": 1.5472, + "step": 15042 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019878828035753852, + "loss": 1.5314, + "step": 15043 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019877659251956755, + "loss": 1.5478, + "step": 15044 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019876490435043043, + "loss": 1.5551, + "step": 15045 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019875321585020658, + "loss": 1.5567, + "step": 15046 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019874152701897525, + "loss": 1.5371, + "step": 15047 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019872983785681586, + "loss": 1.5331, + "step": 15048 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019871814836380777, + "loss": 1.5894, + "step": 15049 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019870645854003035, + "loss": 1.5745, + "step": 15050 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019869476838556293, + "loss": 1.4963, + "step": 15051 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019868307790048487, + "loss": 1.517, + "step": 15052 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019867138708487564, + "loss": 1.5409, + "step": 15053 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019865969593881453, + "loss": 1.6157, + "step": 15054 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019864800446238093, + "loss": 1.5531, + "step": 15055 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019863631265565422, + "loss": 1.5469, + "step": 15056 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001986246205187138, + "loss": 1.5551, + "step": 15057 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019861292805163904, + "loss": 1.5804, + "step": 15058 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019860123525450933, + "loss": 1.5921, + "step": 15059 + }, + { + "epoch": 1.18, + "learning_rate": 0.00019858954212740405, + "loss": 1.5331, + "step": 15060 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019857784867040256, + "loss": 1.5383, + "step": 15061 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019856615488358432, + "loss": 1.5467, + "step": 15062 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019855446076702874, + "loss": 1.5368, + "step": 15063 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019854276632081506, + "loss": 1.5759, + "step": 15064 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001985310715450229, + "loss": 1.5764, + "step": 15065 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001985193764397314, + "loss": 1.5182, + "step": 15066 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001985076810050202, + "loss": 1.534, + "step": 15067 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019849598524096862, + "loss": 1.6172, + "step": 15068 + }, + { + "epoch": 1.19, + "learning_rate": 0.000198484289147656, + "loss": 1.5613, + "step": 15069 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019847259272516191, + "loss": 1.596, + "step": 15070 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019846089597356557, + "loss": 1.5526, + "step": 15071 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019844919889294656, + "loss": 1.5339, + "step": 15072 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001984375014833842, + "loss": 1.5204, + "step": 15073 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019842580374495794, + "loss": 1.5384, + "step": 15074 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019841410567774723, + "loss": 1.5563, + "step": 15075 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019840240728183136, + "loss": 1.5664, + "step": 15076 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019839070855728997, + "loss": 1.564, + "step": 15077 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019837900950420227, + "loss": 1.5374, + "step": 15078 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019836731012264785, + "loss": 1.4921, + "step": 15079 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001983556104127061, + "loss": 1.5674, + "step": 15080 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001983439103744564, + "loss": 1.5359, + "step": 15081 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019833221000797828, + "loss": 1.5523, + "step": 15082 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019832050931335108, + "loss": 1.4992, + "step": 15083 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019830880829065428, + "loss": 1.5188, + "step": 15084 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019829710693996733, + "loss": 1.5771, + "step": 15085 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019828540526136969, + "loss": 1.4954, + "step": 15086 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019827370325494083, + "loss": 1.5294, + "step": 15087 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001982620009207601, + "loss": 1.5727, + "step": 15088 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019825029825890704, + "loss": 1.6093, + "step": 15089 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001982385952694611, + "loss": 1.5694, + "step": 15090 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019822689195250174, + "loss": 1.524, + "step": 15091 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019821518830810835, + "loss": 1.5472, + "step": 15092 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019820348433636045, + "loss": 1.5392, + "step": 15093 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019819178003733752, + "loss": 1.5537, + "step": 15094 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019818007541111895, + "loss": 1.6358, + "step": 15095 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019816837045778427, + "loss": 1.5612, + "step": 15096 + }, + { + "epoch": 1.19, + "learning_rate": 0.000198156665177413, + "loss": 1.5207, + "step": 15097 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001981449595700845, + "loss": 1.579, + "step": 15098 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019813325363587827, + "loss": 1.567, + "step": 15099 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001981215473748738, + "loss": 1.571, + "step": 15100 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019810984078715062, + "loss": 1.5666, + "step": 15101 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019809813387278817, + "loss": 1.5528, + "step": 15102 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019808642663186592, + "loss": 1.5673, + "step": 15103 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001980747190644634, + "loss": 1.5609, + "step": 15104 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019806301117066002, + "loss": 1.562, + "step": 15105 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019805130295053532, + "loss": 1.5989, + "step": 15106 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001980395944041688, + "loss": 1.5241, + "step": 15107 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019802788553163994, + "loss": 1.4957, + "step": 15108 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019801617633302828, + "loss": 1.5511, + "step": 15109 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019800446680841324, + "loss": 1.5321, + "step": 15110 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019799275695787442, + "loss": 1.5289, + "step": 15111 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019798104678149118, + "loss": 1.5154, + "step": 15112 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019796933627934317, + "loss": 1.5909, + "step": 15113 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019795762545150983, + "loss": 1.5602, + "step": 15114 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019794591429807062, + "loss": 1.5479, + "step": 15115 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019793420281910516, + "loss": 1.6018, + "step": 15116 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019792249101469291, + "loss": 1.5508, + "step": 15117 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001979107788849134, + "loss": 1.5788, + "step": 15118 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019789906642984616, + "loss": 1.5748, + "step": 15119 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019788735364957064, + "loss": 1.5728, + "step": 15120 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019787564054416648, + "loss": 1.512, + "step": 15121 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019786392711371308, + "loss": 1.4686, + "step": 15122 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019785221335829006, + "loss": 1.5711, + "step": 15123 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019784049927797686, + "loss": 1.5277, + "step": 15124 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019782878487285314, + "loss": 1.56, + "step": 15125 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019781707014299838, + "loss": 1.538, + "step": 15126 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019780535508849207, + "loss": 1.5978, + "step": 15127 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019779363970941373, + "loss": 1.521, + "step": 15128 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019778192400584304, + "loss": 1.5841, + "step": 15129 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019777020797785938, + "loss": 1.6084, + "step": 15130 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001977584916255424, + "loss": 1.5498, + "step": 15131 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001977467749489716, + "loss": 1.5644, + "step": 15132 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001977350579482266, + "loss": 1.5131, + "step": 15133 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019772334062338683, + "loss": 1.5236, + "step": 15134 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019771162297453195, + "loss": 1.5288, + "step": 15135 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019769990500174153, + "loss": 1.5619, + "step": 15136 + }, + { + "epoch": 1.19, + "learning_rate": 0.000197688186705095, + "loss": 1.5319, + "step": 15137 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019767646808467205, + "loss": 1.586, + "step": 15138 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019766474914055212, + "loss": 1.5946, + "step": 15139 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019765302987281491, + "loss": 1.5133, + "step": 15140 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001976413102815399, + "loss": 1.5541, + "step": 15141 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001976295903668067, + "loss": 1.5696, + "step": 15142 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019761787012869487, + "loss": 1.5276, + "step": 15143 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019760614956728392, + "loss": 1.5541, + "step": 15144 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019759442868265355, + "loss": 1.5335, + "step": 15145 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001975827074748833, + "loss": 1.549, + "step": 15146 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001975709859440526, + "loss": 1.5484, + "step": 15147 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019755926409024128, + "loss": 1.5447, + "step": 15148 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019754754191352874, + "loss": 1.5089, + "step": 15149 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019753581941399468, + "loss": 1.5384, + "step": 15150 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001975240965917186, + "loss": 1.5378, + "step": 15151 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019751237344678012, + "loss": 1.5737, + "step": 15152 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001975006499792589, + "loss": 1.5567, + "step": 15153 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019748892618923441, + "loss": 1.5769, + "step": 15154 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019747720207678634, + "loss": 1.5529, + "step": 15155 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019746547764199428, + "loss": 1.5838, + "step": 15156 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001974537528849378, + "loss": 1.5305, + "step": 15157 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019744202780569659, + "loss": 1.596, + "step": 15158 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001974303024043501, + "loss": 1.5574, + "step": 15159 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001974185766809781, + "loss": 1.5411, + "step": 15160 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001974068506356601, + "loss": 1.5515, + "step": 15161 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019739512426847575, + "loss": 1.5751, + "step": 15162 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019738339757950464, + "loss": 1.5805, + "step": 15163 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019737167056882644, + "loss": 1.494, + "step": 15164 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019735994323652074, + "loss": 1.5545, + "step": 15165 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019734821558266714, + "loss": 1.5392, + "step": 15166 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019733648760734534, + "loss": 1.5975, + "step": 15167 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019732475931063482, + "loss": 1.5224, + "step": 15168 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019731303069261537, + "loss": 1.5142, + "step": 15169 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001973013017533665, + "loss": 1.5421, + "step": 15170 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019728957249296792, + "loss": 1.5604, + "step": 15171 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001972778429114993, + "loss": 1.5661, + "step": 15172 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019726611300904015, + "loss": 1.5943, + "step": 15173 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019725438278567016, + "loss": 1.5527, + "step": 15174 + }, + { + "epoch": 1.19, + "learning_rate": 0.000197242652241469, + "loss": 1.5191, + "step": 15175 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019723092137651632, + "loss": 1.5197, + "step": 15176 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001972191901908918, + "loss": 1.5316, + "step": 15177 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019720745868467493, + "loss": 1.6017, + "step": 15178 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019719572685794552, + "loss": 1.5275, + "step": 15179 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019718399471078317, + "loss": 1.5268, + "step": 15180 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001971722622432675, + "loss": 1.5798, + "step": 15181 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019716052945547828, + "loss": 1.5403, + "step": 15182 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019714879634749502, + "loss": 1.5114, + "step": 15183 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019713706291939745, + "loss": 1.563, + "step": 15184 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001971253291712653, + "loss": 1.5692, + "step": 15185 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001971135951031781, + "loss": 1.5871, + "step": 15186 + }, + { + "epoch": 1.19, + "learning_rate": 0.00019710186071521564, + "loss": 1.5301, + "step": 15187 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001970901260074575, + "loss": 1.5887, + "step": 15188 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019707839097998344, + "loss": 1.5233, + "step": 15189 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019706665563287302, + "loss": 1.5296, + "step": 15190 + }, + { + "epoch": 1.2, + "learning_rate": 0.000197054919966206, + "loss": 1.6056, + "step": 15191 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001970431839800621, + "loss": 1.5729, + "step": 15192 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001970314476745209, + "loss": 1.545, + "step": 15193 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019701971104966207, + "loss": 1.5797, + "step": 15194 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019700797410556544, + "loss": 1.5796, + "step": 15195 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019699623684231058, + "loss": 1.5449, + "step": 15196 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019698449925997715, + "loss": 1.5799, + "step": 15197 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019697276135864495, + "loss": 1.5938, + "step": 15198 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019696102313839365, + "loss": 1.5334, + "step": 15199 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019694928459930287, + "loss": 1.5203, + "step": 15200 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019693754574145236, + "loss": 1.6097, + "step": 15201 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001969258065649218, + "loss": 1.5877, + "step": 15202 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019691406706979093, + "loss": 1.5608, + "step": 15203 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019690232725613947, + "loss": 1.6108, + "step": 15204 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019689058712404707, + "loss": 1.5715, + "step": 15205 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019687884667359343, + "loss": 1.5258, + "step": 15206 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019686710590485833, + "loss": 1.553, + "step": 15207 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019685536481792138, + "loss": 1.6206, + "step": 15208 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019684362341286244, + "loss": 1.5893, + "step": 15209 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001968318816897611, + "loss": 1.5555, + "step": 15210 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019682013964869715, + "loss": 1.599, + "step": 15211 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019680839728975023, + "loss": 1.5729, + "step": 15212 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001967966546130002, + "loss": 1.5115, + "step": 15213 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019678491161852668, + "loss": 1.5637, + "step": 15214 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019677316830640947, + "loss": 1.5347, + "step": 15215 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001967614246767282, + "loss": 1.5461, + "step": 15216 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019674968072956267, + "loss": 1.5714, + "step": 15217 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019673793646499263, + "loss": 1.5524, + "step": 15218 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019672619188309775, + "loss": 1.5306, + "step": 15219 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019671444698395784, + "loss": 1.5661, + "step": 15220 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019670270176765263, + "loss": 1.5229, + "step": 15221 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019669095623426185, + "loss": 1.5454, + "step": 15222 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019667921038386523, + "loss": 1.52, + "step": 15223 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019666746421654252, + "loss": 1.5538, + "step": 15224 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001966557177323735, + "loss": 1.5818, + "step": 15225 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019664397093143788, + "loss": 1.5152, + "step": 15226 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019663222381381543, + "loss": 1.5167, + "step": 15227 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019662047637958595, + "loss": 1.5846, + "step": 15228 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019660872862882917, + "loss": 1.625, + "step": 15229 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001965969805616248, + "loss": 1.5358, + "step": 15230 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019658523217805268, + "loss": 1.609, + "step": 15231 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019657348347819253, + "loss": 1.5696, + "step": 15232 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001965617344621241, + "loss": 1.5459, + "step": 15233 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019654998512992722, + "loss": 1.4938, + "step": 15234 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019653823548168166, + "loss": 1.552, + "step": 15235 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001965264855174671, + "loss": 1.5603, + "step": 15236 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001965147352373634, + "loss": 1.6004, + "step": 15237 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019650298464145033, + "loss": 1.523, + "step": 15238 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019649123372980764, + "loss": 1.5003, + "step": 15239 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019647948250251516, + "loss": 1.5329, + "step": 15240 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019646773095965262, + "loss": 1.5782, + "step": 15241 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001964559791012998, + "loss": 1.5479, + "step": 15242 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001964442269275366, + "loss": 1.5469, + "step": 15243 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019643247443844265, + "loss": 1.5494, + "step": 15244 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019642072163409788, + "loss": 1.5568, + "step": 15245 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019640896851458198, + "loss": 1.5387, + "step": 15246 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001963972150799748, + "loss": 1.567, + "step": 15247 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001963854613303562, + "loss": 1.5161, + "step": 15248 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001963737072658058, + "loss": 1.5177, + "step": 15249 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019636195288640358, + "loss": 1.5844, + "step": 15250 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001963501981922293, + "loss": 1.6065, + "step": 15251 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019633844318336276, + "loss": 1.4813, + "step": 15252 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019632668785988375, + "loss": 1.5072, + "step": 15253 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019631493222187208, + "loss": 1.4841, + "step": 15254 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019630317626940757, + "loss": 1.5031, + "step": 15255 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019629142000257007, + "loss": 1.5607, + "step": 15256 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019627966342143936, + "loss": 1.5202, + "step": 15257 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019626790652609526, + "loss": 1.5463, + "step": 15258 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019625614931661762, + "loss": 1.6016, + "step": 15259 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001962443917930863, + "loss": 1.5064, + "step": 15260 + }, + { + "epoch": 1.2, + "learning_rate": 0.000196232633955581, + "loss": 1.5404, + "step": 15261 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001962208758041817, + "loss": 1.5893, + "step": 15262 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019620911733896808, + "loss": 1.549, + "step": 15263 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019619735856002011, + "loss": 1.5038, + "step": 15264 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019618559946741755, + "loss": 1.5584, + "step": 15265 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019617384006124028, + "loss": 1.5426, + "step": 15266 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001961620803415681, + "loss": 1.5896, + "step": 15267 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019615032030848088, + "loss": 1.5494, + "step": 15268 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019613855996205844, + "loss": 1.5028, + "step": 15269 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019612679930238066, + "loss": 1.566, + "step": 15270 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019611503832952734, + "loss": 1.5822, + "step": 15271 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001961032770435784, + "loss": 1.5859, + "step": 15272 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019609151544461358, + "loss": 1.5628, + "step": 15273 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019607975353271286, + "loss": 1.5817, + "step": 15274 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019606799130795602, + "loss": 1.5425, + "step": 15275 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019605622877042294, + "loss": 1.5418, + "step": 15276 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001960444659201935, + "loss": 1.5929, + "step": 15277 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019603270275734755, + "loss": 1.5383, + "step": 15278 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019602093928196496, + "loss": 1.5664, + "step": 15279 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019600917549412552, + "loss": 1.5778, + "step": 15280 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001959974113939092, + "loss": 1.5332, + "step": 15281 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019598564698139587, + "loss": 1.5569, + "step": 15282 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019597388225666535, + "loss": 1.5263, + "step": 15283 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001959621172197976, + "loss": 1.5014, + "step": 15284 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019595035187087236, + "loss": 1.527, + "step": 15285 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001959385862099696, + "loss": 1.4592, + "step": 15286 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019592682023716925, + "loss": 1.5439, + "step": 15287 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019591505395255104, + "loss": 1.5235, + "step": 15288 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019590328735619506, + "loss": 1.5922, + "step": 15289 + }, + { + "epoch": 1.2, + "learning_rate": 0.000195891520448181, + "loss": 1.5579, + "step": 15290 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001958797532285889, + "loss": 1.5121, + "step": 15291 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019586798569749857, + "loss": 1.5483, + "step": 15292 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001958562178549899, + "loss": 1.5441, + "step": 15293 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001958444497011429, + "loss": 1.5593, + "step": 15294 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019583268123603729, + "loss": 1.529, + "step": 15295 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019582091245975308, + "loss": 1.5248, + "step": 15296 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001958091433723702, + "loss": 1.5237, + "step": 15297 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019579737397396851, + "loss": 1.5798, + "step": 15298 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019578560426462794, + "loss": 1.5554, + "step": 15299 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019577383424442836, + "loss": 1.551, + "step": 15300 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019576206391344971, + "loss": 1.4884, + "step": 15301 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019575029327177187, + "loss": 1.5564, + "step": 15302 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019573852231947482, + "loss": 1.5665, + "step": 15303 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019572675105663842, + "loss": 1.5484, + "step": 15304 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019571497948334265, + "loss": 1.5883, + "step": 15305 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001957032075996674, + "loss": 1.624, + "step": 15306 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019569143540569255, + "loss": 1.5579, + "step": 15307 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019567966290149808, + "loss": 1.5526, + "step": 15308 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019566789008716395, + "loss": 1.5976, + "step": 15309 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019565611696276998, + "loss": 1.5371, + "step": 15310 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019564434352839624, + "loss": 1.5677, + "step": 15311 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019563256978412253, + "loss": 1.5502, + "step": 15312 + }, + { + "epoch": 1.2, + "learning_rate": 0.00019562079573002888, + "loss": 1.5279, + "step": 15313 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001956090213661952, + "loss": 1.5123, + "step": 15314 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019559724669270144, + "loss": 1.5086, + "step": 15315 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019558547170962754, + "loss": 1.5283, + "step": 15316 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019557369641705344, + "loss": 1.5322, + "step": 15317 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001955619208150591, + "loss": 1.5441, + "step": 15318 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019555014490372445, + "loss": 1.5533, + "step": 15319 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019553836868312945, + "loss": 1.5209, + "step": 15320 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019552659215335406, + "loss": 1.5492, + "step": 15321 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019551481531447822, + "loss": 1.5816, + "step": 15322 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019550303816658196, + "loss": 1.621, + "step": 15323 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001954912607097451, + "loss": 1.564, + "step": 15324 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001954794829440477, + "loss": 1.5872, + "step": 15325 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001954677048695698, + "loss": 1.5542, + "step": 15326 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001954559264863912, + "loss": 1.4857, + "step": 15327 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001954441477945919, + "loss": 1.5337, + "step": 15328 + }, + { + "epoch": 1.21, + "learning_rate": 0.000195432368794252, + "loss": 1.5127, + "step": 15329 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019542058948545136, + "loss": 1.5694, + "step": 15330 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019540880986826994, + "loss": 1.504, + "step": 15331 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019539702994278782, + "loss": 1.5496, + "step": 15332 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019538524970908489, + "loss": 1.5604, + "step": 15333 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019537346916724115, + "loss": 1.5649, + "step": 15334 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019536168831733657, + "loss": 1.561, + "step": 15335 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001953499071594512, + "loss": 1.5723, + "step": 15336 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019533812569366498, + "loss": 1.5432, + "step": 15337 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019532634392005794, + "loss": 1.5054, + "step": 15338 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019531456183871, + "loss": 1.4959, + "step": 15339 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019530277944970122, + "loss": 1.6402, + "step": 15340 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019529099675311154, + "loss": 1.5067, + "step": 15341 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019527921374902098, + "loss": 1.6224, + "step": 15342 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019526743043750955, + "loss": 1.561, + "step": 15343 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019525564681865723, + "loss": 1.6096, + "step": 15344 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001952438628925441, + "loss": 1.5142, + "step": 15345 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019523207865925006, + "loss": 1.5681, + "step": 15346 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001952202941188552, + "loss": 1.512, + "step": 15347 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019520850927143946, + "loss": 1.5087, + "step": 15348 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001951967241170829, + "loss": 1.4646, + "step": 15349 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019518493865586557, + "loss": 1.5217, + "step": 15350 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019517315288786736, + "loss": 1.5797, + "step": 15351 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019516136681316845, + "loss": 1.561, + "step": 15352 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019514958043184873, + "loss": 1.5186, + "step": 15353 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001951377937439883, + "loss": 1.5146, + "step": 15354 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019512600674966718, + "loss": 1.5034, + "step": 15355 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019511421944896535, + "loss": 1.5641, + "step": 15356 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019510243184196288, + "loss": 1.587, + "step": 15357 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019509064392873973, + "loss": 1.5164, + "step": 15358 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019507885570937603, + "loss": 1.5152, + "step": 15359 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001950670671839518, + "loss": 1.5335, + "step": 15360 + }, + { + "epoch": 1.21, + "learning_rate": 0.000195055278352547, + "loss": 1.5158, + "step": 15361 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001950434892152418, + "loss": 1.5351, + "step": 15362 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001950316997721161, + "loss": 1.5179, + "step": 15363 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019501991002325003, + "loss": 1.5932, + "step": 15364 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019500811996872364, + "loss": 1.569, + "step": 15365 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019499632960861692, + "loss": 1.466, + "step": 15366 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019498453894300995, + "loss": 1.5005, + "step": 15367 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001949727479719828, + "loss": 1.5353, + "step": 15368 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001949609566956155, + "loss": 1.5581, + "step": 15369 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001949491651139881, + "loss": 1.5026, + "step": 15370 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001949373732271807, + "loss": 1.5472, + "step": 15371 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019492558103527337, + "loss": 1.5131, + "step": 15372 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019491378853834606, + "loss": 1.5383, + "step": 15373 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019490199573647898, + "loss": 1.5811, + "step": 15374 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001948902026297521, + "loss": 1.4935, + "step": 15375 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019487840921824553, + "loss": 1.5541, + "step": 15376 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019486661550203928, + "loss": 1.5278, + "step": 15377 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019485482148121349, + "loss": 1.5383, + "step": 15378 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019484302715584823, + "loss": 1.556, + "step": 15379 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019483123252602355, + "loss": 1.5298, + "step": 15380 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019481943759181954, + "loss": 1.5078, + "step": 15381 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019480764235331634, + "loss": 1.5646, + "step": 15382 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019479584681059386, + "loss": 1.5851, + "step": 15383 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001947840509637324, + "loss": 1.5656, + "step": 15384 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019477225481281192, + "loss": 1.573, + "step": 15385 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019476045835791254, + "loss": 1.5577, + "step": 15386 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019474866159911432, + "loss": 1.56, + "step": 15387 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019473686453649742, + "loss": 1.5167, + "step": 15388 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019472506717014187, + "loss": 1.5413, + "step": 15389 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019471326950012778, + "loss": 1.4872, + "step": 15390 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019470147152653532, + "loss": 1.5048, + "step": 15391 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001946896732494445, + "loss": 1.5983, + "step": 15392 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019467787466893546, + "loss": 1.5506, + "step": 15393 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019466607578508832, + "loss": 1.5474, + "step": 15394 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019465427659798318, + "loss": 1.5153, + "step": 15395 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019464247710770016, + "loss": 1.5187, + "step": 15396 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001946306773143193, + "loss": 1.5125, + "step": 15397 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019461887721792078, + "loss": 1.535, + "step": 15398 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019460707681858474, + "loss": 1.5528, + "step": 15399 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019459527611639122, + "loss": 1.527, + "step": 15400 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019458347511142044, + "loss": 1.5514, + "step": 15401 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019457167380375245, + "loss": 1.5756, + "step": 15402 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019455987219346737, + "loss": 1.5663, + "step": 15403 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019454807028064535, + "loss": 1.5862, + "step": 15404 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019453626806536654, + "loss": 1.5417, + "step": 15405 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019452446554771101, + "loss": 1.5267, + "step": 15406 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019451266272775897, + "loss": 1.5467, + "step": 15407 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019450085960559052, + "loss": 1.5474, + "step": 15408 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019448905618128575, + "loss": 1.5198, + "step": 15409 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019447725245492486, + "loss": 1.5624, + "step": 15410 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019446544842658797, + "loss": 1.5558, + "step": 15411 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019445364409635522, + "loss": 1.5581, + "step": 15412 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001944418394643068, + "loss": 1.5441, + "step": 15413 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019443003453052272, + "loss": 1.4992, + "step": 15414 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019441822929508332, + "loss": 1.5455, + "step": 15415 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001944064237580686, + "loss": 1.5698, + "step": 15416 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019439461791955878, + "loss": 1.5467, + "step": 15417 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019438281177963402, + "loss": 1.5746, + "step": 15418 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019437100533837445, + "loss": 1.5828, + "step": 15419 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001943591985958602, + "loss": 1.5081, + "step": 15420 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019434739155217156, + "loss": 1.5299, + "step": 15421 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001943355842073885, + "loss": 1.5717, + "step": 15422 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019432377656159136, + "loss": 1.5259, + "step": 15423 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001943119686148602, + "loss": 1.5691, + "step": 15424 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001943001603672753, + "loss": 1.5141, + "step": 15425 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001942883518189167, + "loss": 1.6127, + "step": 15426 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001942765429698646, + "loss": 1.4978, + "step": 15427 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019426473382019928, + "loss": 1.5773, + "step": 15428 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019425292437000077, + "loss": 1.5638, + "step": 15429 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019424111461934936, + "loss": 1.566, + "step": 15430 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001942293045683252, + "loss": 1.6251, + "step": 15431 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019421749421700846, + "loss": 1.5609, + "step": 15432 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019420568356547934, + "loss": 1.5977, + "step": 15433 + }, + { + "epoch": 1.21, + "learning_rate": 0.000194193872613818, + "loss": 1.5159, + "step": 15434 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019418206136210473, + "loss": 1.542, + "step": 15435 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019417024981041958, + "loss": 1.5252, + "step": 15436 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001941584379588428, + "loss": 1.6064, + "step": 15437 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019414662580745463, + "loss": 1.592, + "step": 15438 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019413481335633519, + "loss": 1.5337, + "step": 15439 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019412300060556476, + "loss": 1.5329, + "step": 15440 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001941111875552235, + "loss": 1.5457, + "step": 15441 + }, + { + "epoch": 1.21, + "learning_rate": 0.00019409937420539165, + "loss": 1.5311, + "step": 15442 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019408756055614934, + "loss": 1.5305, + "step": 15443 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019407574660757683, + "loss": 1.5493, + "step": 15444 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001940639323597543, + "loss": 1.5809, + "step": 15445 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019405211781276202, + "loss": 1.6023, + "step": 15446 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001940403029666802, + "loss": 1.525, + "step": 15447 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019402848782158898, + "loss": 1.5585, + "step": 15448 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019401667237756861, + "loss": 1.5284, + "step": 15449 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019400485663469938, + "loss": 1.5727, + "step": 15450 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001939930405930614, + "loss": 1.5573, + "step": 15451 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019398122425273503, + "loss": 1.4825, + "step": 15452 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001939694076138003, + "loss": 1.5609, + "step": 15453 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019395759067633765, + "loss": 1.5462, + "step": 15454 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001939457734404272, + "loss": 1.4955, + "step": 15455 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019393395590614919, + "loss": 1.5868, + "step": 15456 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001939221380735839, + "loss": 1.5487, + "step": 15457 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019391031994281147, + "loss": 1.5172, + "step": 15458 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019389850151391223, + "loss": 1.567, + "step": 15459 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001938866827869664, + "loss": 1.541, + "step": 15460 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001938748637620542, + "loss": 1.4659, + "step": 15461 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019386304443925583, + "loss": 1.5114, + "step": 15462 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019385122481865166, + "loss": 1.5083, + "step": 15463 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001938394049003219, + "loss": 1.5443, + "step": 15464 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019382758468434671, + "loss": 1.5705, + "step": 15465 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019381576417080643, + "loss": 1.6054, + "step": 15466 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001938039433597813, + "loss": 1.5311, + "step": 15467 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019379212225135154, + "loss": 1.5546, + "step": 15468 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019378030084559746, + "loss": 1.561, + "step": 15469 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019376847914259927, + "loss": 1.5863, + "step": 15470 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019375665714243734, + "loss": 1.5295, + "step": 15471 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019374483484519176, + "loss": 1.5066, + "step": 15472 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019373301225094293, + "loss": 1.5474, + "step": 15473 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001937211893597711, + "loss": 1.5227, + "step": 15474 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019370936617175652, + "loss": 1.5323, + "step": 15475 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019369754268697945, + "loss": 1.5752, + "step": 15476 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001936857189055201, + "loss": 1.5643, + "step": 15477 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019367389482745893, + "loss": 1.5914, + "step": 15478 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001936620704528761, + "loss": 1.5179, + "step": 15479 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019365024578185192, + "loss": 1.535, + "step": 15480 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019363842081446662, + "loss": 1.5557, + "step": 15481 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019362659555080053, + "loss": 1.5732, + "step": 15482 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019361476999093396, + "loss": 1.5334, + "step": 15483 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019360294413494714, + "loss": 1.5584, + "step": 15484 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019359111798292035, + "loss": 1.557, + "step": 15485 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019357929153493404, + "loss": 1.5614, + "step": 15486 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001935674647910683, + "loss": 1.545, + "step": 15487 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019355563775140357, + "loss": 1.5188, + "step": 15488 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019354381041602003, + "loss": 1.5233, + "step": 15489 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019353198278499812, + "loss": 1.5116, + "step": 15490 + }, + { + "epoch": 1.22, + "learning_rate": 0.000193520154858418, + "loss": 1.5635, + "step": 15491 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001935083266363601, + "loss": 1.5191, + "step": 15492 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001934964981189046, + "loss": 1.5825, + "step": 15493 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019348466930613198, + "loss": 1.518, + "step": 15494 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019347284019812237, + "loss": 1.5448, + "step": 15495 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019346101079495623, + "loss": 1.5352, + "step": 15496 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019344918109671374, + "loss": 1.5374, + "step": 15497 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019343735110347537, + "loss": 1.5425, + "step": 15498 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001934255208153213, + "loss": 1.5018, + "step": 15499 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001934136902323319, + "loss": 1.4945, + "step": 15500 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019340185935458752, + "loss": 1.5477, + "step": 15501 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019339002818216848, + "loss": 1.4983, + "step": 15502 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001933781967151551, + "loss": 1.5183, + "step": 15503 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001933663649536277, + "loss": 1.591, + "step": 15504 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019335453289766655, + "loss": 1.5616, + "step": 15505 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019334270054735214, + "loss": 1.5243, + "step": 15506 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019333086790276465, + "loss": 1.552, + "step": 15507 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019331903496398446, + "loss": 1.5668, + "step": 15508 + }, + { + "epoch": 1.22, + "learning_rate": 0.000193307201731092, + "loss": 1.5258, + "step": 15509 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001932953682041675, + "loss": 1.504, + "step": 15510 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019328353438329135, + "loss": 1.4725, + "step": 15511 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019327170026854388, + "loss": 1.4998, + "step": 15512 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019325986586000543, + "loss": 1.4844, + "step": 15513 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019324803115775636, + "loss": 1.5186, + "step": 15514 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001932361961618771, + "loss": 1.5354, + "step": 15515 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019322436087244784, + "loss": 1.5261, + "step": 15516 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001932125252895491, + "loss": 1.5606, + "step": 15517 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019320068941326108, + "loss": 1.5619, + "step": 15518 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019318885324366423, + "loss": 1.5253, + "step": 15519 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019317701678083895, + "loss": 1.5238, + "step": 15520 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019316518002486554, + "loss": 1.5532, + "step": 15521 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019315334297582436, + "loss": 1.4829, + "step": 15522 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001931415056337958, + "loss": 1.4946, + "step": 15523 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001931296679988602, + "loss": 1.487, + "step": 15524 + }, + { + "epoch": 1.22, + "learning_rate": 0.000193117830071098, + "loss": 1.5295, + "step": 15525 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019310599185058948, + "loss": 1.5594, + "step": 15526 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019309415333741513, + "loss": 1.4972, + "step": 15527 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001930823145316552, + "loss": 1.5163, + "step": 15528 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019307047543339016, + "loss": 1.5269, + "step": 15529 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019305863604270035, + "loss": 1.5707, + "step": 15530 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019304679635966617, + "loss": 1.5785, + "step": 15531 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019303495638436796, + "loss": 1.565, + "step": 15532 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001930231161168862, + "loss": 1.5888, + "step": 15533 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001930112755573012, + "loss": 1.5246, + "step": 15534 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019299943470569338, + "loss": 1.518, + "step": 15535 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019298759356214314, + "loss": 1.5427, + "step": 15536 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019297575212673084, + "loss": 1.5665, + "step": 15537 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001929639103995369, + "loss": 1.55, + "step": 15538 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001929520683806417, + "loss": 1.4961, + "step": 15539 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019294022607012568, + "loss": 1.5259, + "step": 15540 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001929283834680692, + "loss": 1.5453, + "step": 15541 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019291654057455274, + "loss": 1.5317, + "step": 15542 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001929046973896566, + "loss": 1.5826, + "step": 15543 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001928928539134613, + "loss": 1.5054, + "step": 15544 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019288101014604714, + "loss": 1.5448, + "step": 15545 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019286916608749461, + "loss": 1.5612, + "step": 15546 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001928573217378841, + "loss": 1.5564, + "step": 15547 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019284547709729597, + "loss": 1.552, + "step": 15548 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019283363216581078, + "loss": 1.5604, + "step": 15549 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019282178694350879, + "loss": 1.5091, + "step": 15550 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019280994143047053, + "loss": 1.5367, + "step": 15551 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019279809562677643, + "loss": 1.5315, + "step": 15552 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019278624953250682, + "loss": 1.557, + "step": 15553 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001927744031477422, + "loss": 1.54, + "step": 15554 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019276255647256298, + "loss": 1.5223, + "step": 15555 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019275070950704965, + "loss": 1.5596, + "step": 15556 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019273886225128258, + "loss": 1.5352, + "step": 15557 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019272701470534215, + "loss": 1.4809, + "step": 15558 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019271516686930894, + "loss": 1.6166, + "step": 15559 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019270331874326332, + "loss": 1.4841, + "step": 15560 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019269147032728568, + "loss": 1.5591, + "step": 15561 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019267962162145658, + "loss": 1.4944, + "step": 15562 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019266777262585632, + "loss": 1.5555, + "step": 15563 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001926559233405655, + "loss": 1.5434, + "step": 15564 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019264407376566448, + "loss": 1.5383, + "step": 15565 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019263222390123374, + "loss": 1.5314, + "step": 15566 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001926203737473537, + "loss": 1.5142, + "step": 15567 + }, + { + "epoch": 1.22, + "learning_rate": 0.00019260852330410487, + "loss": 1.5592, + "step": 15568 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001925966725715677, + "loss": 1.5444, + "step": 15569 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019258482154982257, + "loss": 1.4941, + "step": 15570 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019257297023895, + "loss": 1.5522, + "step": 15571 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019256111863903049, + "loss": 1.5129, + "step": 15572 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001925492667501445, + "loss": 1.5187, + "step": 15573 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019253741457237245, + "loss": 1.5513, + "step": 15574 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019252556210579478, + "loss": 1.5482, + "step": 15575 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019251370935049206, + "loss": 1.5818, + "step": 15576 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019250185630654472, + "loss": 1.5026, + "step": 15577 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019249000297403318, + "loss": 1.5497, + "step": 15578 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019247814935303802, + "loss": 1.578, + "step": 15579 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019246629544363963, + "loss": 1.5166, + "step": 15580 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019245444124591857, + "loss": 1.5285, + "step": 15581 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019244258675995524, + "loss": 1.5381, + "step": 15582 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001924307319858302, + "loss": 1.5632, + "step": 15583 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019241887692362389, + "loss": 1.5528, + "step": 15584 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019240702157341682, + "loss": 1.4855, + "step": 15585 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019239516593528948, + "loss": 1.5644, + "step": 15586 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019238331000932232, + "loss": 1.5605, + "step": 15587 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019237145379559593, + "loss": 1.5346, + "step": 15588 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019235959729419072, + "loss": 1.5826, + "step": 15589 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001923477405051872, + "loss": 1.6003, + "step": 15590 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019233588342866594, + "loss": 1.5496, + "step": 15591 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019232402606470737, + "loss": 1.5369, + "step": 15592 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019231216841339202, + "loss": 1.5915, + "step": 15593 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001923003104748004, + "loss": 1.5392, + "step": 15594 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019228845224901302, + "loss": 1.5668, + "step": 15595 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019227659373611037, + "loss": 1.5047, + "step": 15596 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019226473493617297, + "loss": 1.5325, + "step": 15597 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019225287584928138, + "loss": 1.561, + "step": 15598 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019224101647551605, + "loss": 1.5615, + "step": 15599 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019222915681495754, + "loss": 1.5591, + "step": 15600 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019221729686768634, + "loss": 1.556, + "step": 15601 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019220543663378304, + "loss": 1.5321, + "step": 15602 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019219357611332806, + "loss": 1.5405, + "step": 15603 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019218171530640198, + "loss": 1.5203, + "step": 15604 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001921698542130854, + "loss": 1.527, + "step": 15605 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019215799283345874, + "loss": 1.5634, + "step": 15606 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019214613116760255, + "loss": 1.5241, + "step": 15607 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019213426921559746, + "loss": 1.5244, + "step": 15608 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019212240697752387, + "loss": 1.5644, + "step": 15609 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019211054445346238, + "loss": 1.5512, + "step": 15610 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019209868164349352, + "loss": 1.5835, + "step": 15611 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019208681854769792, + "loss": 1.5405, + "step": 15612 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019207495516615597, + "loss": 1.5512, + "step": 15613 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019206309149894833, + "loss": 1.5597, + "step": 15614 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001920512275461555, + "loss": 1.485, + "step": 15615 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019203936330785805, + "loss": 1.5326, + "step": 15616 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019202749878413652, + "loss": 1.5021, + "step": 15617 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019201563397507144, + "loss": 1.5705, + "step": 15618 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019200376888074341, + "loss": 1.5536, + "step": 15619 + }, + { + "epoch": 1.23, + "learning_rate": 0.000191991903501233, + "loss": 1.5824, + "step": 15620 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019198003783662068, + "loss": 1.5515, + "step": 15621 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001919681718869871, + "loss": 1.5779, + "step": 15622 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019195630565241282, + "loss": 1.4841, + "step": 15623 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019194443913297834, + "loss": 1.5615, + "step": 15624 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001919325723287643, + "loss": 1.5366, + "step": 15625 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019192070523985118, + "loss": 1.556, + "step": 15626 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019190883786631964, + "loss": 1.5118, + "step": 15627 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001918969702082502, + "loss": 1.5626, + "step": 15628 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001918851022657235, + "loss": 1.4779, + "step": 15629 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019187323403882005, + "loss": 1.5575, + "step": 15630 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019186136552762042, + "loss": 1.5381, + "step": 15631 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019184949673220527, + "loss": 1.4963, + "step": 15632 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019183762765265507, + "loss": 1.6265, + "step": 15633 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001918257582890505, + "loss": 1.5425, + "step": 15634 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019181388864147208, + "loss": 1.564, + "step": 15635 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019180201871000043, + "loss": 1.5523, + "step": 15636 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001917901484947162, + "loss": 1.512, + "step": 15637 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001917782779956999, + "loss": 1.5589, + "step": 15638 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019176640721303215, + "loss": 1.5267, + "step": 15639 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001917545361467935, + "loss": 1.5373, + "step": 15640 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019174266479706463, + "loss": 1.5363, + "step": 15641 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001917307931639261, + "loss": 1.5405, + "step": 15642 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019171892124745848, + "loss": 1.6082, + "step": 15643 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019170704904774246, + "loss": 1.5102, + "step": 15644 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019169517656485855, + "loss": 1.5453, + "step": 15645 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019168330379888741, + "loss": 1.5466, + "step": 15646 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019167143074990967, + "loss": 1.4927, + "step": 15647 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001916595574180059, + "loss": 1.524, + "step": 15648 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019164768380325672, + "loss": 1.5138, + "step": 15649 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001916358099057427, + "loss": 1.5623, + "step": 15650 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001916239357255446, + "loss": 1.5904, + "step": 15651 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001916120612627429, + "loss": 1.5203, + "step": 15652 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019160018651741823, + "loss": 1.5741, + "step": 15653 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019158831148965132, + "loss": 1.4969, + "step": 15654 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019157643617952267, + "loss": 1.5573, + "step": 15655 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019156456058711302, + "loss": 1.5118, + "step": 15656 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019155268471250287, + "loss": 1.5423, + "step": 15657 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019154080855577295, + "loss": 1.5487, + "step": 15658 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019152893211700386, + "loss": 1.5004, + "step": 15659 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019151705539627626, + "loss": 1.5202, + "step": 15660 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019150517839367078, + "loss": 1.564, + "step": 15661 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019149330110926802, + "loss": 1.5734, + "step": 15662 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001914814235431486, + "loss": 1.5204, + "step": 15663 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019146954569539327, + "loss": 1.5057, + "step": 15664 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019145766756608254, + "loss": 1.5695, + "step": 15665 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019144578915529723, + "loss": 1.5616, + "step": 15666 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001914339104631178, + "loss": 1.5376, + "step": 15667 + }, + { + "epoch": 1.23, + "learning_rate": 0.000191422031489625, + "loss": 1.5469, + "step": 15668 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019141015223489948, + "loss": 1.5365, + "step": 15669 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019139827269902188, + "loss": 1.5957, + "step": 15670 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019138639288207286, + "loss": 1.5247, + "step": 15671 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019137451278413304, + "loss": 1.5943, + "step": 15672 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001913626324052831, + "loss": 1.5685, + "step": 15673 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019135075174560372, + "loss": 1.5335, + "step": 15674 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019133887080517557, + "loss": 1.5765, + "step": 15675 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019132698958407936, + "loss": 1.5329, + "step": 15676 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019131510808239563, + "loss": 1.5387, + "step": 15677 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019130322630020512, + "loss": 1.5245, + "step": 15678 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001912913442375885, + "loss": 1.573, + "step": 15679 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019127946189462645, + "loss": 1.562, + "step": 15680 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001912675792713996, + "loss": 1.5585, + "step": 15681 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019125569636798867, + "loss": 1.5646, + "step": 15682 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019124381318447436, + "loss": 1.5904, + "step": 15683 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001912319297209373, + "loss": 1.5195, + "step": 15684 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019122004597745817, + "loss": 1.4962, + "step": 15685 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019120816195411774, + "loss": 1.5388, + "step": 15686 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019119627765099657, + "loss": 1.5533, + "step": 15687 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019118439306817545, + "loss": 1.5698, + "step": 15688 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019117250820573496, + "loss": 1.5423, + "step": 15689 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019116062306375592, + "loss": 1.495, + "step": 15690 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019114873764231892, + "loss": 1.5339, + "step": 15691 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019113685194150476, + "loss": 1.5414, + "step": 15692 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019112496596139405, + "loss": 1.5587, + "step": 15693 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019111307970206748, + "loss": 1.5393, + "step": 15694 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019110119316360588, + "loss": 1.4787, + "step": 15695 + }, + { + "epoch": 1.23, + "learning_rate": 0.00019108930634608977, + "loss": 1.5851, + "step": 15696 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019107741924959996, + "loss": 1.5245, + "step": 15697 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019106553187421717, + "loss": 1.5708, + "step": 15698 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019105364422002203, + "loss": 1.5585, + "step": 15699 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019104175628709534, + "loss": 1.5582, + "step": 15700 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019102986807551778, + "loss": 1.5151, + "step": 15701 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019101797958537002, + "loss": 1.5846, + "step": 15702 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019100609081673287, + "loss": 1.536, + "step": 15703 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019099420176968697, + "loss": 1.5119, + "step": 15704 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019098231244431304, + "loss": 1.5388, + "step": 15705 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019097042284069182, + "loss": 1.5839, + "step": 15706 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001909585329589041, + "loss": 1.5737, + "step": 15707 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019094664279903047, + "loss": 1.5683, + "step": 15708 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019093475236115178, + "loss": 1.5555, + "step": 15709 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019092286164534868, + "loss": 1.535, + "step": 15710 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019091097065170195, + "loss": 1.5372, + "step": 15711 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019089907938029234, + "loss": 1.5729, + "step": 15712 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019088718783120048, + "loss": 1.5736, + "step": 15713 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001908752960045072, + "loss": 1.5669, + "step": 15714 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019086340390029325, + "loss": 1.5714, + "step": 15715 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001908515115186393, + "loss": 1.5546, + "step": 15716 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001908396188596262, + "loss": 1.4973, + "step": 15717 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019082772592333454, + "loss": 1.5292, + "step": 15718 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019081583270984516, + "loss": 1.5718, + "step": 15719 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001908039392192388, + "loss": 1.5676, + "step": 15720 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019079204545159625, + "loss": 1.5055, + "step": 15721 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019078015140699823, + "loss": 1.5338, + "step": 15722 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001907682570855255, + "loss": 1.591, + "step": 15723 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019075636248725873, + "loss": 1.579, + "step": 15724 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019074446761227878, + "loss": 1.5756, + "step": 15725 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019073257246066637, + "loss": 1.5243, + "step": 15726 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019072067703250232, + "loss": 1.5699, + "step": 15727 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019070878132786728, + "loss": 1.596, + "step": 15728 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001906968853468421, + "loss": 1.5484, + "step": 15729 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019068498908950756, + "loss": 1.5405, + "step": 15730 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019067309255594436, + "loss": 1.5398, + "step": 15731 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019066119574623333, + "loss": 1.532, + "step": 15732 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001906492986604552, + "loss": 1.5269, + "step": 15733 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001906374012986908, + "loss": 1.506, + "step": 15734 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019062550366102083, + "loss": 1.5572, + "step": 15735 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019061360574752613, + "loss": 1.5257, + "step": 15736 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019060170755828745, + "loss": 1.5525, + "step": 15737 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019058980909338557, + "loss": 1.5779, + "step": 15738 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001905779103529013, + "loss": 1.5692, + "step": 15739 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019056601133691543, + "loss": 1.5157, + "step": 15740 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019055411204550867, + "loss": 1.5506, + "step": 15741 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019054221247876194, + "loss": 1.4872, + "step": 15742 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019053031263675593, + "loss": 1.5634, + "step": 15743 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019051841251957146, + "loss": 1.5241, + "step": 15744 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019050651212728934, + "loss": 1.5515, + "step": 15745 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019049461145999034, + "loss": 1.5341, + "step": 15746 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001904827105177553, + "loss": 1.5458, + "step": 15747 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019047080930066493, + "loss": 1.5631, + "step": 15748 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019045890780880018, + "loss": 1.5403, + "step": 15749 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019044700604224174, + "loss": 1.5799, + "step": 15750 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019043510400107048, + "loss": 1.568, + "step": 15751 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019042320168536709, + "loss": 1.5096, + "step": 15752 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019041129909521258, + "loss": 1.5115, + "step": 15753 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001903993962306876, + "loss": 1.5873, + "step": 15754 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019038749309187298, + "loss": 1.5625, + "step": 15755 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019037558967884962, + "loss": 1.5459, + "step": 15756 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019036368599169827, + "loss": 1.5563, + "step": 15757 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019035178203049975, + "loss": 1.5733, + "step": 15758 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001903398777953349, + "loss": 1.5341, + "step": 15759 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019032797328628453, + "loss": 1.5545, + "step": 15760 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019031606850342952, + "loss": 1.5542, + "step": 15761 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019030416344685062, + "loss": 1.5284, + "step": 15762 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019029225811662874, + "loss": 1.5279, + "step": 15763 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001902803525128446, + "loss": 1.5346, + "step": 15764 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001902684466355791, + "loss": 1.5057, + "step": 15765 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019025654048491312, + "loss": 1.5061, + "step": 15766 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001902446340609274, + "loss": 1.5703, + "step": 15767 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019023272736370283, + "loss": 1.5178, + "step": 15768 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019022082039332026, + "loss": 1.5885, + "step": 15769 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001902089131498605, + "loss": 1.5536, + "step": 15770 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001901970056334044, + "loss": 1.5338, + "step": 15771 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019018509784403287, + "loss": 1.5013, + "step": 15772 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019017318978182667, + "loss": 1.4668, + "step": 15773 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019016128144686665, + "loss": 1.5578, + "step": 15774 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019014937283923371, + "loss": 1.4846, + "step": 15775 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001901374639590087, + "loss": 1.561, + "step": 15776 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019012555480627243, + "loss": 1.4877, + "step": 15777 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019011364538110582, + "loss": 1.5195, + "step": 15778 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019010173568358968, + "loss": 1.5048, + "step": 15779 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001900898257138049, + "loss": 1.5207, + "step": 15780 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001900779154718323, + "loss": 1.4877, + "step": 15781 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001900660049577528, + "loss": 1.5001, + "step": 15782 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019005409417164717, + "loss": 1.5126, + "step": 15783 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001900421831135964, + "loss": 1.5801, + "step": 15784 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019003027178368133, + "loss": 1.5464, + "step": 15785 + }, + { + "epoch": 1.24, + "learning_rate": 0.00019001836018198273, + "loss": 1.5249, + "step": 15786 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001900064483085816, + "loss": 1.5266, + "step": 15787 + }, + { + "epoch": 1.24, + "learning_rate": 0.00018999453616355875, + "loss": 1.576, + "step": 15788 + }, + { + "epoch": 1.24, + "learning_rate": 0.00018998262374699508, + "loss": 1.5322, + "step": 15789 + }, + { + "epoch": 1.24, + "learning_rate": 0.00018997071105897147, + "loss": 1.5467, + "step": 15790 + }, + { + "epoch": 1.24, + "learning_rate": 0.00018995879809956872, + "loss": 1.5526, + "step": 15791 + }, + { + "epoch": 1.24, + "learning_rate": 0.00018994688486886788, + "loss": 1.5294, + "step": 15792 + }, + { + "epoch": 1.24, + "learning_rate": 0.00018993497136694969, + "loss": 1.4968, + "step": 15793 + }, + { + "epoch": 1.24, + "learning_rate": 0.00018992305759389506, + "loss": 1.5448, + "step": 15794 + }, + { + "epoch": 1.24, + "learning_rate": 0.00018991114354978495, + "loss": 1.563, + "step": 15795 + }, + { + "epoch": 1.24, + "learning_rate": 0.00018989922923470017, + "loss": 1.4871, + "step": 15796 + }, + { + "epoch": 1.24, + "learning_rate": 0.00018988731464872165, + "loss": 1.535, + "step": 15797 + }, + { + "epoch": 1.24, + "learning_rate": 0.00018987539979193024, + "loss": 1.5231, + "step": 15798 + }, + { + "epoch": 1.24, + "learning_rate": 0.00018986348466440688, + "loss": 1.5591, + "step": 15799 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001898515692662325, + "loss": 1.521, + "step": 15800 + }, + { + "epoch": 1.24, + "learning_rate": 0.00018983965359748792, + "loss": 1.5099, + "step": 15801 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001898277376582541, + "loss": 1.5732, + "step": 15802 + }, + { + "epoch": 1.24, + "learning_rate": 0.00018981582144861193, + "loss": 1.5631, + "step": 15803 + }, + { + "epoch": 1.24, + "learning_rate": 0.00018980390496864229, + "loss": 1.543, + "step": 15804 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001897919882184261, + "loss": 1.6359, + "step": 15805 + }, + { + "epoch": 1.24, + "learning_rate": 0.00018978007119804425, + "loss": 1.5357, + "step": 15806 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001897681539075777, + "loss": 1.4954, + "step": 15807 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001897562363471073, + "loss": 1.5612, + "step": 15808 + }, + { + "epoch": 1.24, + "learning_rate": 0.00018974431851671403, + "loss": 1.5287, + "step": 15809 + }, + { + "epoch": 1.24, + "learning_rate": 0.00018973240041647872, + "loss": 1.532, + "step": 15810 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001897204820464824, + "loss": 1.5264, + "step": 15811 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001897085634068059, + "loss": 1.5696, + "step": 15812 + }, + { + "epoch": 1.24, + "learning_rate": 0.00018969664449753015, + "loss": 1.5657, + "step": 15813 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001896847253187361, + "loss": 1.5496, + "step": 15814 + }, + { + "epoch": 1.24, + "learning_rate": 0.00018967280587050466, + "loss": 1.575, + "step": 15815 + }, + { + "epoch": 1.24, + "learning_rate": 0.00018966088615291675, + "loss": 1.5412, + "step": 15816 + }, + { + "epoch": 1.24, + "learning_rate": 0.00018964896616605336, + "loss": 1.5547, + "step": 15817 + }, + { + "epoch": 1.24, + "learning_rate": 0.00018963704590999533, + "loss": 1.5609, + "step": 15818 + }, + { + "epoch": 1.24, + "learning_rate": 0.00018962512538482363, + "loss": 1.5378, + "step": 15819 + }, + { + "epoch": 1.24, + "learning_rate": 0.00018961320459061923, + "loss": 1.4814, + "step": 15820 + }, + { + "epoch": 1.24, + "learning_rate": 0.000189601283527463, + "loss": 1.5026, + "step": 15821 + }, + { + "epoch": 1.24, + "learning_rate": 0.00018958936219543593, + "loss": 1.459, + "step": 15822 + }, + { + "epoch": 1.24, + "learning_rate": 0.00018957744059461889, + "loss": 1.5945, + "step": 15823 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018956551872509293, + "loss": 1.518, + "step": 15824 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001895535965869389, + "loss": 1.4968, + "step": 15825 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018954167418023773, + "loss": 1.509, + "step": 15826 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018952975150507052, + "loss": 1.5373, + "step": 15827 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018951782856151803, + "loss": 1.5718, + "step": 15828 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018950590534966134, + "loss": 1.5304, + "step": 15829 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001894939818695813, + "loss": 1.5283, + "step": 15830 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018948205812135898, + "loss": 1.5605, + "step": 15831 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001894701341050752, + "loss": 1.5406, + "step": 15832 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018945820982081105, + "loss": 1.5533, + "step": 15833 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018944628526864745, + "loss": 1.5817, + "step": 15834 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001894343604486653, + "loss": 1.5319, + "step": 15835 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001894224353609456, + "loss": 1.5298, + "step": 15836 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018941051000556932, + "loss": 1.491, + "step": 15837 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018939858438261743, + "loss": 1.6156, + "step": 15838 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018938665849217089, + "loss": 1.602, + "step": 15839 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018937473233431067, + "loss": 1.5206, + "step": 15840 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018936280590911775, + "loss": 1.5651, + "step": 15841 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018935087921667312, + "loss": 1.5918, + "step": 15842 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001893389522570577, + "loss": 1.5343, + "step": 15843 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018932702503035259, + "loss": 1.4804, + "step": 15844 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018931509753663858, + "loss": 1.6006, + "step": 15845 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001893031697759968, + "loss": 1.5025, + "step": 15846 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018929124174850816, + "loss": 1.5122, + "step": 15847 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018927931345425372, + "loss": 1.5613, + "step": 15848 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001892673848933144, + "loss": 1.4411, + "step": 15849 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018925545606577118, + "loss": 1.567, + "step": 15850 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001892435269717051, + "loss": 1.5886, + "step": 15851 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018923159761119712, + "loss": 1.5452, + "step": 15852 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018921966798432824, + "loss": 1.5224, + "step": 15853 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018920773809117942, + "loss": 1.5968, + "step": 15854 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018919580793183173, + "loss": 1.5424, + "step": 15855 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018918387750636615, + "loss": 1.6028, + "step": 15856 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018917194681486365, + "loss": 1.577, + "step": 15857 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001891600158574053, + "loss": 1.5302, + "step": 15858 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018914808463407198, + "loss": 1.5487, + "step": 15859 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018913615314494476, + "loss": 1.5217, + "step": 15860 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018912422139010475, + "loss": 1.5959, + "step": 15861 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018911228936963274, + "loss": 1.5415, + "step": 15862 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018910035708360996, + "loss": 1.569, + "step": 15863 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018908842453211732, + "loss": 1.5469, + "step": 15864 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018907649171523585, + "loss": 1.5738, + "step": 15865 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018906455863304652, + "loss": 1.5368, + "step": 15866 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018905262528563042, + "loss": 1.5784, + "step": 15867 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001890406916730686, + "loss": 1.5544, + "step": 15868 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018902875779544198, + "loss": 1.5348, + "step": 15869 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001890168236528316, + "loss": 1.5425, + "step": 15870 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018900488924531857, + "loss": 1.5462, + "step": 15871 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018899295457298383, + "loss": 1.4881, + "step": 15872 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018898101963590847, + "loss": 1.5275, + "step": 15873 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001889690844341735, + "loss": 1.541, + "step": 15874 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018895714896785995, + "loss": 1.5289, + "step": 15875 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018894521323704886, + "loss": 1.6397, + "step": 15876 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018893327724182126, + "loss": 1.5883, + "step": 15877 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018892134098225815, + "loss": 1.5596, + "step": 15878 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018890940445844066, + "loss": 1.5165, + "step": 15879 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018889746767044977, + "loss": 1.4925, + "step": 15880 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018888553061836657, + "loss": 1.5415, + "step": 15881 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018887359330227202, + "loss": 1.5788, + "step": 15882 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018886165572224727, + "loss": 1.5161, + "step": 15883 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001888497178783733, + "loss": 1.5636, + "step": 15884 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001888377797707312, + "loss": 1.4557, + "step": 15885 + }, + { + "epoch": 1.25, + "learning_rate": 0.000188825841399402, + "loss": 1.5241, + "step": 15886 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018881390276446677, + "loss": 1.4744, + "step": 15887 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018880196386600656, + "loss": 1.5224, + "step": 15888 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001887900247041024, + "loss": 1.5253, + "step": 15889 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001887780852788354, + "loss": 1.5266, + "step": 15890 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018876614559028664, + "loss": 1.5128, + "step": 15891 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018875420563853714, + "loss": 1.5576, + "step": 15892 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018874226542366787, + "loss": 1.6258, + "step": 15893 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018873032494576007, + "loss": 1.6111, + "step": 15894 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018871838420489472, + "loss": 1.5743, + "step": 15895 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018870644320115293, + "loss": 1.5261, + "step": 15896 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018869450193461574, + "loss": 1.5348, + "step": 15897 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018868256040536425, + "loss": 1.5564, + "step": 15898 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001886706186134795, + "loss": 1.5165, + "step": 15899 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001886586765590426, + "loss": 1.5267, + "step": 15900 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001886467342421346, + "loss": 1.5372, + "step": 15901 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018863479166283663, + "loss": 1.563, + "step": 15902 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018862284882122972, + "loss": 1.5201, + "step": 15903 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018861090571739502, + "loss": 1.5588, + "step": 15904 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018859896235141354, + "loss": 1.5442, + "step": 15905 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001885870187233664, + "loss": 1.5021, + "step": 15906 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018857507483333472, + "loss": 1.5268, + "step": 15907 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018856313068139956, + "loss": 1.5341, + "step": 15908 + }, + { + "epoch": 1.25, + "learning_rate": 0.000188551186267642, + "loss": 1.5674, + "step": 15909 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018853924159214317, + "loss": 1.5776, + "step": 15910 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001885272966549842, + "loss": 1.6151, + "step": 15911 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018851535145624615, + "loss": 1.5334, + "step": 15912 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018850340599601008, + "loss": 1.5314, + "step": 15913 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018849146027435714, + "loss": 1.5524, + "step": 15914 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018847951429136844, + "loss": 1.5038, + "step": 15915 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018846756804712504, + "loss": 1.5775, + "step": 15916 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018845562154170807, + "loss": 1.5653, + "step": 15917 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001884436747751987, + "loss": 1.5234, + "step": 15918 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018843172774767798, + "loss": 1.5195, + "step": 15919 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018841978045922703, + "loss": 1.5072, + "step": 15920 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018840783290992698, + "loss": 1.5882, + "step": 15921 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001883958850998589, + "loss": 1.5268, + "step": 15922 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018838393702910402, + "loss": 1.5604, + "step": 15923 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018837198869774333, + "loss": 1.5405, + "step": 15924 + }, + { + "epoch": 1.25, + "learning_rate": 0.000188360040105858, + "loss": 1.5308, + "step": 15925 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018834809125352925, + "loss": 1.5461, + "step": 15926 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018833614214083802, + "loss": 1.5669, + "step": 15927 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001883241927678656, + "loss": 1.5485, + "step": 15928 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001883122431346931, + "loss": 1.5032, + "step": 15929 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018830029324140153, + "loss": 1.5449, + "step": 15930 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018828834308807216, + "loss": 1.5472, + "step": 15931 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018827639267478605, + "loss": 1.5531, + "step": 15932 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018826444200162437, + "loss": 1.6052, + "step": 15933 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018825249106866818, + "loss": 1.5357, + "step": 15934 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018824053987599875, + "loss": 1.5898, + "step": 15935 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018822858842369717, + "loss": 1.6027, + "step": 15936 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018821663671184452, + "loss": 1.552, + "step": 15937 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018820468474052202, + "loss": 1.5263, + "step": 15938 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001881927325098108, + "loss": 1.5576, + "step": 15939 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018818078001979195, + "loss": 1.5184, + "step": 15940 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018816882727054678, + "loss": 1.5782, + "step": 15941 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018815687426215622, + "loss": 1.5074, + "step": 15942 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018814492099470165, + "loss": 1.5377, + "step": 15943 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018813296746826404, + "loss": 1.5935, + "step": 15944 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018812101368292464, + "loss": 1.5405, + "step": 15945 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018810905963876463, + "loss": 1.4968, + "step": 15946 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018809710533586508, + "loss": 1.5554, + "step": 15947 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018808515077430726, + "loss": 1.5266, + "step": 15948 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018807319595417224, + "loss": 1.5415, + "step": 15949 + }, + { + "epoch": 1.25, + "learning_rate": 0.00018806124087554125, + "loss": 1.5325, + "step": 15950 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018804928553849544, + "loss": 1.5814, + "step": 15951 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018803732994311596, + "loss": 1.5257, + "step": 15952 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018802537408948406, + "loss": 1.5159, + "step": 15953 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001880134179776808, + "loss": 1.5492, + "step": 15954 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001880014616077874, + "loss": 1.5443, + "step": 15955 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018798950497988503, + "loss": 1.536, + "step": 15956 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018797754809405493, + "loss": 1.5713, + "step": 15957 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018796559095037827, + "loss": 1.5305, + "step": 15958 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018795363354893614, + "loss": 1.5269, + "step": 15959 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001879416758898098, + "loss": 1.5304, + "step": 15960 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001879297179730804, + "loss": 1.5577, + "step": 15961 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018791775979882917, + "loss": 1.5741, + "step": 15962 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001879058013671373, + "loss": 1.4847, + "step": 15963 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018789384267808588, + "loss": 1.5443, + "step": 15964 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018788188373175624, + "loss": 1.4956, + "step": 15965 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001878699245282295, + "loss": 1.4862, + "step": 15966 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018785796506758687, + "loss": 1.5355, + "step": 15967 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018784600534990957, + "loss": 1.5959, + "step": 15968 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018783404537527873, + "loss": 1.541, + "step": 15969 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018782208514377566, + "loss": 1.4895, + "step": 15970 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001878101246554815, + "loss": 1.5319, + "step": 15971 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001877981639104774, + "loss": 1.5269, + "step": 15972 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018778620290884465, + "loss": 1.4808, + "step": 15973 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001877742416506644, + "loss": 1.4698, + "step": 15974 + }, + { + "epoch": 1.26, + "learning_rate": 0.000187762280136018, + "loss": 1.5444, + "step": 15975 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018775031836498646, + "loss": 1.5619, + "step": 15976 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018773835633765116, + "loss": 1.5346, + "step": 15977 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001877263940540932, + "loss": 1.5251, + "step": 15978 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018771443151439384, + "loss": 1.5425, + "step": 15979 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001877024687186343, + "loss": 1.4757, + "step": 15980 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018769050566689582, + "loss": 1.5543, + "step": 15981 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018767854235925962, + "loss": 1.5386, + "step": 15982 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001876665787958069, + "loss": 1.5693, + "step": 15983 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018765461497661888, + "loss": 1.5434, + "step": 15984 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018764265090177686, + "loss": 1.4914, + "step": 15985 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018763068657136193, + "loss": 1.5551, + "step": 15986 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001876187219854555, + "loss": 1.5183, + "step": 15987 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001876067571441386, + "loss": 1.6135, + "step": 15988 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018759479204749264, + "loss": 1.4975, + "step": 15989 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018758282669559877, + "loss": 1.5336, + "step": 15990 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018757086108853822, + "loss": 1.517, + "step": 15991 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001875588952263923, + "loss": 1.567, + "step": 15992 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001875469291092422, + "loss": 1.6004, + "step": 15993 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018753496273716917, + "loss": 1.4991, + "step": 15994 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018752299611025442, + "loss": 1.5488, + "step": 15995 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001875110292285793, + "loss": 1.5294, + "step": 15996 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018749906209222493, + "loss": 1.5572, + "step": 15997 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018748709470127266, + "loss": 1.5409, + "step": 15998 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001874751270558037, + "loss": 1.5799, + "step": 15999 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001874631591558993, + "loss": 1.4787, + "step": 16000 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001874511910016407, + "loss": 1.5003, + "step": 16001 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018743922259310922, + "loss": 1.4867, + "step": 16002 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018742725393038607, + "loss": 1.5557, + "step": 16003 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018741528501355252, + "loss": 1.5168, + "step": 16004 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001874033158426898, + "loss": 1.5286, + "step": 16005 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018739134641787924, + "loss": 1.5096, + "step": 16006 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001873793767392021, + "loss": 1.5714, + "step": 16007 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018736740680673955, + "loss": 1.5272, + "step": 16008 + }, + { + "epoch": 1.26, + "learning_rate": 0.000187355436620573, + "loss": 1.5544, + "step": 16009 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001873434661807836, + "loss": 1.5909, + "step": 16010 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001873314954874527, + "loss": 1.5793, + "step": 16011 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001873195245406615, + "loss": 1.5961, + "step": 16012 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018730755334049135, + "loss": 1.4928, + "step": 16013 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001872955818870235, + "loss": 1.5728, + "step": 16014 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018728361018033923, + "loss": 1.5679, + "step": 16015 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018727163822051984, + "loss": 1.5537, + "step": 16016 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018725966600764658, + "loss": 1.5618, + "step": 16017 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018724769354180074, + "loss": 1.5435, + "step": 16018 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018723572082306362, + "loss": 1.4966, + "step": 16019 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001872237478515165, + "loss": 1.5627, + "step": 16020 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001872117746272407, + "loss": 1.5154, + "step": 16021 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001871998011503175, + "loss": 1.5456, + "step": 16022 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018718782742082812, + "loss": 1.5797, + "step": 16023 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018717585343885397, + "loss": 1.5726, + "step": 16024 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018716387920447627, + "loss": 1.4868, + "step": 16025 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018715190471777632, + "loss": 1.5797, + "step": 16026 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018713992997883543, + "loss": 1.5633, + "step": 16027 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018712795498773495, + "loss": 1.561, + "step": 16028 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018711597974455611, + "loss": 1.5315, + "step": 16029 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018710400424938026, + "loss": 1.5496, + "step": 16030 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018709202850228875, + "loss": 1.5872, + "step": 16031 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018708005250336275, + "loss": 1.5392, + "step": 16032 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018706807625268372, + "loss": 1.5468, + "step": 16033 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018705609975033286, + "loss": 1.5304, + "step": 16034 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018704412299639153, + "loss": 1.5104, + "step": 16035 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001870321459909411, + "loss": 1.4969, + "step": 16036 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018702016873406278, + "loss": 1.5404, + "step": 16037 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018700819122583802, + "loss": 1.6017, + "step": 16038 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018699621346634802, + "loss": 1.5327, + "step": 16039 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018698423545567412, + "loss": 1.5352, + "step": 16040 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001869722571938977, + "loss": 1.5137, + "step": 16041 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018696027868110005, + "loss": 1.5624, + "step": 16042 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001869482999173625, + "loss": 1.5032, + "step": 16043 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018693632090276637, + "loss": 1.5137, + "step": 16044 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018692434163739306, + "loss": 1.5151, + "step": 16045 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001869123621213238, + "loss": 1.5524, + "step": 16046 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018690038235463996, + "loss": 1.558, + "step": 16047 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018688840233742292, + "loss": 1.5553, + "step": 16048 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018687642206975398, + "loss": 1.5292, + "step": 16049 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018686444155171443, + "loss": 1.539, + "step": 16050 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018685246078338572, + "loss": 1.5558, + "step": 16051 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001868404797648491, + "loss": 1.5187, + "step": 16052 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018682849849618603, + "loss": 1.4791, + "step": 16053 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018681651697747772, + "loss": 1.5564, + "step": 16054 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001868045352088056, + "loss": 1.5378, + "step": 16055 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018679255319025098, + "loss": 1.5616, + "step": 16056 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018678057092189523, + "loss": 1.5334, + "step": 16057 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001867685884038197, + "loss": 1.5234, + "step": 16058 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018675660563610575, + "loss": 1.5612, + "step": 16059 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018674462261883472, + "loss": 1.5281, + "step": 16060 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018673263935208798, + "loss": 1.5321, + "step": 16061 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018672065583594688, + "loss": 1.517, + "step": 16062 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018670867207049285, + "loss": 1.5185, + "step": 16063 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018669668805580713, + "loss": 1.6226, + "step": 16064 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001866847037919712, + "loss": 1.5189, + "step": 16065 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018667271927906633, + "loss": 1.5444, + "step": 16066 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018666073451717395, + "loss": 1.561, + "step": 16067 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018664874950637543, + "loss": 1.4931, + "step": 16068 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018663676424675207, + "loss": 1.5598, + "step": 16069 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001866247787383854, + "loss": 1.5138, + "step": 16070 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001866127929813566, + "loss": 1.5917, + "step": 16071 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018660080697574722, + "loss": 1.5625, + "step": 16072 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001865888207216385, + "loss": 1.565, + "step": 16073 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018657683421911185, + "loss": 1.5991, + "step": 16074 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018656484746824872, + "loss": 1.552, + "step": 16075 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018655286046913045, + "loss": 1.5415, + "step": 16076 + }, + { + "epoch": 1.26, + "learning_rate": 0.00018654087322183847, + "loss": 1.4865, + "step": 16077 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018652888572645405, + "loss": 1.541, + "step": 16078 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018651689798305872, + "loss": 1.483, + "step": 16079 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018650490999173378, + "loss": 1.5677, + "step": 16080 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018649292175256066, + "loss": 1.5612, + "step": 16081 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018648093326562067, + "loss": 1.5357, + "step": 16082 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018646894453099535, + "loss": 1.5028, + "step": 16083 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018645695554876603, + "loss": 1.5369, + "step": 16084 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018644496631901403, + "loss": 1.5109, + "step": 16085 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018643297684182089, + "loss": 1.5716, + "step": 16086 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018642098711726794, + "loss": 1.5661, + "step": 16087 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001864089971454365, + "loss": 1.5542, + "step": 16088 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018639700692640816, + "loss": 1.5849, + "step": 16089 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018638501646026415, + "loss": 1.5293, + "step": 16090 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018637302574708598, + "loss": 1.4936, + "step": 16091 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001863610347869551, + "loss": 1.5526, + "step": 16092 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001863490435799528, + "loss": 1.496, + "step": 16093 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001863370521261606, + "loss": 1.5401, + "step": 16094 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018632506042565983, + "loss": 1.5782, + "step": 16095 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018631306847853194, + "loss": 1.5531, + "step": 16096 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018630107628485838, + "loss": 1.5362, + "step": 16097 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018628908384472052, + "loss": 1.536, + "step": 16098 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018627709115819982, + "loss": 1.5392, + "step": 16099 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001862650982253777, + "loss": 1.5728, + "step": 16100 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018625310504633558, + "loss": 1.5661, + "step": 16101 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018624111162115486, + "loss": 1.5453, + "step": 16102 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018622911794991697, + "loss": 1.609, + "step": 16103 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001862171240327034, + "loss": 1.5424, + "step": 16104 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018620512986959552, + "loss": 1.5235, + "step": 16105 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018619313546067482, + "loss": 1.5003, + "step": 16106 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018618114080602268, + "loss": 1.5863, + "step": 16107 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018616914590572056, + "loss": 1.5202, + "step": 16108 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018615715075984992, + "loss": 1.5319, + "step": 16109 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018614515536849213, + "loss": 1.5064, + "step": 16110 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018613315973172877, + "loss": 1.5264, + "step": 16111 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018612116384964113, + "loss": 1.5662, + "step": 16112 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001861091677223107, + "loss": 1.5342, + "step": 16113 + }, + { + "epoch": 1.27, + "learning_rate": 0.000186097171349819, + "loss": 1.5122, + "step": 16114 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018608517473224737, + "loss": 1.5785, + "step": 16115 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018607317786967738, + "loss": 1.52, + "step": 16116 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001860611807621904, + "loss": 1.5243, + "step": 16117 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018604918340986787, + "loss": 1.5548, + "step": 16118 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018603718581279135, + "loss": 1.5259, + "step": 16119 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018602518797104214, + "loss": 1.5481, + "step": 16120 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018601318988470183, + "loss": 1.5218, + "step": 16121 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001860011915538518, + "loss": 1.524, + "step": 16122 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001859891929785736, + "loss": 1.6125, + "step": 16123 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018597719415894861, + "loss": 1.5717, + "step": 16124 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018596519509505834, + "loss": 1.5595, + "step": 16125 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018595319578698424, + "loss": 1.545, + "step": 16126 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018594119623480777, + "loss": 1.5036, + "step": 16127 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018592919643861043, + "loss": 1.5419, + "step": 16128 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018591719639847362, + "loss": 1.5032, + "step": 16129 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018590519611447892, + "loss": 1.5154, + "step": 16130 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018589319558670774, + "loss": 1.5756, + "step": 16131 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018588119481524154, + "loss": 1.5617, + "step": 16132 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018586919380016186, + "loss": 1.6139, + "step": 16133 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001858571925415502, + "loss": 1.5108, + "step": 16134 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001858451910394879, + "loss": 1.503, + "step": 16135 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018583318929405658, + "loss": 1.5713, + "step": 16136 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001858211873053376, + "loss": 1.5215, + "step": 16137 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018580918507341265, + "loss": 1.4984, + "step": 16138 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018579718259836302, + "loss": 1.5506, + "step": 16139 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018578517988027032, + "loss": 1.556, + "step": 16140 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018577317691921598, + "loss": 1.5268, + "step": 16141 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018576117371528147, + "loss": 1.4886, + "step": 16142 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018574917026854837, + "loss": 1.5295, + "step": 16143 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018573716657909812, + "loss": 1.5579, + "step": 16144 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001857251626470122, + "loss": 1.5711, + "step": 16145 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018571315847237216, + "loss": 1.5487, + "step": 16146 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018570115405525946, + "loss": 1.5532, + "step": 16147 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001856891493957557, + "loss": 1.5378, + "step": 16148 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018567714449394223, + "loss": 1.5337, + "step": 16149 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018566513934990074, + "loss": 1.5262, + "step": 16150 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018565313396371253, + "loss": 1.5598, + "step": 16151 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018564112833545926, + "loss": 1.5849, + "step": 16152 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018562912246522238, + "loss": 1.5005, + "step": 16153 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001856171163530834, + "loss": 1.5619, + "step": 16154 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018560510999912394, + "loss": 1.5534, + "step": 16155 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018559310340342537, + "loss": 1.5313, + "step": 16156 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018558109656606928, + "loss": 1.5594, + "step": 16157 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018556908948713717, + "loss": 1.5581, + "step": 16158 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018555708216671057, + "loss": 1.5564, + "step": 16159 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018554507460487101, + "loss": 1.561, + "step": 16160 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018553306680169998, + "loss": 1.5255, + "step": 16161 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001855210587572791, + "loss": 1.5315, + "step": 16162 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018550905047168978, + "loss": 1.5123, + "step": 16163 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018549704194501361, + "loss": 1.5042, + "step": 16164 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018548503317733216, + "loss": 1.601, + "step": 16165 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018547302416872688, + "loss": 1.4985, + "step": 16166 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018546101491927937, + "loss": 1.5718, + "step": 16167 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018544900542907106, + "loss": 1.5578, + "step": 16168 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018543699569818363, + "loss": 1.5932, + "step": 16169 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018542498572669854, + "loss": 1.5504, + "step": 16170 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018541297551469735, + "loss": 1.5074, + "step": 16171 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001854009650622616, + "loss": 1.5613, + "step": 16172 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001853889543694728, + "loss": 1.5938, + "step": 16173 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018537694343641258, + "loss": 1.5873, + "step": 16174 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018536493226316246, + "loss": 1.5475, + "step": 16175 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018535292084980384, + "loss": 1.531, + "step": 16176 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001853409091964185, + "loss": 1.5847, + "step": 16177 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018532889730308788, + "loss": 1.5179, + "step": 16178 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018531688516989356, + "loss": 1.5188, + "step": 16179 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018530487279691703, + "loss": 1.5563, + "step": 16180 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001852928601842399, + "loss": 1.5603, + "step": 16181 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018528084733194377, + "loss": 1.5418, + "step": 16182 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018526883424011014, + "loss": 1.5707, + "step": 16183 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018525682090882056, + "loss": 1.5678, + "step": 16184 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018524480733815663, + "loss": 1.5679, + "step": 16185 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018523279352819993, + "loss": 1.5433, + "step": 16186 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018522077947903198, + "loss": 1.5412, + "step": 16187 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001852087651907344, + "loss": 1.4944, + "step": 16188 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018519675066338873, + "loss": 1.5503, + "step": 16189 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018518473589707653, + "loss": 1.5878, + "step": 16190 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001851727208918794, + "loss": 1.5277, + "step": 16191 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018516070564787888, + "loss": 1.5297, + "step": 16192 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018514869016515658, + "loss": 1.4969, + "step": 16193 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001851366744437941, + "loss": 1.5299, + "step": 16194 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018512465848387298, + "loss": 1.5614, + "step": 16195 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018511264228547483, + "loss": 1.5086, + "step": 16196 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018510062584868117, + "loss": 1.5255, + "step": 16197 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018508860917357365, + "loss": 1.5199, + "step": 16198 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018507659226023386, + "loss": 1.5475, + "step": 16199 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018506457510874332, + "loss": 1.5532, + "step": 16200 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001850525577191837, + "loss": 1.5411, + "step": 16201 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018504054009163654, + "loss": 1.5379, + "step": 16202 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018502852222618344, + "loss": 1.6073, + "step": 16203 + }, + { + "epoch": 1.27, + "learning_rate": 0.00018501650412290605, + "loss": 1.5748, + "step": 16204 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018500448578188586, + "loss": 1.5352, + "step": 16205 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001849924672032046, + "loss": 1.5247, + "step": 16206 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018498044838694377, + "loss": 1.51, + "step": 16207 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018496842933318495, + "loss": 1.5267, + "step": 16208 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018495641004200982, + "loss": 1.521, + "step": 16209 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018494439051349997, + "loss": 1.5191, + "step": 16210 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018493237074773702, + "loss": 1.5537, + "step": 16211 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001849203507448025, + "loss": 1.5179, + "step": 16212 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001849083305047781, + "loss": 1.5208, + "step": 16213 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018489631002774538, + "loss": 1.4723, + "step": 16214 + }, + { + "epoch": 1.28, + "learning_rate": 0.000184884289313786, + "loss": 1.5339, + "step": 16215 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018487226836298148, + "loss": 1.5938, + "step": 16216 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018486024717541353, + "loss": 1.5272, + "step": 16217 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001848482257511638, + "loss": 1.559, + "step": 16218 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001848362040903138, + "loss": 1.5537, + "step": 16219 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001848241821929452, + "loss": 1.5153, + "step": 16220 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018481216005913963, + "loss": 1.6079, + "step": 16221 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001848001376889787, + "loss": 1.5449, + "step": 16222 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018478811508254402, + "loss": 1.5562, + "step": 16223 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018477609223991725, + "loss": 1.5585, + "step": 16224 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018476406916118003, + "loss": 1.5982, + "step": 16225 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018475204584641393, + "loss": 1.5529, + "step": 16226 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018474002229570063, + "loss": 1.5682, + "step": 16227 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018472799850912178, + "loss": 1.5291, + "step": 16228 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018471597448675896, + "loss": 1.5762, + "step": 16229 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001847039502286938, + "loss": 1.4917, + "step": 16230 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018469192573500798, + "loss": 1.5223, + "step": 16231 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018467990100578315, + "loss": 1.4914, + "step": 16232 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018466787604110095, + "loss": 1.5575, + "step": 16233 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018465585084104295, + "loss": 1.5049, + "step": 16234 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001846438254056909, + "loss": 1.5342, + "step": 16235 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018463179973512636, + "loss": 1.5454, + "step": 16236 + }, + { + "epoch": 1.28, + "learning_rate": 0.000184619773829431, + "loss": 1.5202, + "step": 16237 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001846077476886865, + "loss": 1.5499, + "step": 16238 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018459572131297448, + "loss": 1.5045, + "step": 16239 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018458369470237662, + "loss": 1.5654, + "step": 16240 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018457166785697458, + "loss": 1.5415, + "step": 16241 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018455964077684995, + "loss": 1.5255, + "step": 16242 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018454761346208446, + "loss": 1.5054, + "step": 16243 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001845355859127597, + "loss": 1.4795, + "step": 16244 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001845235581289574, + "loss": 1.6051, + "step": 16245 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001845115301107592, + "loss": 1.549, + "step": 16246 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018449950185824674, + "loss": 1.5173, + "step": 16247 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001844874733715017, + "loss": 1.5672, + "step": 16248 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018447544465060575, + "loss": 1.4803, + "step": 16249 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001844634156956406, + "loss": 1.5282, + "step": 16250 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001844513865066878, + "loss": 1.5816, + "step": 16251 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018443935708382914, + "loss": 1.5581, + "step": 16252 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018442732742714624, + "loss": 1.5028, + "step": 16253 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001844152975367208, + "loss": 1.5223, + "step": 16254 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018440326741263444, + "loss": 1.5815, + "step": 16255 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001843912370549689, + "loss": 1.5986, + "step": 16256 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018437920646380588, + "loss": 1.5791, + "step": 16257 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018436717563922696, + "loss": 1.5264, + "step": 16258 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018435514458131391, + "loss": 1.5815, + "step": 16259 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001843431132901484, + "loss": 1.5245, + "step": 16260 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001843310817658121, + "loss": 1.5498, + "step": 16261 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018431905000838668, + "loss": 1.5339, + "step": 16262 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018430701801795384, + "loss": 1.5394, + "step": 16263 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001842949857945953, + "loss": 1.5574, + "step": 16264 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018428295333839273, + "loss": 1.5012, + "step": 16265 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018427092064942784, + "loss": 1.5295, + "step": 16266 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001842588877277823, + "loss": 1.4922, + "step": 16267 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018424685457353783, + "loss": 1.5144, + "step": 16268 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018423482118677613, + "loss": 1.5183, + "step": 16269 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001842227875675788, + "loss": 1.4895, + "step": 16270 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018421075371602771, + "loss": 1.5725, + "step": 16271 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018419871963220447, + "loss": 1.53, + "step": 16272 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018418668531619076, + "loss": 1.5995, + "step": 16273 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018417465076806837, + "loss": 1.5411, + "step": 16274 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018416261598791893, + "loss": 1.4631, + "step": 16275 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018415058097582418, + "loss": 1.5379, + "step": 16276 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018413854573186584, + "loss": 1.5593, + "step": 16277 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018412651025612558, + "loss": 1.5401, + "step": 16278 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018411447454868518, + "loss": 1.5205, + "step": 16279 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018410243860962635, + "loss": 1.5612, + "step": 16280 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018409040243903076, + "loss": 1.5466, + "step": 16281 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018407836603698014, + "loss": 1.5547, + "step": 16282 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018406632940355623, + "loss": 1.5945, + "step": 16283 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018405429253884074, + "loss": 1.5114, + "step": 16284 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001840422554429154, + "loss": 1.4773, + "step": 16285 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018403021811586195, + "loss": 1.5382, + "step": 16286 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018401818055776203, + "loss": 1.5321, + "step": 16287 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018400614276869749, + "loss": 1.5712, + "step": 16288 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018399410474875, + "loss": 1.533, + "step": 16289 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001839820664980013, + "loss": 1.5828, + "step": 16290 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018397002801653312, + "loss": 1.5185, + "step": 16291 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001839579893044272, + "loss": 1.5052, + "step": 16292 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018394595036176525, + "loss": 1.5258, + "step": 16293 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018393391118862905, + "loss": 1.5445, + "step": 16294 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001839218717851003, + "loss": 1.5258, + "step": 16295 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001839098321512608, + "loss": 1.5074, + "step": 16296 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001838977922871922, + "loss": 1.5497, + "step": 16297 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018388575219297637, + "loss": 1.5346, + "step": 16298 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018387371186869494, + "loss": 1.5035, + "step": 16299 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018386167131442967, + "loss": 1.5465, + "step": 16300 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018384963053026237, + "loss": 1.4912, + "step": 16301 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018383758951627473, + "loss": 1.5838, + "step": 16302 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018382554827254857, + "loss": 1.5119, + "step": 16303 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018381350679916558, + "loss": 1.5726, + "step": 16304 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018380146509620754, + "loss": 1.5504, + "step": 16305 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018378942316375622, + "loss": 1.5109, + "step": 16306 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018377738100189338, + "loss": 1.4942, + "step": 16307 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018376533861070074, + "loss": 1.5622, + "step": 16308 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001837532959902601, + "loss": 1.5505, + "step": 16309 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018374125314065315, + "loss": 1.4801, + "step": 16310 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018372921006196176, + "loss": 1.5755, + "step": 16311 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001837171667542676, + "loss": 1.5821, + "step": 16312 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018370512321765254, + "loss": 1.5063, + "step": 16313 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018369307945219828, + "loss": 1.5042, + "step": 16314 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018368103545798658, + "loss": 1.6055, + "step": 16315 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001836689912350993, + "loss": 1.5394, + "step": 16316 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001836569467836181, + "loss": 1.5421, + "step": 16317 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018364490210362477, + "loss": 1.5314, + "step": 16318 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018363285719520117, + "loss": 1.5188, + "step": 16319 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018362081205842905, + "loss": 1.5417, + "step": 16320 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001836087666933901, + "loss": 1.5722, + "step": 16321 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018359672110016624, + "loss": 1.5609, + "step": 16322 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018358467527883915, + "loss": 1.5376, + "step": 16323 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018357262922949065, + "loss": 1.5572, + "step": 16324 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018356058295220253, + "loss": 1.5278, + "step": 16325 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018354853644705655, + "loss": 1.5325, + "step": 16326 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018353648971413457, + "loss": 1.5122, + "step": 16327 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001835244427535183, + "loss": 1.564, + "step": 16328 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018351239556528952, + "loss": 1.5299, + "step": 16329 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018350034814953016, + "loss": 1.5777, + "step": 16330 + }, + { + "epoch": 1.28, + "learning_rate": 0.00018348830050632188, + "loss": 1.5341, + "step": 16331 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001834762526357465, + "loss": 1.5022, + "step": 16332 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018346420453788586, + "loss": 1.5201, + "step": 16333 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018345215621282172, + "loss": 1.5105, + "step": 16334 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001834401076606359, + "loss": 1.5677, + "step": 16335 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018342805888141024, + "loss": 1.4795, + "step": 16336 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001834160098752265, + "loss": 1.5423, + "step": 16337 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018340396064216646, + "loss": 1.5634, + "step": 16338 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018339191118231198, + "loss": 1.513, + "step": 16339 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018337986149574487, + "loss": 1.5364, + "step": 16340 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018336781158254686, + "loss": 1.5728, + "step": 16341 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018335576144279988, + "loss": 1.516, + "step": 16342 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018334371107658564, + "loss": 1.5397, + "step": 16343 + }, + { + "epoch": 1.29, + "learning_rate": 0.000183331660483986, + "loss": 1.5654, + "step": 16344 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018331960966508286, + "loss": 1.5094, + "step": 16345 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018330755861995792, + "loss": 1.5193, + "step": 16346 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018329550734869305, + "loss": 1.5513, + "step": 16347 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018328345585137, + "loss": 1.545, + "step": 16348 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001832714041280707, + "loss": 1.5378, + "step": 16349 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001832593521788769, + "loss": 1.513, + "step": 16350 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018324730000387045, + "loss": 1.5407, + "step": 16351 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018323524760313322, + "loss": 1.5508, + "step": 16352 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018322319497674695, + "loss": 1.5331, + "step": 16353 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001832111421247936, + "loss": 1.556, + "step": 16354 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018319908904735485, + "loss": 1.5439, + "step": 16355 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018318703574451262, + "loss": 1.5211, + "step": 16356 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018317498221634873, + "loss": 1.5496, + "step": 16357 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018316292846294501, + "loss": 1.5032, + "step": 16358 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018315087448438332, + "loss": 1.5317, + "step": 16359 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018313882028074552, + "loss": 1.4904, + "step": 16360 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018312676585211337, + "loss": 1.5743, + "step": 16361 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001831147111985688, + "loss": 1.5361, + "step": 16362 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018310265632019357, + "loss": 1.5651, + "step": 16363 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018309060121706963, + "loss": 1.5473, + "step": 16364 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018307854588927867, + "loss": 1.5266, + "step": 16365 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018306649033690274, + "loss": 1.5248, + "step": 16366 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018305443456002353, + "loss": 1.5359, + "step": 16367 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018304237855872296, + "loss": 1.5815, + "step": 16368 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001830303223330829, + "loss": 1.5461, + "step": 16369 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018301826588318517, + "loss": 1.5146, + "step": 16370 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001830062092091116, + "loss": 1.4761, + "step": 16371 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018299415231094412, + "loss": 1.5011, + "step": 16372 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018298209518876452, + "loss": 1.5985, + "step": 16373 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018297003784265476, + "loss": 1.5368, + "step": 16374 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018295798027269657, + "loss": 1.4948, + "step": 16375 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018294592247897193, + "loss": 1.5193, + "step": 16376 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018293386446156264, + "loss": 1.5293, + "step": 16377 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018292180622055056, + "loss": 1.4884, + "step": 16378 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018290974775601762, + "loss": 1.5049, + "step": 16379 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001828976890680456, + "loss": 1.5668, + "step": 16380 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018288563015671648, + "loss": 1.5619, + "step": 16381 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018287357102211204, + "loss": 1.5342, + "step": 16382 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018286151166431425, + "loss": 1.521, + "step": 16383 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001828494520834049, + "loss": 1.512, + "step": 16384 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018283739227946587, + "loss": 1.559, + "step": 16385 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001828253322525791, + "loss": 1.5604, + "step": 16386 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018281327200282644, + "loss": 1.4768, + "step": 16387 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018280121153028977, + "loss": 1.5172, + "step": 16388 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018278915083505095, + "loss": 1.5028, + "step": 16389 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018277708991719187, + "loss": 1.515, + "step": 16390 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018276502877679452, + "loss": 1.567, + "step": 16391 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018275296741394065, + "loss": 1.5708, + "step": 16392 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018274090582871223, + "loss": 1.4971, + "step": 16393 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001827288440211911, + "loss": 1.5569, + "step": 16394 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018271678199145917, + "loss": 1.4772, + "step": 16395 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018270471973959836, + "loss": 1.5696, + "step": 16396 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018269265726569055, + "loss": 1.5181, + "step": 16397 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001826805945698177, + "loss": 1.5358, + "step": 16398 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018266853165206157, + "loss": 1.5294, + "step": 16399 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018265646851250416, + "loss": 1.5453, + "step": 16400 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018264440515122738, + "loss": 1.4731, + "step": 16401 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018263234156831306, + "loss": 1.5225, + "step": 16402 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018262027776384319, + "loss": 1.571, + "step": 16403 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018260821373789957, + "loss": 1.5307, + "step": 16404 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018259614949056423, + "loss": 1.4928, + "step": 16405 + }, + { + "epoch": 1.29, + "learning_rate": 0.000182584085021919, + "loss": 1.5419, + "step": 16406 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018257202033204582, + "loss": 1.5038, + "step": 16407 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001825599554210266, + "loss": 1.55, + "step": 16408 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018254789028894323, + "loss": 1.5199, + "step": 16409 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018253582493587772, + "loss": 1.5413, + "step": 16410 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018252375936191184, + "loss": 1.5659, + "step": 16411 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018251169356712756, + "loss": 1.5711, + "step": 16412 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018249962755160687, + "loss": 1.5231, + "step": 16413 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018248756131543167, + "loss": 1.5041, + "step": 16414 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001824754948586838, + "loss": 1.5469, + "step": 16415 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018246342818144525, + "loss": 1.5053, + "step": 16416 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018245136128379797, + "loss": 1.5482, + "step": 16417 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018243929416582387, + "loss": 1.5736, + "step": 16418 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018242722682760483, + "loss": 1.5387, + "step": 16419 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001824151592692228, + "loss": 1.4981, + "step": 16420 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018240309149075975, + "loss": 1.5387, + "step": 16421 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018239102349229755, + "loss": 1.546, + "step": 16422 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018237895527391823, + "loss": 1.5698, + "step": 16423 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018236688683570364, + "loss": 1.5071, + "step": 16424 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018235481817773576, + "loss": 1.5622, + "step": 16425 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018234274930009655, + "loss": 1.5408, + "step": 16426 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018233068020286785, + "loss": 1.5567, + "step": 16427 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018231861088613172, + "loss": 1.5514, + "step": 16428 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018230654134997006, + "loss": 1.5312, + "step": 16429 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001822944715944648, + "loss": 1.5393, + "step": 16430 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018228240161969787, + "loss": 1.5333, + "step": 16431 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018227033142575135, + "loss": 1.5223, + "step": 16432 + }, + { + "epoch": 1.29, + "learning_rate": 0.000182258261012707, + "loss": 1.5477, + "step": 16433 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018224619038064685, + "loss": 1.5928, + "step": 16434 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001822341195296529, + "loss": 1.58, + "step": 16435 + }, + { + "epoch": 1.29, + "learning_rate": 0.000182222048459807, + "loss": 1.5776, + "step": 16436 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018220997717119126, + "loss": 1.5512, + "step": 16437 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018219790566388754, + "loss": 1.5876, + "step": 16438 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018218583393797775, + "loss": 1.5476, + "step": 16439 + }, + { + "epoch": 1.29, + "learning_rate": 0.000182173761993544, + "loss": 1.5602, + "step": 16440 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018216168983066806, + "loss": 1.5374, + "step": 16441 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018214961744943207, + "loss": 1.5602, + "step": 16442 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018213754484991786, + "loss": 1.5552, + "step": 16443 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001821254720322075, + "loss": 1.5146, + "step": 16444 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018211339899638289, + "loss": 1.4569, + "step": 16445 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018210132574252605, + "loss": 1.5064, + "step": 16446 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018208925227071893, + "loss": 1.5106, + "step": 16447 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018207717858104345, + "loss": 1.5936, + "step": 16448 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018206510467358165, + "loss": 1.5031, + "step": 16449 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018205303054841547, + "loss": 1.6035, + "step": 16450 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018204095620562692, + "loss": 1.5168, + "step": 16451 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018202888164529793, + "loss": 1.5432, + "step": 16452 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018201680686751054, + "loss": 1.4718, + "step": 16453 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001820047318723467, + "loss": 1.5212, + "step": 16454 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001819926566598884, + "loss": 1.5676, + "step": 16455 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001819805812302176, + "loss": 1.5238, + "step": 16456 + }, + { + "epoch": 1.29, + "learning_rate": 0.00018196850558341632, + "loss": 1.5692, + "step": 16457 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001819564297195665, + "loss": 1.5492, + "step": 16458 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018194435363875014, + "loss": 1.5072, + "step": 16459 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018193227734104926, + "loss": 1.533, + "step": 16460 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001819202008265459, + "loss": 1.5012, + "step": 16461 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018190812409532193, + "loss": 1.5019, + "step": 16462 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001818960471474594, + "loss": 1.5126, + "step": 16463 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018188396998304037, + "loss": 1.539, + "step": 16464 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018187189260214674, + "loss": 1.5618, + "step": 16465 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018185981500486056, + "loss": 1.5138, + "step": 16466 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018184773719126374, + "loss": 1.5384, + "step": 16467 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018183565916143844, + "loss": 1.5299, + "step": 16468 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001818235809154666, + "loss": 1.5134, + "step": 16469 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018181150245343014, + "loss": 1.4696, + "step": 16470 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001817994237754112, + "loss": 1.5231, + "step": 16471 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001817873448814917, + "loss": 1.5332, + "step": 16472 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018177526577175366, + "loss": 1.4881, + "step": 16473 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001817631864462791, + "loss": 1.5193, + "step": 16474 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018175110690514998, + "loss": 1.5426, + "step": 16475 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018173902714844846, + "loss": 1.54, + "step": 16476 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018172694717625643, + "loss": 1.5257, + "step": 16477 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018171486698865592, + "loss": 1.5229, + "step": 16478 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018170278658572898, + "loss": 1.5238, + "step": 16479 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001816907059675576, + "loss": 1.5331, + "step": 16480 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018167862513422382, + "loss": 1.5203, + "step": 16481 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018166654408580967, + "loss": 1.5583, + "step": 16482 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018165446282239714, + "loss": 1.5003, + "step": 16483 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018164238134406825, + "loss": 1.5469, + "step": 16484 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001816302996509051, + "loss": 1.4957, + "step": 16485 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018161821774298966, + "loss": 1.5432, + "step": 16486 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018160613562040397, + "loss": 1.5399, + "step": 16487 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018159405328323008, + "loss": 1.5455, + "step": 16488 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018158197073155, + "loss": 1.5002, + "step": 16489 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018156988796544572, + "loss": 1.5408, + "step": 16490 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018155780498499934, + "loss": 1.532, + "step": 16491 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018154572179029287, + "loss": 1.5449, + "step": 16492 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001815336383814084, + "loss": 1.5748, + "step": 16493 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018152155475842791, + "loss": 1.5404, + "step": 16494 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001815094709214334, + "loss": 1.5019, + "step": 16495 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001814973868705071, + "loss": 1.5543, + "step": 16496 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001814853026057308, + "loss": 1.5089, + "step": 16497 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018147321812718673, + "loss": 1.4939, + "step": 16498 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018146113343495688, + "loss": 1.53, + "step": 16499 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001814490485291233, + "loss": 1.5072, + "step": 16500 + }, + { + "epoch": 1.3, + "learning_rate": 0.000181436963409768, + "loss": 1.5356, + "step": 16501 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018142487807697307, + "loss": 1.5447, + "step": 16502 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018141279253082058, + "loss": 1.5582, + "step": 16503 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018140070677139257, + "loss": 1.5907, + "step": 16504 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001813886207987711, + "loss": 1.4979, + "step": 16505 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018137653461303813, + "loss": 1.552, + "step": 16506 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001813644482142759, + "loss": 1.5411, + "step": 16507 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018135236160256633, + "loss": 1.5918, + "step": 16508 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018134027477799153, + "loss": 1.5267, + "step": 16509 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018132818774063358, + "loss": 1.5006, + "step": 16510 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001813161004905745, + "loss": 1.5032, + "step": 16511 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018130401302789639, + "loss": 1.5121, + "step": 16512 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018129192535268134, + "loss": 1.6073, + "step": 16513 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001812798374650113, + "loss": 1.4933, + "step": 16514 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018126774936496853, + "loss": 1.5607, + "step": 16515 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018125566105263493, + "loss": 1.57, + "step": 16516 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018124357252809266, + "loss": 1.5837, + "step": 16517 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018123148379142377, + "loss": 1.5358, + "step": 16518 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018121939484271033, + "loss": 1.5383, + "step": 16519 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018120730568203444, + "loss": 1.5504, + "step": 16520 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018119521630947818, + "loss": 1.5201, + "step": 16521 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018118312672512355, + "loss": 1.5585, + "step": 16522 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018117103692905277, + "loss": 1.5229, + "step": 16523 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001811589469213478, + "loss": 1.5348, + "step": 16524 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018114685670209084, + "loss": 1.5854, + "step": 16525 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018113476627136388, + "loss": 1.5402, + "step": 16526 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018112267562924906, + "loss": 1.5781, + "step": 16527 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018111058477582838, + "loss": 1.4861, + "step": 16528 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018109849371118406, + "loss": 1.5285, + "step": 16529 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018108640243539808, + "loss": 1.4923, + "step": 16530 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018107431094855259, + "loss": 1.4901, + "step": 16531 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018106221925072972, + "loss": 1.506, + "step": 16532 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018105012734201148, + "loss": 1.5613, + "step": 16533 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018103803522248008, + "loss": 1.5436, + "step": 16534 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018102594289221748, + "loss": 1.6066, + "step": 16535 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018101385035130586, + "loss": 1.5616, + "step": 16536 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018100175759982735, + "loss": 1.4983, + "step": 16537 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001809896646378639, + "loss": 1.587, + "step": 16538 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018097757146549786, + "loss": 1.5932, + "step": 16539 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018096547808281113, + "loss": 1.552, + "step": 16540 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018095338448988592, + "loss": 1.5926, + "step": 16541 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018094129068680435, + "loss": 1.5342, + "step": 16542 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018092919667364842, + "loss": 1.531, + "step": 16543 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018091710245050037, + "loss": 1.5433, + "step": 16544 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001809050080174422, + "loss": 1.5484, + "step": 16545 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018089291337455613, + "loss": 1.5168, + "step": 16546 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001808808185219242, + "loss": 1.5261, + "step": 16547 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018086872345962854, + "loss": 1.5664, + "step": 16548 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018085662818775132, + "loss": 1.5343, + "step": 16549 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018084453270637458, + "loss": 1.5537, + "step": 16550 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018083243701558054, + "loss": 1.5217, + "step": 16551 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018082034111545123, + "loss": 1.5626, + "step": 16552 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018080824500606879, + "loss": 1.5192, + "step": 16553 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001807961486875154, + "loss": 1.4931, + "step": 16554 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018078405215987315, + "loss": 1.5255, + "step": 16555 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001807719554232242, + "loss": 1.4813, + "step": 16556 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018075985847765063, + "loss": 1.5391, + "step": 16557 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018074776132323455, + "loss": 1.5426, + "step": 16558 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018073566396005822, + "loss": 1.5817, + "step": 16559 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018072356638820366, + "loss": 1.5466, + "step": 16560 + }, + { + "epoch": 1.3, + "learning_rate": 0.000180711468607753, + "loss": 1.5461, + "step": 16561 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018069937061878847, + "loss": 1.5393, + "step": 16562 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018068727242139213, + "loss": 1.4822, + "step": 16563 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018067517401564617, + "loss": 1.5307, + "step": 16564 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018066307540163265, + "loss": 1.5076, + "step": 16565 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018065097657943383, + "loss": 1.5291, + "step": 16566 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018063887754913175, + "loss": 1.5325, + "step": 16567 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018062677831080863, + "loss": 1.5513, + "step": 16568 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018061467886454656, + "loss": 1.5321, + "step": 16569 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018060257921042772, + "loss": 1.5225, + "step": 16570 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018059047934853429, + "loss": 1.5359, + "step": 16571 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018057837927894834, + "loss": 1.5596, + "step": 16572 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018056627900175213, + "loss": 1.5211, + "step": 16573 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001805541785170277, + "loss": 1.4846, + "step": 16574 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018054207782485724, + "loss": 1.5538, + "step": 16575 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018052997692532302, + "loss": 1.5473, + "step": 16576 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018051787581850699, + "loss": 1.52, + "step": 16577 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018050577450449149, + "loss": 1.5654, + "step": 16578 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018049367298335862, + "loss": 1.5162, + "step": 16579 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018048157125519053, + "loss": 1.5303, + "step": 16580 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001804694693200694, + "loss": 1.514, + "step": 16581 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018045736717807735, + "loss": 1.5479, + "step": 16582 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018044526482929662, + "loss": 1.527, + "step": 16583 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001804331622738093, + "loss": 1.5027, + "step": 16584 + }, + { + "epoch": 1.3, + "learning_rate": 0.00018042105951169765, + "loss": 1.5051, + "step": 16585 + }, + { + "epoch": 1.31, + "learning_rate": 0.00018040895654304376, + "loss": 1.5746, + "step": 16586 + }, + { + "epoch": 1.31, + "learning_rate": 0.00018039685336792985, + "loss": 1.4905, + "step": 16587 + }, + { + "epoch": 1.31, + "learning_rate": 0.00018038474998643812, + "loss": 1.5271, + "step": 16588 + }, + { + "epoch": 1.31, + "learning_rate": 0.00018037264639865066, + "loss": 1.5369, + "step": 16589 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001803605426046497, + "loss": 1.5348, + "step": 16590 + }, + { + "epoch": 1.31, + "learning_rate": 0.00018034843860451739, + "loss": 1.5265, + "step": 16591 + }, + { + "epoch": 1.31, + "learning_rate": 0.00018033633439833597, + "loss": 1.5696, + "step": 16592 + }, + { + "epoch": 1.31, + "learning_rate": 0.00018032422998618753, + "loss": 1.4765, + "step": 16593 + }, + { + "epoch": 1.31, + "learning_rate": 0.00018031212536815433, + "loss": 1.5445, + "step": 16594 + }, + { + "epoch": 1.31, + "learning_rate": 0.00018030002054431857, + "loss": 1.568, + "step": 16595 + }, + { + "epoch": 1.31, + "learning_rate": 0.00018028791551476234, + "loss": 1.5599, + "step": 16596 + }, + { + "epoch": 1.31, + "learning_rate": 0.00018027581027956787, + "loss": 1.4862, + "step": 16597 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001802637048388174, + "loss": 1.527, + "step": 16598 + }, + { + "epoch": 1.31, + "learning_rate": 0.00018025159919259304, + "loss": 1.5254, + "step": 16599 + }, + { + "epoch": 1.31, + "learning_rate": 0.00018023949334097705, + "loss": 1.5208, + "step": 16600 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001802273872840515, + "loss": 1.5753, + "step": 16601 + }, + { + "epoch": 1.31, + "learning_rate": 0.00018021528102189877, + "loss": 1.5344, + "step": 16602 + }, + { + "epoch": 1.31, + "learning_rate": 0.00018020317455460093, + "loss": 1.5307, + "step": 16603 + }, + { + "epoch": 1.31, + "learning_rate": 0.00018019106788224015, + "loss": 1.5295, + "step": 16604 + }, + { + "epoch": 1.31, + "learning_rate": 0.00018017896100489873, + "loss": 1.5273, + "step": 16605 + }, + { + "epoch": 1.31, + "learning_rate": 0.00018016685392265882, + "loss": 1.4794, + "step": 16606 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001801547466356026, + "loss": 1.5783, + "step": 16607 + }, + { + "epoch": 1.31, + "learning_rate": 0.00018014263914381228, + "loss": 1.567, + "step": 16608 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001801305314473701, + "loss": 1.5356, + "step": 16609 + }, + { + "epoch": 1.31, + "learning_rate": 0.00018011842354635825, + "loss": 1.5949, + "step": 16610 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001801063154408589, + "loss": 1.5522, + "step": 16611 + }, + { + "epoch": 1.31, + "learning_rate": 0.00018009420713095432, + "loss": 1.5694, + "step": 16612 + }, + { + "epoch": 1.31, + "learning_rate": 0.00018008209861672663, + "loss": 1.5319, + "step": 16613 + }, + { + "epoch": 1.31, + "learning_rate": 0.00018006998989825813, + "loss": 1.5035, + "step": 16614 + }, + { + "epoch": 1.31, + "learning_rate": 0.000180057880975631, + "loss": 1.5348, + "step": 16615 + }, + { + "epoch": 1.31, + "learning_rate": 0.00018004577184892734, + "loss": 1.5133, + "step": 16616 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001800336625182296, + "loss": 1.51, + "step": 16617 + }, + { + "epoch": 1.31, + "learning_rate": 0.00018002155298361982, + "loss": 1.557, + "step": 16618 + }, + { + "epoch": 1.31, + "learning_rate": 0.00018000944324518027, + "loss": 1.5345, + "step": 16619 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017999733330299313, + "loss": 1.5707, + "step": 16620 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017998522315714068, + "loss": 1.513, + "step": 16621 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017997311280770512, + "loss": 1.5437, + "step": 16622 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017996100225476863, + "loss": 1.5899, + "step": 16623 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017994889149841348, + "loss": 1.5644, + "step": 16624 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017993678053872188, + "loss": 1.5012, + "step": 16625 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017992466937577606, + "loss": 1.543, + "step": 16626 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001799125580096583, + "loss": 1.5251, + "step": 16627 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001799004464404507, + "loss": 1.5415, + "step": 16628 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017988833466823563, + "loss": 1.5317, + "step": 16629 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017987622269309523, + "loss": 1.4821, + "step": 16630 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017986411051511178, + "loss": 1.5651, + "step": 16631 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017985199813436747, + "loss": 1.5198, + "step": 16632 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017983988555094458, + "loss": 1.5216, + "step": 16633 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017982777276492537, + "loss": 1.4658, + "step": 16634 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017981565977639202, + "loss": 1.5508, + "step": 16635 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017980354658542677, + "loss": 1.5374, + "step": 16636 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017979143319211193, + "loss": 1.518, + "step": 16637 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017977931959652966, + "loss": 1.4948, + "step": 16638 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017976720579876228, + "loss": 1.5337, + "step": 16639 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017975509179889192, + "loss": 1.495, + "step": 16640 + }, + { + "epoch": 1.31, + "learning_rate": 0.000179742977597001, + "loss": 1.5439, + "step": 16641 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017973086319317166, + "loss": 1.5465, + "step": 16642 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017971874858748612, + "loss": 1.5023, + "step": 16643 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017970663378002671, + "loss": 1.5244, + "step": 16644 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017969451877087567, + "loss": 1.541, + "step": 16645 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017968240356011522, + "loss": 1.5324, + "step": 16646 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017967028814782759, + "loss": 1.5176, + "step": 16647 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001796581725340951, + "loss": 1.5147, + "step": 16648 + }, + { + "epoch": 1.31, + "learning_rate": 0.000179646056719, + "loss": 1.5321, + "step": 16649 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001796339407026245, + "loss": 1.5635, + "step": 16650 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017962182448505096, + "loss": 1.5656, + "step": 16651 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017960970806636152, + "loss": 1.5635, + "step": 16652 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001795975914466385, + "loss": 1.5155, + "step": 16653 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017958547462596422, + "loss": 1.5374, + "step": 16654 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017957335760442086, + "loss": 1.5247, + "step": 16655 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001795612403820907, + "loss": 1.5657, + "step": 16656 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017954912295905606, + "loss": 1.5002, + "step": 16657 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001795370053353992, + "loss": 1.5122, + "step": 16658 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017952488751120233, + "loss": 1.4617, + "step": 16659 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001795127694865478, + "loss": 1.5393, + "step": 16660 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017950065126151786, + "loss": 1.5846, + "step": 16661 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001794885328361947, + "loss": 1.4943, + "step": 16662 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017947641421066075, + "loss": 1.5414, + "step": 16663 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001794642953849982, + "loss": 1.5907, + "step": 16664 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017945217635928932, + "loss": 1.51, + "step": 16665 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017944005713361644, + "loss": 1.4794, + "step": 16666 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017942793770806182, + "loss": 1.5346, + "step": 16667 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017941581808270774, + "loss": 1.5225, + "step": 16668 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017940369825763652, + "loss": 1.5633, + "step": 16669 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017939157823293036, + "loss": 1.5494, + "step": 16670 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001793794580086716, + "loss": 1.5969, + "step": 16671 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017936733758494255, + "loss": 1.5494, + "step": 16672 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017935521696182553, + "loss": 1.5629, + "step": 16673 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017934309613940275, + "loss": 1.5137, + "step": 16674 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017933097511775654, + "loss": 1.5092, + "step": 16675 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017931885389696917, + "loss": 1.5158, + "step": 16676 + }, + { + "epoch": 1.31, + "learning_rate": 0.000179306732477123, + "loss": 1.551, + "step": 16677 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017929461085830028, + "loss": 1.5631, + "step": 16678 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017928248904058327, + "loss": 1.5424, + "step": 16679 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017927036702405436, + "loss": 1.5436, + "step": 16680 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001792582448087958, + "loss": 1.5198, + "step": 16681 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017924612239488992, + "loss": 1.5375, + "step": 16682 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017923399978241904, + "loss": 1.5626, + "step": 16683 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001792218769714654, + "loss": 1.4965, + "step": 16684 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017920975396211133, + "loss": 1.5146, + "step": 16685 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017919763075443916, + "loss": 1.5222, + "step": 16686 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001791855073485312, + "loss": 1.4949, + "step": 16687 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017917338374446971, + "loss": 1.5652, + "step": 16688 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017916125994233705, + "loss": 1.5382, + "step": 16689 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017914913594221558, + "loss": 1.5388, + "step": 16690 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017913701174418755, + "loss": 1.5105, + "step": 16691 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017912488734833523, + "loss": 1.5638, + "step": 16692 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017911276275474108, + "loss": 1.5136, + "step": 16693 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017910063796348728, + "loss": 1.5409, + "step": 16694 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001790885129746562, + "loss": 1.5132, + "step": 16695 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001790763877883302, + "loss": 1.5338, + "step": 16696 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001790642624045916, + "loss": 1.5213, + "step": 16697 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017905213682352264, + "loss": 1.6199, + "step": 16698 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017904001104520573, + "loss": 1.5319, + "step": 16699 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017902788506972316, + "loss": 1.5638, + "step": 16700 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001790157588971573, + "loss": 1.5427, + "step": 16701 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017900363252759045, + "loss": 1.5492, + "step": 16702 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017899150596110486, + "loss": 1.5081, + "step": 16703 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017897937919778302, + "loss": 1.5494, + "step": 16704 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017896725223770716, + "loss": 1.5051, + "step": 16705 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017895512508095965, + "loss": 1.5114, + "step": 16706 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017894299772762282, + "loss": 1.5071, + "step": 16707 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017893087017777903, + "loss": 1.5255, + "step": 16708 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017891874243151055, + "loss": 1.5744, + "step": 16709 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001789066144888998, + "loss": 1.5224, + "step": 16710 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017889448635002904, + "loss": 1.4975, + "step": 16711 + }, + { + "epoch": 1.31, + "learning_rate": 0.00017888235801498075, + "loss": 1.4711, + "step": 16712 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017887022948383713, + "loss": 1.4891, + "step": 16713 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001788581007566806, + "loss": 1.5184, + "step": 16714 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017884597183359348, + "loss": 1.5165, + "step": 16715 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001788338427146581, + "loss": 1.4972, + "step": 16716 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017882171339995693, + "loss": 1.5232, + "step": 16717 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017880958388957212, + "loss": 1.549, + "step": 16718 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017879745418358624, + "loss": 1.502, + "step": 16719 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017878532428208146, + "loss": 1.5195, + "step": 16720 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017877319418514023, + "loss": 1.4714, + "step": 16721 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017876106389284495, + "loss": 1.5025, + "step": 16722 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017874893340527785, + "loss": 1.5509, + "step": 16723 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017873680272252138, + "loss": 1.5132, + "step": 16724 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017872467184465787, + "loss": 1.5324, + "step": 16725 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001787125407717697, + "loss": 1.5103, + "step": 16726 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001787004095039392, + "loss": 1.5533, + "step": 16727 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017868827804124878, + "loss": 1.5167, + "step": 16728 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017867614638378078, + "loss": 1.5644, + "step": 16729 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017866401453161756, + "loss": 1.5175, + "step": 16730 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017865188248484154, + "loss": 1.4567, + "step": 16731 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017863975024353502, + "loss": 1.545, + "step": 16732 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017862761780778038, + "loss": 1.4891, + "step": 16733 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017861548517766, + "loss": 1.5809, + "step": 16734 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001786033523532563, + "loss": 1.5125, + "step": 16735 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017859121933465165, + "loss": 1.5227, + "step": 16736 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017857908612192835, + "loss": 1.5163, + "step": 16737 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017856695271516884, + "loss": 1.5451, + "step": 16738 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017855481911445553, + "loss": 1.5315, + "step": 16739 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017854268531987072, + "loss": 1.5693, + "step": 16740 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017853055133149683, + "loss": 1.4843, + "step": 16741 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001785184171494162, + "loss": 1.5337, + "step": 16742 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001785062827737113, + "loss": 1.5326, + "step": 16743 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017849414820446448, + "loss": 1.5325, + "step": 16744 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017848201344175806, + "loss": 1.5192, + "step": 16745 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001784698784856746, + "loss": 1.5165, + "step": 16746 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017845774333629625, + "loss": 1.5573, + "step": 16747 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017844560799370557, + "loss": 1.5768, + "step": 16748 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017843347245798493, + "loss": 1.512, + "step": 16749 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017842133672921667, + "loss": 1.5548, + "step": 16750 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017840920080748325, + "loss": 1.5565, + "step": 16751 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017839706469286704, + "loss": 1.472, + "step": 16752 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017838492838545043, + "loss": 1.5727, + "step": 16753 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001783727918853158, + "loss": 1.5443, + "step": 16754 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017836065519254556, + "loss": 1.5453, + "step": 16755 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017834851830722217, + "loss": 1.4833, + "step": 16756 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017833638122942793, + "loss": 1.5497, + "step": 16757 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017832424395924532, + "loss": 1.5488, + "step": 16758 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017831210649675672, + "loss": 1.5492, + "step": 16759 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017829996884204458, + "loss": 1.4983, + "step": 16760 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001782878309951912, + "loss": 1.5459, + "step": 16761 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001782756929562791, + "loss": 1.5452, + "step": 16762 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017826355472539063, + "loss": 1.5501, + "step": 16763 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017825141630260826, + "loss": 1.5413, + "step": 16764 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001782392776880143, + "loss": 1.5659, + "step": 16765 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017822713888169126, + "loss": 1.4408, + "step": 16766 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017821499988372153, + "loss": 1.5699, + "step": 16767 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017820286069418755, + "loss": 1.5451, + "step": 16768 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017819072131317168, + "loss": 1.5131, + "step": 16769 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017817858174075637, + "loss": 1.5757, + "step": 16770 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017816644197702405, + "loss": 1.5114, + "step": 16771 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001781543020220571, + "loss": 1.5098, + "step": 16772 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017814216187593798, + "loss": 1.5878, + "step": 16773 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017813002153874914, + "loss": 1.5945, + "step": 16774 + }, + { + "epoch": 1.32, + "learning_rate": 0.000178117881010573, + "loss": 1.5361, + "step": 16775 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001781057402914919, + "loss": 1.5967, + "step": 16776 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017809359938158838, + "loss": 1.486, + "step": 16777 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017808145828094481, + "loss": 1.5486, + "step": 16778 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017806931698964362, + "loss": 1.5307, + "step": 16779 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001780571755077673, + "loss": 1.5512, + "step": 16780 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017804503383539818, + "loss": 1.6243, + "step": 16781 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017803289197261882, + "loss": 1.5505, + "step": 16782 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001780207499195115, + "loss": 1.5021, + "step": 16783 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017800860767615883, + "loss": 1.5306, + "step": 16784 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001779964652426432, + "loss": 1.5352, + "step": 16785 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017798432261904694, + "loss": 1.5816, + "step": 16786 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017797217980545265, + "loss": 1.5438, + "step": 16787 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017796003680194263, + "loss": 1.5259, + "step": 16788 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017794789360859936, + "loss": 1.5361, + "step": 16789 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001779357502255054, + "loss": 1.5418, + "step": 16790 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017792360665274307, + "loss": 1.5507, + "step": 16791 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001779114628903949, + "loss": 1.543, + "step": 16792 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017789931893854324, + "loss": 1.5762, + "step": 16793 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017788717479727062, + "loss": 1.525, + "step": 16794 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001778750304666595, + "loss": 1.5333, + "step": 16795 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017786288594679229, + "loss": 1.5189, + "step": 16796 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017785074123775145, + "loss": 1.5627, + "step": 16797 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017783859633961946, + "loss": 1.5496, + "step": 16798 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017782645125247879, + "loss": 1.511, + "step": 16799 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001778143059764118, + "loss": 1.5038, + "step": 16800 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017780216051150105, + "loss": 1.5805, + "step": 16801 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017779001485782901, + "loss": 1.5102, + "step": 16802 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017777786901547807, + "loss": 1.5165, + "step": 16803 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017776572298453073, + "loss": 1.5041, + "step": 16804 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017775357676506944, + "loss": 1.55, + "step": 16805 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017774143035717668, + "loss": 1.5521, + "step": 16806 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017772928376093498, + "loss": 1.6077, + "step": 16807 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001777171369764267, + "loss": 1.5281, + "step": 16808 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001777049900037344, + "loss": 1.521, + "step": 16809 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017769284284294045, + "loss": 1.5112, + "step": 16810 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017768069549412734, + "loss": 1.5065, + "step": 16811 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017766854795737768, + "loss": 1.5106, + "step": 16812 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017765640023277376, + "loss": 1.5052, + "step": 16813 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017764425232039824, + "loss": 1.5279, + "step": 16814 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017763210422033342, + "loss": 1.571, + "step": 16815 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001776199559326619, + "loss": 1.5413, + "step": 16816 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017760780745746613, + "loss": 1.5198, + "step": 16817 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017759565879482857, + "loss": 1.5507, + "step": 16818 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017758350994483173, + "loss": 1.5093, + "step": 16819 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017757136090755806, + "loss": 1.4829, + "step": 16820 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017755921168309004, + "loss": 1.4869, + "step": 16821 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001775470622715102, + "loss": 1.5069, + "step": 16822 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017753491267290098, + "loss": 1.5489, + "step": 16823 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017752276288734498, + "loss": 1.5179, + "step": 16824 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017751061291492457, + "loss": 1.5328, + "step": 16825 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017749846275572228, + "loss": 1.6075, + "step": 16826 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017748631240982056, + "loss": 1.4778, + "step": 16827 + }, + { + "epoch": 1.32, + "learning_rate": 0.000177474161877302, + "loss": 1.5366, + "step": 16828 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017746201115824902, + "loss": 1.5237, + "step": 16829 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017744986025274414, + "loss": 1.5178, + "step": 16830 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017743770916086985, + "loss": 1.4972, + "step": 16831 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001774255578827087, + "loss": 1.5046, + "step": 16832 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001774134064183431, + "loss": 1.5437, + "step": 16833 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017740125476785562, + "loss": 1.5792, + "step": 16834 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001773891029313287, + "loss": 1.5017, + "step": 16835 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017737695090884494, + "loss": 1.5406, + "step": 16836 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017736479870048675, + "loss": 1.5777, + "step": 16837 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017735264630633674, + "loss": 1.5365, + "step": 16838 + }, + { + "epoch": 1.32, + "learning_rate": 0.00017734049372647727, + "loss": 1.4745, + "step": 16839 + }, + { + "epoch": 1.32, + "learning_rate": 0.000177328340960991, + "loss": 1.5516, + "step": 16840 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001773161880099604, + "loss": 1.4901, + "step": 16841 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001773040348734679, + "loss": 1.5417, + "step": 16842 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017729188155159607, + "loss": 1.5546, + "step": 16843 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017727972804442742, + "loss": 1.5312, + "step": 16844 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001772675743520445, + "loss": 1.5614, + "step": 16845 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017725542047452978, + "loss": 1.5539, + "step": 16846 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017724326641196578, + "loss": 1.516, + "step": 16847 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001772311121644351, + "loss": 1.4982, + "step": 16848 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017721895773202014, + "loss": 1.5659, + "step": 16849 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017720680311480349, + "loss": 1.4694, + "step": 16850 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017719464831286768, + "loss": 1.5999, + "step": 16851 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017718249332629514, + "loss": 1.5603, + "step": 16852 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017717033815516857, + "loss": 1.5591, + "step": 16853 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017715818279957034, + "loss": 1.5166, + "step": 16854 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001771460272595831, + "loss": 1.5476, + "step": 16855 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017713387153528922, + "loss": 1.5324, + "step": 16856 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017712171562677138, + "loss": 1.5162, + "step": 16857 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017710955953411208, + "loss": 1.504, + "step": 16858 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001770974032573938, + "loss": 1.5466, + "step": 16859 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017708524679669907, + "loss": 1.5129, + "step": 16860 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001770730901521105, + "loss": 1.4881, + "step": 16861 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001770609333237106, + "loss": 1.5245, + "step": 16862 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017704877631158188, + "loss": 1.5441, + "step": 16863 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001770366191158069, + "loss": 1.5383, + "step": 16864 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017702446173646822, + "loss": 1.5749, + "step": 16865 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001770123041736483, + "loss": 1.5654, + "step": 16866 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001770001464274298, + "loss": 1.5382, + "step": 16867 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017698798849789517, + "loss": 1.595, + "step": 16868 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017697583038512696, + "loss": 1.5319, + "step": 16869 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001769636720892078, + "loss": 1.5559, + "step": 16870 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017695151361022017, + "loss": 1.5102, + "step": 16871 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017693935494824667, + "loss": 1.579, + "step": 16872 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001769271961033698, + "loss": 1.5354, + "step": 16873 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001769150370756721, + "loss": 1.5841, + "step": 16874 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001769028778652362, + "loss": 1.4942, + "step": 16875 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017689071847214454, + "loss": 1.549, + "step": 16876 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017687855889647977, + "loss": 1.5333, + "step": 16877 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001768663991383244, + "loss": 1.5289, + "step": 16878 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017685423919776104, + "loss": 1.5533, + "step": 16879 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017684207907487222, + "loss": 1.4988, + "step": 16880 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017682991876974047, + "loss": 1.5819, + "step": 16881 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001768177582824484, + "loss": 1.5101, + "step": 16882 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017680559761307853, + "loss": 1.5236, + "step": 16883 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017679343676171345, + "loss": 1.4957, + "step": 16884 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017678127572843573, + "loss": 1.5627, + "step": 16885 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017676911451332793, + "loss": 1.517, + "step": 16886 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001767569531164726, + "loss": 1.5449, + "step": 16887 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017674479153795232, + "loss": 1.5781, + "step": 16888 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017673262977784966, + "loss": 1.5252, + "step": 16889 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001767204678362472, + "loss": 1.4743, + "step": 16890 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001767083057132275, + "loss": 1.537, + "step": 16891 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017669614340887319, + "loss": 1.5471, + "step": 16892 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017668398092326676, + "loss": 1.489, + "step": 16893 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017667181825649085, + "loss": 1.5137, + "step": 16894 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017665965540862797, + "loss": 1.5677, + "step": 16895 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001766474923797608, + "loss": 1.5488, + "step": 16896 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017663532916997182, + "loss": 1.5243, + "step": 16897 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017662316577934367, + "loss": 1.5453, + "step": 16898 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001766110022079589, + "loss": 1.5408, + "step": 16899 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017659883845590012, + "loss": 1.518, + "step": 16900 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017658667452324987, + "loss": 1.4873, + "step": 16901 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017657451041009085, + "loss": 1.5153, + "step": 16902 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001765623461165055, + "loss": 1.5446, + "step": 16903 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017655018164257653, + "loss": 1.5559, + "step": 16904 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017653801698838646, + "loss": 1.5466, + "step": 16905 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001765258521540179, + "loss": 1.5394, + "step": 16906 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001765136871395534, + "loss": 1.5192, + "step": 16907 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017650152194507564, + "loss": 1.5472, + "step": 16908 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017648935657066714, + "loss": 1.5108, + "step": 16909 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017647719101641056, + "loss": 1.5105, + "step": 16910 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017646502528238849, + "loss": 1.5469, + "step": 16911 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017645285936868343, + "loss": 1.5487, + "step": 16912 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001764406932753781, + "loss": 1.4662, + "step": 16913 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017642852700255505, + "loss": 1.5229, + "step": 16914 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017641636055029683, + "loss": 1.544, + "step": 16915 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017640419391868616, + "loss": 1.5466, + "step": 16916 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001763920271078056, + "loss": 1.5433, + "step": 16917 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001763798601177377, + "loss": 1.5114, + "step": 16918 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017636769294856512, + "loss": 1.5626, + "step": 16919 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017635552560037047, + "loss": 1.5096, + "step": 16920 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017634335807323632, + "loss": 1.5325, + "step": 16921 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017633119036724533, + "loss": 1.4989, + "step": 16922 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017631902248248005, + "loss": 1.5228, + "step": 16923 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017630685441902315, + "loss": 1.5481, + "step": 16924 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017629468617695723, + "loss": 1.5035, + "step": 16925 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017628251775636493, + "loss": 1.5009, + "step": 16926 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001762703491573288, + "loss": 1.5316, + "step": 16927 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001762581803799315, + "loss": 1.5404, + "step": 16928 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017624601142425569, + "loss": 1.5459, + "step": 16929 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017623384229038388, + "loss": 1.539, + "step": 16930 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017622167297839876, + "loss": 1.5481, + "step": 16931 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017620950348838302, + "loss": 1.5984, + "step": 16932 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017619733382041918, + "loss": 1.5358, + "step": 16933 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017618516397458988, + "loss": 1.5302, + "step": 16934 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017617299395097778, + "loss": 1.499, + "step": 16935 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001761608237496655, + "loss": 1.4916, + "step": 16936 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017614865337073568, + "loss": 1.5617, + "step": 16937 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017613648281427087, + "loss": 1.528, + "step": 16938 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017612431208035382, + "loss": 1.5468, + "step": 16939 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001761121411690671, + "loss": 1.5189, + "step": 16940 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017609997008049335, + "loss": 1.5031, + "step": 16941 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001760877988147152, + "loss": 1.5819, + "step": 16942 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017607562737181532, + "loss": 1.5215, + "step": 16943 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017606345575187627, + "loss": 1.5359, + "step": 16944 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017605128395498074, + "loss": 1.5365, + "step": 16945 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001760391119812114, + "loss": 1.5682, + "step": 16946 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017602693983065083, + "loss": 1.5378, + "step": 16947 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017601476750338176, + "loss": 1.5518, + "step": 16948 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017600259499948672, + "loss": 1.5115, + "step": 16949 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017599042231904844, + "loss": 1.4951, + "step": 16950 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001759782494621495, + "loss": 1.5535, + "step": 16951 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017596607642887262, + "loss": 1.484, + "step": 16952 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017595390321930042, + "loss": 1.4941, + "step": 16953 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017594172983351544, + "loss": 1.5596, + "step": 16954 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017592955627160058, + "loss": 1.5271, + "step": 16955 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017591738253363825, + "loss": 1.4967, + "step": 16956 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001759052086197112, + "loss": 1.5269, + "step": 16957 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001758930345299021, + "loss": 1.5156, + "step": 16958 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017588086026429356, + "loss": 1.4913, + "step": 16959 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001758686858229683, + "loss": 1.5319, + "step": 16960 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001758565112060089, + "loss": 1.6106, + "step": 16961 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017584433641349806, + "loss": 1.5156, + "step": 16962 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017583216144551845, + "loss": 1.4972, + "step": 16963 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001758199863021527, + "loss": 1.5639, + "step": 16964 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017580781098348357, + "loss": 1.5224, + "step": 16965 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017579563548959356, + "loss": 1.549, + "step": 16966 + }, + { + "epoch": 1.33, + "learning_rate": 0.00017578345982056546, + "loss": 1.5461, + "step": 16967 + }, + { + "epoch": 1.34, + "learning_rate": 0.0001757712839764819, + "loss": 1.5276, + "step": 16968 + }, + { + "epoch": 1.34, + "learning_rate": 0.0001757591079574255, + "loss": 1.5419, + "step": 16969 + }, + { + "epoch": 1.34, + "learning_rate": 0.000175746931763479, + "loss": 1.5809, + "step": 16970 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017573475539472502, + "loss": 1.4794, + "step": 16971 + }, + { + "epoch": 1.34, + "learning_rate": 0.0001757225788512463, + "loss": 1.5131, + "step": 16972 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017571040213312542, + "loss": 1.5279, + "step": 16973 + }, + { + "epoch": 1.34, + "learning_rate": 0.0001756982252404451, + "loss": 1.5759, + "step": 16974 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017568604817328804, + "loss": 1.5113, + "step": 16975 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017567387093173688, + "loss": 1.5393, + "step": 16976 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017566169351587434, + "loss": 1.5392, + "step": 16977 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017564951592578294, + "loss": 1.5329, + "step": 16978 + }, + { + "epoch": 1.34, + "learning_rate": 0.0001756373381615456, + "loss": 1.5479, + "step": 16979 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017562516022324483, + "loss": 1.5563, + "step": 16980 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017561298211096337, + "loss": 1.5138, + "step": 16981 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017560080382478393, + "loss": 1.4542, + "step": 16982 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017558862536478913, + "loss": 1.5495, + "step": 16983 + }, + { + "epoch": 1.34, + "learning_rate": 0.0001755764467310617, + "loss": 1.5381, + "step": 16984 + }, + { + "epoch": 1.34, + "learning_rate": 0.0001755642679236843, + "loss": 1.5615, + "step": 16985 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017555208894273958, + "loss": 1.5469, + "step": 16986 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017553990978831036, + "loss": 1.5218, + "step": 16987 + }, + { + "epoch": 1.34, + "learning_rate": 0.0001755277304604792, + "loss": 1.5387, + "step": 16988 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017551555095932886, + "loss": 1.5845, + "step": 16989 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017550337128494198, + "loss": 1.52, + "step": 16990 + }, + { + "epoch": 1.34, + "learning_rate": 0.0001754911914374013, + "loss": 1.4728, + "step": 16991 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017547901141678953, + "loss": 1.543, + "step": 16992 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017546683122318925, + "loss": 1.5253, + "step": 16993 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017545465085668332, + "loss": 1.5154, + "step": 16994 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017544247031735434, + "loss": 1.5086, + "step": 16995 + }, + { + "epoch": 1.34, + "learning_rate": 0.000175430289605285, + "loss": 1.5095, + "step": 16996 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017541810872055805, + "loss": 1.4928, + "step": 16997 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017540592766325617, + "loss": 1.52, + "step": 16998 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017539374643346206, + "loss": 1.5822, + "step": 16999 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017538156503125842, + "loss": 1.4905, + "step": 17000 + }, + { + "epoch": 1.34, + "learning_rate": 0.0001753693834567279, + "loss": 1.5511, + "step": 17001 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017535720170995335, + "loss": 1.5317, + "step": 17002 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017534501979101736, + "loss": 1.5585, + "step": 17003 + }, + { + "epoch": 1.34, + "learning_rate": 0.0001753328377000027, + "loss": 1.5458, + "step": 17004 + }, + { + "epoch": 1.34, + "learning_rate": 0.000175320655436992, + "loss": 1.5033, + "step": 17005 + }, + { + "epoch": 1.34, + "learning_rate": 0.0001753084730020681, + "loss": 1.5388, + "step": 17006 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017529629039531356, + "loss": 1.5634, + "step": 17007 + }, + { + "epoch": 1.34, + "learning_rate": 0.0001752841076168112, + "loss": 1.4858, + "step": 17008 + }, + { + "epoch": 1.34, + "learning_rate": 0.0001752719246666437, + "loss": 1.4894, + "step": 17009 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017525974154489375, + "loss": 1.541, + "step": 17010 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017524755825164417, + "loss": 1.5027, + "step": 17011 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017523537478697753, + "loss": 1.5733, + "step": 17012 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017522319115097665, + "loss": 1.5385, + "step": 17013 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017521100734372422, + "loss": 1.4957, + "step": 17014 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017519882336530297, + "loss": 1.5678, + "step": 17015 + }, + { + "epoch": 1.34, + "learning_rate": 0.0001751866392157956, + "loss": 1.5918, + "step": 17016 + }, + { + "epoch": 1.34, + "learning_rate": 0.0001751744548952848, + "loss": 1.5545, + "step": 17017 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017516227040385344, + "loss": 1.4933, + "step": 17018 + }, + { + "epoch": 1.34, + "learning_rate": 0.0001751500857415841, + "loss": 1.5343, + "step": 17019 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017513790090855955, + "loss": 1.5413, + "step": 17020 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017512571590486256, + "loss": 1.5172, + "step": 17021 + }, + { + "epoch": 1.34, + "learning_rate": 0.0001751135307305758, + "loss": 1.5617, + "step": 17022 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017510134538578203, + "loss": 1.5786, + "step": 17023 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017508915987056396, + "loss": 1.5034, + "step": 17024 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017507697418500437, + "loss": 1.5852, + "step": 17025 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017506478832918595, + "loss": 1.5136, + "step": 17026 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017505260230319143, + "loss": 1.5282, + "step": 17027 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017504041610710359, + "loss": 1.4995, + "step": 17028 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017502822974100514, + "loss": 1.5112, + "step": 17029 + }, + { + "epoch": 1.34, + "learning_rate": 0.0001750160432049788, + "loss": 1.5431, + "step": 17030 + }, + { + "epoch": 1.34, + "learning_rate": 0.0001750038564991074, + "loss": 1.4808, + "step": 17031 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017499166962347355, + "loss": 1.5407, + "step": 17032 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017497948257816002, + "loss": 1.5268, + "step": 17033 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017496729536324964, + "loss": 1.5038, + "step": 17034 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017495510797882512, + "loss": 1.5262, + "step": 17035 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017494292042496916, + "loss": 1.5306, + "step": 17036 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017493073270176453, + "loss": 1.5508, + "step": 17037 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017491854480929404, + "loss": 1.5083, + "step": 17038 + }, + { + "epoch": 1.34, + "learning_rate": 0.0001749063567476403, + "loss": 1.5487, + "step": 17039 + }, + { + "epoch": 1.34, + "learning_rate": 0.0001748941685168862, + "loss": 1.5336, + "step": 17040 + }, + { + "epoch": 1.34, + "learning_rate": 0.0001748819801171144, + "loss": 1.5252, + "step": 17041 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017486979154840765, + "loss": 1.5252, + "step": 17042 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017485760281084884, + "loss": 1.5018, + "step": 17043 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017484541390452055, + "loss": 1.524, + "step": 17044 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017483322482950565, + "loss": 1.5282, + "step": 17045 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017482103558588683, + "loss": 1.5114, + "step": 17046 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017480884617374689, + "loss": 1.5583, + "step": 17047 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017479665659316857, + "loss": 1.5252, + "step": 17048 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017478446684423462, + "loss": 1.5146, + "step": 17049 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017477227692702784, + "loss": 1.5061, + "step": 17050 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017476008684163093, + "loss": 1.5881, + "step": 17051 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017474789658812677, + "loss": 1.5007, + "step": 17052 + }, + { + "epoch": 1.34, + "learning_rate": 0.000174735706166598, + "loss": 1.5015, + "step": 17053 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017472351557712743, + "loss": 1.4902, + "step": 17054 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017471132481979785, + "loss": 1.5271, + "step": 17055 + }, + { + "epoch": 1.34, + "learning_rate": 0.000174699133894692, + "loss": 1.5003, + "step": 17056 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017468694280189267, + "loss": 1.5442, + "step": 17057 + }, + { + "epoch": 1.34, + "learning_rate": 0.0001746747515414826, + "loss": 1.5694, + "step": 17058 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017466256011354462, + "loss": 1.5106, + "step": 17059 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017465036851816145, + "loss": 1.5306, + "step": 17060 + }, + { + "epoch": 1.34, + "learning_rate": 0.0001746381767554159, + "loss": 1.4954, + "step": 17061 + }, + { + "epoch": 1.34, + "learning_rate": 0.0001746259848253907, + "loss": 1.5789, + "step": 17062 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017461379272816867, + "loss": 1.5571, + "step": 17063 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017460160046383252, + "loss": 1.5056, + "step": 17064 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017458940803246516, + "loss": 1.5418, + "step": 17065 + }, + { + "epoch": 1.34, + "learning_rate": 0.0001745772154341492, + "loss": 1.5571, + "step": 17066 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017456502266896757, + "loss": 1.5968, + "step": 17067 + }, + { + "epoch": 1.34, + "learning_rate": 0.000174552829737003, + "loss": 1.5205, + "step": 17068 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017454063663833823, + "loss": 1.5502, + "step": 17069 + }, + { + "epoch": 1.34, + "learning_rate": 0.0001745284433730561, + "loss": 1.563, + "step": 17070 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017451624994123936, + "loss": 1.5499, + "step": 17071 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017450405634297084, + "loss": 1.5024, + "step": 17072 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017449186257833326, + "loss": 1.5339, + "step": 17073 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017447966864740948, + "loss": 1.5217, + "step": 17074 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017446747455028227, + "loss": 1.4797, + "step": 17075 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017445528028703437, + "loss": 1.522, + "step": 17076 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017444308585774866, + "loss": 1.5376, + "step": 17077 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017443089126250786, + "loss": 1.5431, + "step": 17078 + }, + { + "epoch": 1.34, + "learning_rate": 0.0001744186965013948, + "loss": 1.5494, + "step": 17079 + }, + { + "epoch": 1.34, + "learning_rate": 0.0001744065015744922, + "loss": 1.5454, + "step": 17080 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017439430648188303, + "loss": 1.5837, + "step": 17081 + }, + { + "epoch": 1.34, + "learning_rate": 0.0001743821112236499, + "loss": 1.543, + "step": 17082 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017436991579987572, + "loss": 1.4887, + "step": 17083 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017435772021064328, + "loss": 1.5369, + "step": 17084 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017434552445603533, + "loss": 1.5276, + "step": 17085 + }, + { + "epoch": 1.34, + "learning_rate": 0.0001743333285361347, + "loss": 1.5348, + "step": 17086 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017432113245102423, + "loss": 1.5086, + "step": 17087 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017430893620078665, + "loss": 1.5535, + "step": 17088 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017429673978550483, + "loss": 1.5234, + "step": 17089 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017428454320526156, + "loss": 1.4983, + "step": 17090 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017427234646013966, + "loss": 1.5142, + "step": 17091 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017426014955022193, + "loss": 1.5642, + "step": 17092 + }, + { + "epoch": 1.34, + "learning_rate": 0.0001742479524755911, + "loss": 1.4969, + "step": 17093 + }, + { + "epoch": 1.34, + "learning_rate": 0.00017423575523633011, + "loss": 1.5485, + "step": 17094 + }, + { + "epoch": 1.35, + "learning_rate": 0.0001742235578325217, + "loss": 1.5218, + "step": 17095 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017421136026424873, + "loss": 1.5082, + "step": 17096 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017419916253159394, + "loss": 1.583, + "step": 17097 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017418696463464018, + "loss": 1.5687, + "step": 17098 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017417476657347034, + "loss": 1.5099, + "step": 17099 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017416256834816714, + "loss": 1.583, + "step": 17100 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017415036995881345, + "loss": 1.5553, + "step": 17101 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017413817140549205, + "loss": 1.5076, + "step": 17102 + }, + { + "epoch": 1.35, + "learning_rate": 0.0001741259726882858, + "loss": 1.5539, + "step": 17103 + }, + { + "epoch": 1.35, + "learning_rate": 0.0001741137738072775, + "loss": 1.5487, + "step": 17104 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017410157476255, + "loss": 1.5221, + "step": 17105 + }, + { + "epoch": 1.35, + "learning_rate": 0.0001740893755541861, + "loss": 1.5662, + "step": 17106 + }, + { + "epoch": 1.35, + "learning_rate": 0.0001740771761822686, + "loss": 1.5561, + "step": 17107 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017406497664688045, + "loss": 1.4688, + "step": 17108 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017405277694810433, + "loss": 1.5229, + "step": 17109 + }, + { + "epoch": 1.35, + "learning_rate": 0.0001740405770860231, + "loss": 1.5272, + "step": 17110 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017402837706071962, + "loss": 1.5753, + "step": 17111 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017401617687227676, + "loss": 1.6127, + "step": 17112 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017400397652077732, + "loss": 1.5643, + "step": 17113 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017399177600630413, + "loss": 1.541, + "step": 17114 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017397957532894, + "loss": 1.53, + "step": 17115 + }, + { + "epoch": 1.35, + "learning_rate": 0.0001739673744887678, + "loss": 1.4654, + "step": 17116 + }, + { + "epoch": 1.35, + "learning_rate": 0.0001739551734858703, + "loss": 1.5555, + "step": 17117 + }, + { + "epoch": 1.35, + "learning_rate": 0.0001739429723203305, + "loss": 1.5291, + "step": 17118 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017393077099223098, + "loss": 1.5445, + "step": 17119 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017391856950165483, + "loss": 1.5669, + "step": 17120 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017390636784868477, + "loss": 1.551, + "step": 17121 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017389416603340367, + "loss": 1.5353, + "step": 17122 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017388196405589438, + "loss": 1.5334, + "step": 17123 + }, + { + "epoch": 1.35, + "learning_rate": 0.0001738697619162397, + "loss": 1.5425, + "step": 17124 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017385755961452253, + "loss": 1.5194, + "step": 17125 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017384535715082573, + "loss": 1.5256, + "step": 17126 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017383315452523202, + "loss": 1.5191, + "step": 17127 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017382095173782444, + "loss": 1.5448, + "step": 17128 + }, + { + "epoch": 1.35, + "learning_rate": 0.0001738087487886857, + "loss": 1.5086, + "step": 17129 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017379654567789871, + "loss": 1.5494, + "step": 17130 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017378434240554631, + "loss": 1.5341, + "step": 17131 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017377213897171132, + "loss": 1.5699, + "step": 17132 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017375993537647666, + "loss": 1.5045, + "step": 17133 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017374773161992513, + "loss": 1.5158, + "step": 17134 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017373552770213958, + "loss": 1.499, + "step": 17135 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017372332362320292, + "loss": 1.5534, + "step": 17136 + }, + { + "epoch": 1.35, + "learning_rate": 0.000173711119383198, + "loss": 1.5489, + "step": 17137 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017369891498220767, + "loss": 1.557, + "step": 17138 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017368671042031477, + "loss": 1.5578, + "step": 17139 + }, + { + "epoch": 1.35, + "learning_rate": 0.0001736745056976022, + "loss": 1.4834, + "step": 17140 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017366230081415274, + "loss": 1.5468, + "step": 17141 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017365009577004938, + "loss": 1.5077, + "step": 17142 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017363789056537487, + "loss": 1.4729, + "step": 17143 + }, + { + "epoch": 1.35, + "learning_rate": 0.0001736256852002121, + "loss": 1.5503, + "step": 17144 + }, + { + "epoch": 1.35, + "learning_rate": 0.0001736134796746441, + "loss": 1.4944, + "step": 17145 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017360127398875349, + "loss": 1.5543, + "step": 17146 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017358906814262328, + "loss": 1.5363, + "step": 17147 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017357686213633635, + "loss": 1.5412, + "step": 17148 + }, + { + "epoch": 1.35, + "learning_rate": 0.0001735646559699755, + "loss": 1.5184, + "step": 17149 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017355244964362363, + "loss": 1.5248, + "step": 17150 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017354024315736362, + "loss": 1.5704, + "step": 17151 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017352803651127837, + "loss": 1.5201, + "step": 17152 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017351582970545073, + "loss": 1.5442, + "step": 17153 + }, + { + "epoch": 1.35, + "learning_rate": 0.0001735036227399636, + "loss": 1.6035, + "step": 17154 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017349141561489987, + "loss": 1.4942, + "step": 17155 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017347920833034233, + "loss": 1.5099, + "step": 17156 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017346700088637394, + "loss": 1.4712, + "step": 17157 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017345479328307754, + "loss": 1.5261, + "step": 17158 + }, + { + "epoch": 1.35, + "learning_rate": 0.0001734425855205361, + "loss": 1.5015, + "step": 17159 + }, + { + "epoch": 1.35, + "learning_rate": 0.0001734303775988324, + "loss": 1.5635, + "step": 17160 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017341816951804936, + "loss": 1.5621, + "step": 17161 + }, + { + "epoch": 1.35, + "learning_rate": 0.0001734059612782699, + "loss": 1.5212, + "step": 17162 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017339375287957686, + "loss": 1.5856, + "step": 17163 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017338154432205318, + "loss": 1.5623, + "step": 17164 + }, + { + "epoch": 1.35, + "learning_rate": 0.0001733693356057817, + "loss": 1.5092, + "step": 17165 + }, + { + "epoch": 1.35, + "learning_rate": 0.0001733571267308453, + "loss": 1.5434, + "step": 17166 + }, + { + "epoch": 1.35, + "learning_rate": 0.0001733449176973269, + "loss": 1.4802, + "step": 17167 + }, + { + "epoch": 1.35, + "learning_rate": 0.0001733327085053094, + "loss": 1.4992, + "step": 17168 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017332049915487572, + "loss": 1.5504, + "step": 17169 + }, + { + "epoch": 1.35, + "learning_rate": 0.0001733082896461087, + "loss": 1.5019, + "step": 17170 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017329607997909125, + "loss": 1.5464, + "step": 17171 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017328387015390627, + "loss": 1.5431, + "step": 17172 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017327166017063665, + "loss": 1.5066, + "step": 17173 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017325945002936532, + "loss": 1.5267, + "step": 17174 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017324723973017515, + "loss": 1.5209, + "step": 17175 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017323502927314905, + "loss": 1.5405, + "step": 17176 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017322281865836994, + "loss": 1.5222, + "step": 17177 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017321060788592067, + "loss": 1.5216, + "step": 17178 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017319839695588424, + "loss": 1.5031, + "step": 17179 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017318618586834345, + "loss": 1.5291, + "step": 17180 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017317397462338126, + "loss": 1.5053, + "step": 17181 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017316176322108056, + "loss": 1.5045, + "step": 17182 + }, + { + "epoch": 1.35, + "learning_rate": 0.0001731495516615243, + "loss": 1.5722, + "step": 17183 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017313733994479531, + "loss": 1.4852, + "step": 17184 + }, + { + "epoch": 1.35, + "learning_rate": 0.0001731251280709766, + "loss": 1.5937, + "step": 17185 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017311291604015105, + "loss": 1.5416, + "step": 17186 + }, + { + "epoch": 1.35, + "learning_rate": 0.0001731007038524015, + "loss": 1.5481, + "step": 17187 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017308849150781094, + "loss": 1.5503, + "step": 17188 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017307627900646228, + "loss": 1.6046, + "step": 17189 + }, + { + "epoch": 1.35, + "learning_rate": 0.0001730640663484384, + "loss": 1.5427, + "step": 17190 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017305185353382223, + "loss": 1.5582, + "step": 17191 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017303964056269668, + "loss": 1.5239, + "step": 17192 + }, + { + "epoch": 1.35, + "learning_rate": 0.0001730274274351447, + "loss": 1.5528, + "step": 17193 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017301521415124925, + "loss": 1.5167, + "step": 17194 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017300300071109315, + "loss": 1.4923, + "step": 17195 + }, + { + "epoch": 1.35, + "learning_rate": 0.0001729907871147594, + "loss": 1.5405, + "step": 17196 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017297857336233085, + "loss": 1.5119, + "step": 17197 + }, + { + "epoch": 1.35, + "learning_rate": 0.0001729663594538905, + "loss": 1.4842, + "step": 17198 + }, + { + "epoch": 1.35, + "learning_rate": 0.0001729541453895212, + "loss": 1.5193, + "step": 17199 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017294193116930594, + "loss": 1.5912, + "step": 17200 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017292971679332765, + "loss": 1.5508, + "step": 17201 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017291750226166918, + "loss": 1.5504, + "step": 17202 + }, + { + "epoch": 1.35, + "learning_rate": 0.0001729052875744136, + "loss": 1.5434, + "step": 17203 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017289307273164373, + "loss": 1.5311, + "step": 17204 + }, + { + "epoch": 1.35, + "learning_rate": 0.0001728808577334425, + "loss": 1.4916, + "step": 17205 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017286864257989287, + "loss": 1.5247, + "step": 17206 + }, + { + "epoch": 1.35, + "learning_rate": 0.0001728564272710778, + "loss": 1.5345, + "step": 17207 + }, + { + "epoch": 1.35, + "learning_rate": 0.0001728442118070802, + "loss": 1.5934, + "step": 17208 + }, + { + "epoch": 1.35, + "learning_rate": 0.000172831996187983, + "loss": 1.5649, + "step": 17209 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017281978041386913, + "loss": 1.5375, + "step": 17210 + }, + { + "epoch": 1.35, + "learning_rate": 0.0001728075644848216, + "loss": 1.5787, + "step": 17211 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017279534840092324, + "loss": 1.5557, + "step": 17212 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017278313216225705, + "loss": 1.5696, + "step": 17213 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017277091576890598, + "loss": 1.5153, + "step": 17214 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017275869922095296, + "loss": 1.5379, + "step": 17215 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017274648251848092, + "loss": 1.4985, + "step": 17216 + }, + { + "epoch": 1.35, + "learning_rate": 0.0001727342656615728, + "loss": 1.5191, + "step": 17217 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017272204865031163, + "loss": 1.6207, + "step": 17218 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017270983148478023, + "loss": 1.5099, + "step": 17219 + }, + { + "epoch": 1.35, + "learning_rate": 0.00017269761416506164, + "loss": 1.5572, + "step": 17220 + }, + { + "epoch": 1.35, + "learning_rate": 0.0001726853966912387, + "loss": 1.483, + "step": 17221 + }, + { + "epoch": 1.36, + "learning_rate": 0.0001726731790633945, + "loss": 1.524, + "step": 17222 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017266096128161192, + "loss": 1.5318, + "step": 17223 + }, + { + "epoch": 1.36, + "learning_rate": 0.0001726487433459739, + "loss": 1.52, + "step": 17224 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017263652525656347, + "loss": 1.5552, + "step": 17225 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017262430701346347, + "loss": 1.484, + "step": 17226 + }, + { + "epoch": 1.36, + "learning_rate": 0.0001726120886167569, + "loss": 1.5453, + "step": 17227 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017259987006652678, + "loss": 1.4997, + "step": 17228 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017258765136285597, + "loss": 1.4844, + "step": 17229 + }, + { + "epoch": 1.36, + "learning_rate": 0.0001725754325058275, + "loss": 1.5499, + "step": 17230 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017256321349552427, + "loss": 1.553, + "step": 17231 + }, + { + "epoch": 1.36, + "learning_rate": 0.0001725509943320293, + "loss": 1.4895, + "step": 17232 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017253877501542553, + "loss": 1.5023, + "step": 17233 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017252655554579588, + "loss": 1.5057, + "step": 17234 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017251433592322337, + "loss": 1.5527, + "step": 17235 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017250211614779093, + "loss": 1.5732, + "step": 17236 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017248989621958155, + "loss": 1.5469, + "step": 17237 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017247767613867818, + "loss": 1.5501, + "step": 17238 + }, + { + "epoch": 1.36, + "learning_rate": 0.0001724654559051638, + "loss": 1.4859, + "step": 17239 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017245323551912136, + "loss": 1.5474, + "step": 17240 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017244101498063385, + "loss": 1.5508, + "step": 17241 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017242879428978428, + "loss": 1.5616, + "step": 17242 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017241657344665553, + "loss": 1.4713, + "step": 17243 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017240435245133057, + "loss": 1.5773, + "step": 17244 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017239213130389245, + "loss": 1.5271, + "step": 17245 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017237991000442412, + "loss": 1.5192, + "step": 17246 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017236768855300862, + "loss": 1.5474, + "step": 17247 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017235546694972876, + "loss": 1.4942, + "step": 17248 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017234324519466764, + "loss": 1.575, + "step": 17249 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017233102328790826, + "loss": 1.5747, + "step": 17250 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017231880122953354, + "loss": 1.5788, + "step": 17251 + }, + { + "epoch": 1.36, + "learning_rate": 0.0001723065790196265, + "loss": 1.4819, + "step": 17252 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017229435665826998, + "loss": 1.5552, + "step": 17253 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017228213414554718, + "loss": 1.4696, + "step": 17254 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017226991148154097, + "loss": 1.5171, + "step": 17255 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017225768866633434, + "loss": 1.5369, + "step": 17256 + }, + { + "epoch": 1.36, + "learning_rate": 0.0001722454657000103, + "loss": 1.5317, + "step": 17257 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017223324258265182, + "loss": 1.5336, + "step": 17258 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017222101931434194, + "loss": 1.5324, + "step": 17259 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017220879589516352, + "loss": 1.5155, + "step": 17260 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017219657232519963, + "loss": 1.5784, + "step": 17261 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017218434860453332, + "loss": 1.5605, + "step": 17262 + }, + { + "epoch": 1.36, + "learning_rate": 0.0001721721247332475, + "loss": 1.5264, + "step": 17263 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017215990071142522, + "loss": 1.4776, + "step": 17264 + }, + { + "epoch": 1.36, + "learning_rate": 0.0001721476765391494, + "loss": 1.5422, + "step": 17265 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017213545221650306, + "loss": 1.4895, + "step": 17266 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017212322774356927, + "loss": 1.5099, + "step": 17267 + }, + { + "epoch": 1.36, + "learning_rate": 0.0001721110031204309, + "loss": 1.5163, + "step": 17268 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017209877834717112, + "loss": 1.5114, + "step": 17269 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017208655342387276, + "loss": 1.5462, + "step": 17270 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017207432835061894, + "loss": 1.48, + "step": 17271 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017206210312749258, + "loss": 1.5122, + "step": 17272 + }, + { + "epoch": 1.36, + "learning_rate": 0.0001720498777545767, + "loss": 1.4971, + "step": 17273 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017203765223195434, + "loss": 1.5756, + "step": 17274 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017202542655970847, + "loss": 1.5803, + "step": 17275 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017201320073792213, + "loss": 1.5031, + "step": 17276 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017200097476667827, + "loss": 1.5591, + "step": 17277 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017198874864605995, + "loss": 1.534, + "step": 17278 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017197652237615018, + "loss": 1.5248, + "step": 17279 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017196429595703195, + "loss": 1.4905, + "step": 17280 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017195206938878826, + "loss": 1.5315, + "step": 17281 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017193984267150212, + "loss": 1.4967, + "step": 17282 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017192761580525658, + "loss": 1.5137, + "step": 17283 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017191538879013458, + "loss": 1.5539, + "step": 17284 + }, + { + "epoch": 1.36, + "learning_rate": 0.0001719031616262192, + "loss": 1.5176, + "step": 17285 + }, + { + "epoch": 1.36, + "learning_rate": 0.0001718909343135935, + "loss": 1.506, + "step": 17286 + }, + { + "epoch": 1.36, + "learning_rate": 0.0001718787068523404, + "loss": 1.5509, + "step": 17287 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017186647924254296, + "loss": 1.5307, + "step": 17288 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017185425148428417, + "loss": 1.6049, + "step": 17289 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017184202357764706, + "loss": 1.4907, + "step": 17290 + }, + { + "epoch": 1.36, + "learning_rate": 0.0001718297955227147, + "loss": 1.4793, + "step": 17291 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017181756731957004, + "loss": 1.5237, + "step": 17292 + }, + { + "epoch": 1.36, + "learning_rate": 0.0001718053389682962, + "loss": 1.5224, + "step": 17293 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017179311046897606, + "loss": 1.5648, + "step": 17294 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017178088182169277, + "loss": 1.5137, + "step": 17295 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017176865302652935, + "loss": 1.5922, + "step": 17296 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017175642408356873, + "loss": 1.5253, + "step": 17297 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017174419499289405, + "loss": 1.6006, + "step": 17298 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017173196575458822, + "loss": 1.5337, + "step": 17299 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017171973636873438, + "loss": 1.5472, + "step": 17300 + }, + { + "epoch": 1.36, + "learning_rate": 0.0001717075068354155, + "loss": 1.5345, + "step": 17301 + }, + { + "epoch": 1.36, + "learning_rate": 0.0001716952771547146, + "loss": 1.5058, + "step": 17302 + }, + { + "epoch": 1.36, + "learning_rate": 0.0001716830473267148, + "loss": 1.5385, + "step": 17303 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017167081735149905, + "loss": 1.5288, + "step": 17304 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017165858722915039, + "loss": 1.4915, + "step": 17305 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017164635695975192, + "loss": 1.5557, + "step": 17306 + }, + { + "epoch": 1.36, + "learning_rate": 0.0001716341265433866, + "loss": 1.5398, + "step": 17307 + }, + { + "epoch": 1.36, + "learning_rate": 0.0001716218959801375, + "loss": 1.478, + "step": 17308 + }, + { + "epoch": 1.36, + "learning_rate": 0.0001716096652700876, + "loss": 1.4914, + "step": 17309 + }, + { + "epoch": 1.36, + "learning_rate": 0.0001715974344133201, + "loss": 1.5564, + "step": 17310 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017158520340991787, + "loss": 1.5397, + "step": 17311 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017157297225996407, + "loss": 1.5178, + "step": 17312 + }, + { + "epoch": 1.36, + "learning_rate": 0.0001715607409635417, + "loss": 1.5193, + "step": 17313 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017154850952073373, + "loss": 1.5339, + "step": 17314 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017153627793162335, + "loss": 1.565, + "step": 17315 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017152404619629342, + "loss": 1.5835, + "step": 17316 + }, + { + "epoch": 1.36, + "learning_rate": 0.0001715118143148272, + "loss": 1.5715, + "step": 17317 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017149958228730757, + "loss": 1.5339, + "step": 17318 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017148735011381766, + "loss": 1.4888, + "step": 17319 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017147511779444055, + "loss": 1.5024, + "step": 17320 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017146288532925917, + "loss": 1.5749, + "step": 17321 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017145065271835665, + "loss": 1.5258, + "step": 17322 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017143841996181608, + "loss": 1.5486, + "step": 17323 + }, + { + "epoch": 1.36, + "learning_rate": 0.0001714261870597204, + "loss": 1.4907, + "step": 17324 + }, + { + "epoch": 1.36, + "learning_rate": 0.0001714139540121528, + "loss": 1.5611, + "step": 17325 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017140172081919622, + "loss": 1.4928, + "step": 17326 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017138948748093383, + "loss": 1.5602, + "step": 17327 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017137725399744857, + "loss": 1.5576, + "step": 17328 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017136502036882358, + "loss": 1.5678, + "step": 17329 + }, + { + "epoch": 1.36, + "learning_rate": 0.0001713527865951419, + "loss": 1.59, + "step": 17330 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017134055267648652, + "loss": 1.5534, + "step": 17331 + }, + { + "epoch": 1.36, + "learning_rate": 0.0001713283186129406, + "loss": 1.5184, + "step": 17332 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017131608440458719, + "loss": 1.5001, + "step": 17333 + }, + { + "epoch": 1.36, + "learning_rate": 0.0001713038500515093, + "loss": 1.5713, + "step": 17334 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017129161555379005, + "loss": 1.5653, + "step": 17335 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017127938091151247, + "loss": 1.5436, + "step": 17336 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017126714612475966, + "loss": 1.5092, + "step": 17337 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017125491119361462, + "loss": 1.5583, + "step": 17338 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017124267611816048, + "loss": 1.5524, + "step": 17339 + }, + { + "epoch": 1.36, + "learning_rate": 0.0001712304408984803, + "loss": 1.5506, + "step": 17340 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017121820553465714, + "loss": 1.5285, + "step": 17341 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017120597002677406, + "loss": 1.5081, + "step": 17342 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017119373437491414, + "loss": 1.5421, + "step": 17343 + }, + { + "epoch": 1.36, + "learning_rate": 0.0001711814985791605, + "loss": 1.5186, + "step": 17344 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017116926263959615, + "loss": 1.5289, + "step": 17345 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017115702655630415, + "loss": 1.5381, + "step": 17346 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017114479032936768, + "loss": 1.5394, + "step": 17347 + }, + { + "epoch": 1.36, + "learning_rate": 0.00017113255395886972, + "loss": 1.5095, + "step": 17348 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017112031744489337, + "loss": 1.5272, + "step": 17349 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017110808078752172, + "loss": 1.5196, + "step": 17350 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017109584398683787, + "loss": 1.4618, + "step": 17351 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017108360704292492, + "loss": 1.5376, + "step": 17352 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017107136995586584, + "loss": 1.5254, + "step": 17353 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017105913272574382, + "loss": 1.4973, + "step": 17354 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017104689535264186, + "loss": 1.4862, + "step": 17355 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017103465783664318, + "loss": 1.5719, + "step": 17356 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017102242017783074, + "loss": 1.532, + "step": 17357 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017101018237628763, + "loss": 1.5239, + "step": 17358 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017099794443209705, + "loss": 1.5175, + "step": 17359 + }, + { + "epoch": 1.37, + "learning_rate": 0.000170985706345342, + "loss": 1.4996, + "step": 17360 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017097346811610555, + "loss": 1.5234, + "step": 17361 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017096122974447084, + "loss": 1.5276, + "step": 17362 + }, + { + "epoch": 1.37, + "learning_rate": 0.0001709489912305209, + "loss": 1.4901, + "step": 17363 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017093675257433892, + "loss": 1.5651, + "step": 17364 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017092451377600794, + "loss": 1.5251, + "step": 17365 + }, + { + "epoch": 1.37, + "learning_rate": 0.0001709122748356111, + "loss": 1.5422, + "step": 17366 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017090003575323138, + "loss": 1.5801, + "step": 17367 + }, + { + "epoch": 1.37, + "learning_rate": 0.000170887796528952, + "loss": 1.5184, + "step": 17368 + }, + { + "epoch": 1.37, + "learning_rate": 0.000170875557162856, + "loss": 1.5063, + "step": 17369 + }, + { + "epoch": 1.37, + "learning_rate": 0.0001708633176550265, + "loss": 1.5147, + "step": 17370 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017085107800554654, + "loss": 1.5313, + "step": 17371 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017083883821449928, + "loss": 1.4681, + "step": 17372 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017082659828196787, + "loss": 1.5258, + "step": 17373 + }, + { + "epoch": 1.37, + "learning_rate": 0.0001708143582080353, + "loss": 1.5137, + "step": 17374 + }, + { + "epoch": 1.37, + "learning_rate": 0.0001708021179927847, + "loss": 1.5408, + "step": 17375 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017078987763629927, + "loss": 1.5824, + "step": 17376 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017077763713866197, + "loss": 1.5124, + "step": 17377 + }, + { + "epoch": 1.37, + "learning_rate": 0.000170765396499956, + "loss": 1.5072, + "step": 17378 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017075315572026442, + "loss": 1.5202, + "step": 17379 + }, + { + "epoch": 1.37, + "learning_rate": 0.0001707409147996704, + "loss": 1.5091, + "step": 17380 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017072867373825703, + "loss": 1.5121, + "step": 17381 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017071643253610742, + "loss": 1.5001, + "step": 17382 + }, + { + "epoch": 1.37, + "learning_rate": 0.0001707041911933046, + "loss": 1.5561, + "step": 17383 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017069194970993181, + "loss": 1.4914, + "step": 17384 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017067970808607203, + "loss": 1.5131, + "step": 17385 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017066746632180848, + "loss": 1.5351, + "step": 17386 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017065522441722425, + "loss": 1.4892, + "step": 17387 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017064298237240248, + "loss": 1.4898, + "step": 17388 + }, + { + "epoch": 1.37, + "learning_rate": 0.0001706307401874262, + "loss": 1.527, + "step": 17389 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017061849786237856, + "loss": 1.512, + "step": 17390 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017060625539734277, + "loss": 1.522, + "step": 17391 + }, + { + "epoch": 1.37, + "learning_rate": 0.0001705940127924018, + "loss": 1.5269, + "step": 17392 + }, + { + "epoch": 1.37, + "learning_rate": 0.0001705817700476389, + "loss": 1.4887, + "step": 17393 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017056952716313712, + "loss": 1.5201, + "step": 17394 + }, + { + "epoch": 1.37, + "learning_rate": 0.0001705572841389796, + "loss": 1.5039, + "step": 17395 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017054504097524948, + "loss": 1.562, + "step": 17396 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017053279767202984, + "loss": 1.54, + "step": 17397 + }, + { + "epoch": 1.37, + "learning_rate": 0.0001705205542294039, + "loss": 1.5189, + "step": 17398 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017050831064745463, + "loss": 1.4841, + "step": 17399 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017049606692626533, + "loss": 1.4806, + "step": 17400 + }, + { + "epoch": 1.37, + "learning_rate": 0.000170483823065919, + "loss": 1.523, + "step": 17401 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017047157906649883, + "loss": 1.5533, + "step": 17402 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017045933492808792, + "loss": 1.518, + "step": 17403 + }, + { + "epoch": 1.37, + "learning_rate": 0.0001704470906507694, + "loss": 1.4726, + "step": 17404 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017043484623462647, + "loss": 1.5992, + "step": 17405 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017042260167974218, + "loss": 1.517, + "step": 17406 + }, + { + "epoch": 1.37, + "learning_rate": 0.0001704103569861997, + "loss": 1.54, + "step": 17407 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017039811215408218, + "loss": 1.5604, + "step": 17408 + }, + { + "epoch": 1.37, + "learning_rate": 0.0001703858671834727, + "loss": 1.4863, + "step": 17409 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017037362207445445, + "loss": 1.5199, + "step": 17410 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017036137682711054, + "loss": 1.4933, + "step": 17411 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017034913144152415, + "loss": 1.5222, + "step": 17412 + }, + { + "epoch": 1.37, + "learning_rate": 0.0001703368859177783, + "loss": 1.5125, + "step": 17413 + }, + { + "epoch": 1.37, + "learning_rate": 0.0001703246402559563, + "loss": 1.5001, + "step": 17414 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017031239445614122, + "loss": 1.5034, + "step": 17415 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017030014851841615, + "loss": 1.5759, + "step": 17416 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017028790244286426, + "loss": 1.5908, + "step": 17417 + }, + { + "epoch": 1.37, + "learning_rate": 0.0001702756562295687, + "loss": 1.5297, + "step": 17418 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017026340987861266, + "loss": 1.529, + "step": 17419 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017025116339007925, + "loss": 1.5333, + "step": 17420 + }, + { + "epoch": 1.37, + "learning_rate": 0.0001702389167640516, + "loss": 1.5202, + "step": 17421 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017022667000061293, + "loss": 1.5518, + "step": 17422 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017021442309984628, + "loss": 1.5299, + "step": 17423 + }, + { + "epoch": 1.37, + "learning_rate": 0.0001702021760618348, + "loss": 1.5479, + "step": 17424 + }, + { + "epoch": 1.37, + "learning_rate": 0.0001701899288866618, + "loss": 1.5597, + "step": 17425 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017017768157441025, + "loss": 1.5021, + "step": 17426 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017016543412516342, + "loss": 1.557, + "step": 17427 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017015318653900439, + "loss": 1.5447, + "step": 17428 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017014093881601635, + "loss": 1.5608, + "step": 17429 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017012869095628247, + "loss": 1.535, + "step": 17430 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017011644295988583, + "loss": 1.5686, + "step": 17431 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017010419482690973, + "loss": 1.4905, + "step": 17432 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017009194655743718, + "loss": 1.493, + "step": 17433 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017007969815155145, + "loss": 1.561, + "step": 17434 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017006744960933558, + "loss": 1.5095, + "step": 17435 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017005520093087284, + "loss": 1.5023, + "step": 17436 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017004295211624635, + "loss": 1.5082, + "step": 17437 + }, + { + "epoch": 1.37, + "learning_rate": 0.0001700307031655393, + "loss": 1.5218, + "step": 17438 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017001845407883483, + "loss": 1.5587, + "step": 17439 + }, + { + "epoch": 1.37, + "learning_rate": 0.00017000620485621608, + "loss": 1.5257, + "step": 17440 + }, + { + "epoch": 1.37, + "learning_rate": 0.00016999395549776623, + "loss": 1.5398, + "step": 17441 + }, + { + "epoch": 1.37, + "learning_rate": 0.00016998170600356847, + "loss": 1.4871, + "step": 17442 + }, + { + "epoch": 1.37, + "learning_rate": 0.00016996945637370593, + "loss": 1.5079, + "step": 17443 + }, + { + "epoch": 1.37, + "learning_rate": 0.00016995720660826184, + "loss": 1.5628, + "step": 17444 + }, + { + "epoch": 1.37, + "learning_rate": 0.00016994495670731932, + "loss": 1.5037, + "step": 17445 + }, + { + "epoch": 1.37, + "learning_rate": 0.00016993270667096152, + "loss": 1.5031, + "step": 17446 + }, + { + "epoch": 1.37, + "learning_rate": 0.0001699204564992717, + "loss": 1.5414, + "step": 17447 + }, + { + "epoch": 1.37, + "learning_rate": 0.00016990820619233293, + "loss": 1.5249, + "step": 17448 + }, + { + "epoch": 1.37, + "learning_rate": 0.00016989595575022843, + "loss": 1.5024, + "step": 17449 + }, + { + "epoch": 1.37, + "learning_rate": 0.00016988370517304134, + "loss": 1.5403, + "step": 17450 + }, + { + "epoch": 1.37, + "learning_rate": 0.00016987145446085492, + "loss": 1.5538, + "step": 17451 + }, + { + "epoch": 1.37, + "learning_rate": 0.00016985920361375228, + "loss": 1.548, + "step": 17452 + }, + { + "epoch": 1.37, + "learning_rate": 0.00016984695263181656, + "loss": 1.5753, + "step": 17453 + }, + { + "epoch": 1.37, + "learning_rate": 0.00016983470151513103, + "loss": 1.5647, + "step": 17454 + }, + { + "epoch": 1.37, + "learning_rate": 0.00016982245026377885, + "loss": 1.5428, + "step": 17455 + }, + { + "epoch": 1.37, + "learning_rate": 0.00016981019887784312, + "loss": 1.5622, + "step": 17456 + }, + { + "epoch": 1.37, + "learning_rate": 0.00016979794735740708, + "loss": 1.5694, + "step": 17457 + }, + { + "epoch": 1.37, + "learning_rate": 0.0001697856957025539, + "loss": 1.5506, + "step": 17458 + }, + { + "epoch": 1.37, + "learning_rate": 0.00016977344391336675, + "loss": 1.5566, + "step": 17459 + }, + { + "epoch": 1.37, + "learning_rate": 0.00016976119198992888, + "loss": 1.5531, + "step": 17460 + }, + { + "epoch": 1.37, + "learning_rate": 0.0001697489399323234, + "loss": 1.5702, + "step": 17461 + }, + { + "epoch": 1.37, + "learning_rate": 0.0001697366877406335, + "loss": 1.5447, + "step": 17462 + }, + { + "epoch": 1.37, + "learning_rate": 0.00016972443541494239, + "loss": 1.5294, + "step": 17463 + }, + { + "epoch": 1.37, + "learning_rate": 0.0001697121829553333, + "loss": 1.5523, + "step": 17464 + }, + { + "epoch": 1.37, + "learning_rate": 0.00016969993036188924, + "loss": 1.4913, + "step": 17465 + }, + { + "epoch": 1.37, + "learning_rate": 0.00016968767763469363, + "loss": 1.497, + "step": 17466 + }, + { + "epoch": 1.37, + "learning_rate": 0.0001696754247738295, + "loss": 1.5043, + "step": 17467 + }, + { + "epoch": 1.37, + "learning_rate": 0.00016966317177938015, + "loss": 1.5152, + "step": 17468 + }, + { + "epoch": 1.37, + "learning_rate": 0.00016965091865142867, + "loss": 1.5746, + "step": 17469 + }, + { + "epoch": 1.37, + "learning_rate": 0.0001696386653900583, + "loss": 1.4945, + "step": 17470 + }, + { + "epoch": 1.37, + "learning_rate": 0.00016962641199535225, + "loss": 1.5512, + "step": 17471 + }, + { + "epoch": 1.37, + "learning_rate": 0.00016961415846739365, + "loss": 1.4878, + "step": 17472 + }, + { + "epoch": 1.37, + "learning_rate": 0.00016960190480626576, + "loss": 1.5478, + "step": 17473 + }, + { + "epoch": 1.37, + "learning_rate": 0.0001695896510120518, + "loss": 1.5924, + "step": 17474 + }, + { + "epoch": 1.37, + "learning_rate": 0.00016957739708483484, + "loss": 1.5197, + "step": 17475 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016956514302469823, + "loss": 1.5804, + "step": 17476 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016955288883172508, + "loss": 1.5047, + "step": 17477 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016954063450599858, + "loss": 1.5177, + "step": 17478 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016952838004760198, + "loss": 1.5006, + "step": 17479 + }, + { + "epoch": 1.38, + "learning_rate": 0.0001695161254566184, + "loss": 1.5721, + "step": 17480 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016950387073313115, + "loss": 1.4999, + "step": 17481 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016949161587722337, + "loss": 1.5715, + "step": 17482 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016947936088897826, + "loss": 1.5428, + "step": 17483 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016946710576847907, + "loss": 1.4997, + "step": 17484 + }, + { + "epoch": 1.38, + "learning_rate": 0.000169454850515809, + "loss": 1.5298, + "step": 17485 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016944259513105116, + "loss": 1.5715, + "step": 17486 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016943033961428882, + "loss": 1.5442, + "step": 17487 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016941808396560523, + "loss": 1.5186, + "step": 17488 + }, + { + "epoch": 1.38, + "learning_rate": 0.0001694058281850836, + "loss": 1.5165, + "step": 17489 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016939357227280707, + "loss": 1.5665, + "step": 17490 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016938131622885888, + "loss": 1.4658, + "step": 17491 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016936906005332226, + "loss": 1.5474, + "step": 17492 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016935680374628042, + "loss": 1.557, + "step": 17493 + }, + { + "epoch": 1.38, + "learning_rate": 0.0001693445473078166, + "loss": 1.5283, + "step": 17494 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016933229073801394, + "loss": 1.5368, + "step": 17495 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016932003403695564, + "loss": 1.4972, + "step": 17496 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016930777720472505, + "loss": 1.5096, + "step": 17497 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016929552024140524, + "loss": 1.5034, + "step": 17498 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016928326314707954, + "loss": 1.4966, + "step": 17499 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016927100592183114, + "loss": 1.5236, + "step": 17500 + }, + { + "epoch": 1.38, + "learning_rate": 0.0001692587485657432, + "loss": 1.5986, + "step": 17501 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016924649107889902, + "loss": 1.5516, + "step": 17502 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016923423346138178, + "loss": 1.4911, + "step": 17503 + }, + { + "epoch": 1.38, + "learning_rate": 0.0001692219757132747, + "loss": 1.4777, + "step": 17504 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016920971783466101, + "loss": 1.5808, + "step": 17505 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016919745982562392, + "loss": 1.5754, + "step": 17506 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016918520168624675, + "loss": 1.508, + "step": 17507 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016917294341661256, + "loss": 1.5387, + "step": 17508 + }, + { + "epoch": 1.38, + "learning_rate": 0.0001691606850168047, + "loss": 1.5134, + "step": 17509 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016914842648690638, + "loss": 1.5017, + "step": 17510 + }, + { + "epoch": 1.38, + "learning_rate": 0.0001691361678270008, + "loss": 1.55, + "step": 17511 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016912390903717117, + "loss": 1.5219, + "step": 17512 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016911165011750074, + "loss": 1.5277, + "step": 17513 + }, + { + "epoch": 1.38, + "learning_rate": 0.0001690993910680728, + "loss": 1.508, + "step": 17514 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016908713188897053, + "loss": 1.5312, + "step": 17515 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016907487258027715, + "loss": 1.5092, + "step": 17516 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016906261314207595, + "loss": 1.4974, + "step": 17517 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016905035357445006, + "loss": 1.5368, + "step": 17518 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016903809387748282, + "loss": 1.5229, + "step": 17519 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016902583405125742, + "loss": 1.5226, + "step": 17520 + }, + { + "epoch": 1.38, + "learning_rate": 0.0001690135740958571, + "loss": 1.518, + "step": 17521 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016900131401136515, + "loss": 1.5084, + "step": 17522 + }, + { + "epoch": 1.38, + "learning_rate": 0.0001689890537978647, + "loss": 1.49, + "step": 17523 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016897679345543912, + "loss": 1.5476, + "step": 17524 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016896453298417152, + "loss": 1.5068, + "step": 17525 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016895227238414526, + "loss": 1.5274, + "step": 17526 + }, + { + "epoch": 1.38, + "learning_rate": 0.0001689400116554435, + "loss": 1.4907, + "step": 17527 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016892775079814946, + "loss": 1.5221, + "step": 17528 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016891548981234656, + "loss": 1.4886, + "step": 17529 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016890322869811782, + "loss": 1.541, + "step": 17530 + }, + { + "epoch": 1.38, + "learning_rate": 0.0001688909674555466, + "loss": 1.4807, + "step": 17531 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016887870608471619, + "loss": 1.5277, + "step": 17532 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016886644458570976, + "loss": 1.5135, + "step": 17533 + }, + { + "epoch": 1.38, + "learning_rate": 0.0001688541829586106, + "loss": 1.4854, + "step": 17534 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016884192120350189, + "loss": 1.5056, + "step": 17535 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016882965932046696, + "loss": 1.5318, + "step": 17536 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016881739730958904, + "loss": 1.4831, + "step": 17537 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016880513517095137, + "loss": 1.4664, + "step": 17538 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016879287290463724, + "loss": 1.5387, + "step": 17539 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016878061051072983, + "loss": 1.5377, + "step": 17540 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016876834798931246, + "loss": 1.5276, + "step": 17541 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016875608534046838, + "loss": 1.5621, + "step": 17542 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016874382256428078, + "loss": 1.5356, + "step": 17543 + }, + { + "epoch": 1.38, + "learning_rate": 0.000168731559660833, + "loss": 1.5298, + "step": 17544 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016871929663020825, + "loss": 1.5004, + "step": 17545 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016870703347248984, + "loss": 1.5036, + "step": 17546 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016869477018776097, + "loss": 1.4937, + "step": 17547 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016868250677610496, + "loss": 1.5586, + "step": 17548 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016867024323760502, + "loss": 1.458, + "step": 17549 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016865797957234442, + "loss": 1.5677, + "step": 17550 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016864571578040645, + "loss": 1.5688, + "step": 17551 + }, + { + "epoch": 1.38, + "learning_rate": 0.0001686334518618743, + "loss": 1.5451, + "step": 17552 + }, + { + "epoch": 1.38, + "learning_rate": 0.0001686211878168314, + "loss": 1.5688, + "step": 17553 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016860892364536082, + "loss": 1.5236, + "step": 17554 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016859665934754596, + "loss": 1.5244, + "step": 17555 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016858439492347006, + "loss": 1.5026, + "step": 17556 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016857213037321634, + "loss": 1.5425, + "step": 17557 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016855986569686812, + "loss": 1.5694, + "step": 17558 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016854760089450864, + "loss": 1.544, + "step": 17559 + }, + { + "epoch": 1.38, + "learning_rate": 0.0001685353359662212, + "loss": 1.5604, + "step": 17560 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016852307091208907, + "loss": 1.4932, + "step": 17561 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016851080573219548, + "loss": 1.5282, + "step": 17562 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016849854042662375, + "loss": 1.5161, + "step": 17563 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016848627499545712, + "loss": 1.5041, + "step": 17564 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016847400943877891, + "loss": 1.5234, + "step": 17565 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016846174375667236, + "loss": 1.4888, + "step": 17566 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016844947794922074, + "loss": 1.4846, + "step": 17567 + }, + { + "epoch": 1.38, + "learning_rate": 0.0001684372120165074, + "loss": 1.5578, + "step": 17568 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016842494595861553, + "loss": 1.5059, + "step": 17569 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016841267977562842, + "loss": 1.5558, + "step": 17570 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016840041346762944, + "loss": 1.4837, + "step": 17571 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016838814703470177, + "loss": 1.5591, + "step": 17572 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016837588047692874, + "loss": 1.5266, + "step": 17573 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016836361379439358, + "loss": 1.5016, + "step": 17574 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016835134698717962, + "loss": 1.4967, + "step": 17575 + }, + { + "epoch": 1.38, + "learning_rate": 0.0001683390800553702, + "loss": 1.5658, + "step": 17576 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016832681299904848, + "loss": 1.568, + "step": 17577 + }, + { + "epoch": 1.38, + "learning_rate": 0.0001683145458182979, + "loss": 1.528, + "step": 17578 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016830227851320157, + "loss": 1.5189, + "step": 17579 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016829001108384294, + "loss": 1.5706, + "step": 17580 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016827774353030518, + "loss": 1.5125, + "step": 17581 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016826547585267163, + "loss": 1.4921, + "step": 17582 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016825320805102556, + "loss": 1.4682, + "step": 17583 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016824094012545034, + "loss": 1.494, + "step": 17584 + }, + { + "epoch": 1.38, + "learning_rate": 0.0001682286720760292, + "loss": 1.5612, + "step": 17585 + }, + { + "epoch": 1.38, + "learning_rate": 0.0001682164039028454, + "loss": 1.5238, + "step": 17586 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016820413560598226, + "loss": 1.5461, + "step": 17587 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016819186718552311, + "loss": 1.584, + "step": 17588 + }, + { + "epoch": 1.38, + "learning_rate": 0.0001681795986415512, + "loss": 1.5143, + "step": 17589 + }, + { + "epoch": 1.38, + "learning_rate": 0.0001681673299741499, + "loss": 1.514, + "step": 17590 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016815506118340236, + "loss": 1.5147, + "step": 17591 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016814279226939205, + "loss": 1.5037, + "step": 17592 + }, + { + "epoch": 1.38, + "learning_rate": 0.0001681305232322022, + "loss": 1.5575, + "step": 17593 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016811825407191605, + "loss": 1.5401, + "step": 17594 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016810598478861702, + "loss": 1.5315, + "step": 17595 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016809371538238827, + "loss": 1.5285, + "step": 17596 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016808144585331325, + "loss": 1.5528, + "step": 17597 + }, + { + "epoch": 1.38, + "learning_rate": 0.0001680691762014751, + "loss": 1.451, + "step": 17598 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016805690642695726, + "loss": 1.5248, + "step": 17599 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016804463652984303, + "loss": 1.5726, + "step": 17600 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016803236651021563, + "loss": 1.5147, + "step": 17601 + }, + { + "epoch": 1.38, + "learning_rate": 0.00016802009636815844, + "loss": 1.6087, + "step": 17602 + }, + { + "epoch": 1.39, + "learning_rate": 0.0001680078261037547, + "loss": 1.56, + "step": 17603 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016799555571708782, + "loss": 1.6017, + "step": 17604 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016798328520824102, + "loss": 1.538, + "step": 17605 + }, + { + "epoch": 1.39, + "learning_rate": 0.0001679710145772976, + "loss": 1.5265, + "step": 17606 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016795874382434094, + "loss": 1.5472, + "step": 17607 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016794647294945432, + "loss": 1.5011, + "step": 17608 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016793420195272107, + "loss": 1.5646, + "step": 17609 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016792193083422444, + "loss": 1.5351, + "step": 17610 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016790965959404783, + "loss": 1.5026, + "step": 17611 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016789738823227453, + "loss": 1.4908, + "step": 17612 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016788511674898778, + "loss": 1.5444, + "step": 17613 + }, + { + "epoch": 1.39, + "learning_rate": 0.000167872845144271, + "loss": 1.5231, + "step": 17614 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016786057341820743, + "loss": 1.487, + "step": 17615 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016784830157088045, + "loss": 1.6044, + "step": 17616 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016783602960237338, + "loss": 1.5282, + "step": 17617 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016782375751276944, + "loss": 1.554, + "step": 17618 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016781148530215209, + "loss": 1.5021, + "step": 17619 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016779921297060455, + "loss": 1.5251, + "step": 17620 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016778694051821017, + "loss": 1.53, + "step": 17621 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016777466794505228, + "loss": 1.5231, + "step": 17622 + }, + { + "epoch": 1.39, + "learning_rate": 0.0001677623952512142, + "loss": 1.5284, + "step": 17623 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016775012243677931, + "loss": 1.4942, + "step": 17624 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016773784950183083, + "loss": 1.5193, + "step": 17625 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016772557644645217, + "loss": 1.4875, + "step": 17626 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016771330327072662, + "loss": 1.5324, + "step": 17627 + }, + { + "epoch": 1.39, + "learning_rate": 0.0001677010299747375, + "loss": 1.5104, + "step": 17628 + }, + { + "epoch": 1.39, + "learning_rate": 0.0001676887565585682, + "loss": 1.5434, + "step": 17629 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016767648302230194, + "loss": 1.5204, + "step": 17630 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016766420936602214, + "loss": 1.517, + "step": 17631 + }, + { + "epoch": 1.39, + "learning_rate": 0.0001676519355898121, + "loss": 1.5445, + "step": 17632 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016763966169375518, + "loss": 1.5066, + "step": 17633 + }, + { + "epoch": 1.39, + "learning_rate": 0.0001676273876779347, + "loss": 1.4592, + "step": 17634 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016761511354243397, + "loss": 1.541, + "step": 17635 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016760283928733636, + "loss": 1.547, + "step": 17636 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016759056491272515, + "loss": 1.5584, + "step": 17637 + }, + { + "epoch": 1.39, + "learning_rate": 0.0001675782904186837, + "loss": 1.5518, + "step": 17638 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016756601580529537, + "loss": 1.5574, + "step": 17639 + }, + { + "epoch": 1.39, + "learning_rate": 0.0001675537410726435, + "loss": 1.5822, + "step": 17640 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016754146622081144, + "loss": 1.5409, + "step": 17641 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016752919124988247, + "loss": 1.4933, + "step": 17642 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016751691615993995, + "loss": 1.5626, + "step": 17643 + }, + { + "epoch": 1.39, + "learning_rate": 0.0001675046409510673, + "loss": 1.5665, + "step": 17644 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016749236562334775, + "loss": 1.596, + "step": 17645 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016748009017686466, + "loss": 1.5712, + "step": 17646 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016746781461170145, + "loss": 1.5721, + "step": 17647 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016745553892794145, + "loss": 1.4711, + "step": 17648 + }, + { + "epoch": 1.39, + "learning_rate": 0.0001674432631256679, + "loss": 1.5173, + "step": 17649 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016743098720496425, + "loss": 1.5158, + "step": 17650 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016741871116591385, + "loss": 1.5218, + "step": 17651 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016740643500859996, + "loss": 1.5054, + "step": 17652 + }, + { + "epoch": 1.39, + "learning_rate": 0.000167394158733106, + "loss": 1.4632, + "step": 17653 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016738188233951528, + "loss": 1.5281, + "step": 17654 + }, + { + "epoch": 1.39, + "learning_rate": 0.0001673696058279112, + "loss": 1.5473, + "step": 17655 + }, + { + "epoch": 1.39, + "learning_rate": 0.0001673573291983771, + "loss": 1.5614, + "step": 17656 + }, + { + "epoch": 1.39, + "learning_rate": 0.0001673450524509963, + "loss": 1.548, + "step": 17657 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016733277558585215, + "loss": 1.5244, + "step": 17658 + }, + { + "epoch": 1.39, + "learning_rate": 0.000167320498603028, + "loss": 1.5406, + "step": 17659 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016730822150260726, + "loss": 1.535, + "step": 17660 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016729594428467324, + "loss": 1.5062, + "step": 17661 + }, + { + "epoch": 1.39, + "learning_rate": 0.0001672836669493093, + "loss": 1.4609, + "step": 17662 + }, + { + "epoch": 1.39, + "learning_rate": 0.0001672713894965988, + "loss": 1.5677, + "step": 17663 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016725911192662506, + "loss": 1.51, + "step": 17664 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016724683423947155, + "loss": 1.5568, + "step": 17665 + }, + { + "epoch": 1.39, + "learning_rate": 0.0001672345564352215, + "loss": 1.5335, + "step": 17666 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016722227851395833, + "loss": 1.5298, + "step": 17667 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016721000047576542, + "loss": 1.5706, + "step": 17668 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016719772232072602, + "loss": 1.5308, + "step": 17669 + }, + { + "epoch": 1.39, + "learning_rate": 0.0001671854440489237, + "loss": 1.5574, + "step": 17670 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016717316566044162, + "loss": 1.5094, + "step": 17671 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016716088715536324, + "loss": 1.513, + "step": 17672 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016714860853377192, + "loss": 1.5365, + "step": 17673 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016713632979575098, + "loss": 1.5349, + "step": 17674 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016712405094138384, + "loss": 1.4707, + "step": 17675 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016711177197075382, + "loss": 1.5198, + "step": 17676 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016709949288394436, + "loss": 1.5668, + "step": 17677 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016708721368103872, + "loss": 1.5113, + "step": 17678 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016707493436212033, + "loss": 1.5251, + "step": 17679 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016706265492727265, + "loss": 1.5161, + "step": 17680 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016705037537657885, + "loss": 1.5079, + "step": 17681 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016703809571012247, + "loss": 1.5333, + "step": 17682 + }, + { + "epoch": 1.39, + "learning_rate": 0.0001670258159279868, + "loss": 1.5272, + "step": 17683 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016701353603025524, + "loss": 1.4927, + "step": 17684 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016700125601701118, + "loss": 1.5313, + "step": 17685 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016698897588833793, + "loss": 1.5636, + "step": 17686 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016697669564431897, + "loss": 1.5156, + "step": 17687 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016696441528503756, + "loss": 1.5287, + "step": 17688 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016695213481057714, + "loss": 1.4859, + "step": 17689 + }, + { + "epoch": 1.39, + "learning_rate": 0.0001669398542210211, + "loss": 1.5357, + "step": 17690 + }, + { + "epoch": 1.39, + "learning_rate": 0.0001669275735164528, + "loss": 1.5085, + "step": 17691 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016691529269695563, + "loss": 1.5673, + "step": 17692 + }, + { + "epoch": 1.39, + "learning_rate": 0.0001669030117626129, + "loss": 1.4941, + "step": 17693 + }, + { + "epoch": 1.39, + "learning_rate": 0.0001668907307135081, + "loss": 1.5422, + "step": 17694 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016687844954972454, + "loss": 1.4932, + "step": 17695 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016686616827134559, + "loss": 1.5374, + "step": 17696 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016685388687845472, + "loss": 1.4861, + "step": 17697 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016684160537113523, + "loss": 1.5113, + "step": 17698 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016682932374947052, + "loss": 1.5296, + "step": 17699 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016681704201354405, + "loss": 1.488, + "step": 17700 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016680476016343906, + "loss": 1.5556, + "step": 17701 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016679247819923908, + "loss": 1.5163, + "step": 17702 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016678019612102743, + "loss": 1.5054, + "step": 17703 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016676791392888752, + "loss": 1.527, + "step": 17704 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016675563162290273, + "loss": 1.5599, + "step": 17705 + }, + { + "epoch": 1.39, + "learning_rate": 0.0001667433492031564, + "loss": 1.5054, + "step": 17706 + }, + { + "epoch": 1.39, + "learning_rate": 0.000166731066669732, + "loss": 1.5071, + "step": 17707 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016671878402271288, + "loss": 1.5088, + "step": 17708 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016670650126218248, + "loss": 1.5478, + "step": 17709 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016669421838822412, + "loss": 1.5635, + "step": 17710 + }, + { + "epoch": 1.39, + "learning_rate": 0.0001666819354009212, + "loss": 1.5489, + "step": 17711 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016666965230035722, + "loss": 1.5413, + "step": 17712 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016665736908661542, + "loss": 1.5305, + "step": 17713 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016664508575977937, + "loss": 1.526, + "step": 17714 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016663280231993233, + "loss": 1.5493, + "step": 17715 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016662051876715773, + "loss": 1.4558, + "step": 17716 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016660823510153893, + "loss": 1.5332, + "step": 17717 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016659595132315945, + "loss": 1.4958, + "step": 17718 + }, + { + "epoch": 1.39, + "learning_rate": 0.0001665836674321026, + "loss": 1.5456, + "step": 17719 + }, + { + "epoch": 1.39, + "learning_rate": 0.0001665713834284518, + "loss": 1.552, + "step": 17720 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016655909931229048, + "loss": 1.4847, + "step": 17721 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016654681508370198, + "loss": 1.5171, + "step": 17722 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016653453074276972, + "loss": 1.5072, + "step": 17723 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016652224628957714, + "loss": 1.5711, + "step": 17724 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016650996172420764, + "loss": 1.4921, + "step": 17725 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016649767704674458, + "loss": 1.5267, + "step": 17726 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016648539225727144, + "loss": 1.548, + "step": 17727 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016647310735587152, + "loss": 1.5009, + "step": 17728 + }, + { + "epoch": 1.39, + "learning_rate": 0.00016646082234262838, + "loss": 1.521, + "step": 17729 + }, + { + "epoch": 1.4, + "learning_rate": 0.0001664485372176253, + "loss": 1.4739, + "step": 17730 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016643625198094572, + "loss": 1.515, + "step": 17731 + }, + { + "epoch": 1.4, + "learning_rate": 0.000166423966632673, + "loss": 1.4861, + "step": 17732 + }, + { + "epoch": 1.4, + "learning_rate": 0.0001664116811728907, + "loss": 1.5258, + "step": 17733 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016639939560168213, + "loss": 1.5329, + "step": 17734 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016638710991913065, + "loss": 1.5259, + "step": 17735 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016637482412531983, + "loss": 1.4902, + "step": 17736 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016636253822033294, + "loss": 1.5349, + "step": 17737 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016635025220425344, + "loss": 1.5358, + "step": 17738 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016633796607716476, + "loss": 1.536, + "step": 17739 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016632567983915027, + "loss": 1.5587, + "step": 17740 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016631339349029348, + "loss": 1.5244, + "step": 17741 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016630110703067772, + "loss": 1.4981, + "step": 17742 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016628882046038648, + "loss": 1.5432, + "step": 17743 + }, + { + "epoch": 1.4, + "learning_rate": 0.0001662765337795031, + "loss": 1.4834, + "step": 17744 + }, + { + "epoch": 1.4, + "learning_rate": 0.000166264246988111, + "loss": 1.5487, + "step": 17745 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016625196008629374, + "loss": 1.527, + "step": 17746 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016623967307413456, + "loss": 1.5179, + "step": 17747 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016622738595171698, + "loss": 1.5105, + "step": 17748 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016621509871912437, + "loss": 1.565, + "step": 17749 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016620281137644024, + "loss": 1.4826, + "step": 17750 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016619052392374795, + "loss": 1.5001, + "step": 17751 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016617823636113092, + "loss": 1.5121, + "step": 17752 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016616594868867267, + "loss": 1.5559, + "step": 17753 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016615366090645645, + "loss": 1.4834, + "step": 17754 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016614137301456582, + "loss": 1.4894, + "step": 17755 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016612908501308419, + "loss": 1.5266, + "step": 17756 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016611679690209494, + "loss": 1.5491, + "step": 17757 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016610450868168156, + "loss": 1.5069, + "step": 17758 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016609222035192744, + "loss": 1.5373, + "step": 17759 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016607993191291605, + "loss": 1.5376, + "step": 17760 + }, + { + "epoch": 1.4, + "learning_rate": 0.0001660676433647308, + "loss": 1.5801, + "step": 17761 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016605535470745505, + "loss": 1.5326, + "step": 17762 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016604306594117239, + "loss": 1.5356, + "step": 17763 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016603077706596605, + "loss": 1.5699, + "step": 17764 + }, + { + "epoch": 1.4, + "learning_rate": 0.0001660184880819197, + "loss": 1.4911, + "step": 17765 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016600619898911662, + "loss": 1.526, + "step": 17766 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016599390978764024, + "loss": 1.5352, + "step": 17767 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016598162047757407, + "loss": 1.5559, + "step": 17768 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016596933105900152, + "loss": 1.526, + "step": 17769 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016595704153200608, + "loss": 1.5629, + "step": 17770 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016594475189667102, + "loss": 1.5353, + "step": 17771 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016593246215307998, + "loss": 1.5621, + "step": 17772 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016592017230131624, + "loss": 1.5282, + "step": 17773 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016590788234146337, + "loss": 1.5276, + "step": 17774 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016589559227360475, + "loss": 1.5485, + "step": 17775 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016588330209782383, + "loss": 1.5558, + "step": 17776 + }, + { + "epoch": 1.4, + "learning_rate": 0.0001658710118142041, + "loss": 1.4528, + "step": 17777 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016585872142282887, + "loss": 1.4797, + "step": 17778 + }, + { + "epoch": 1.4, + "learning_rate": 0.0001658464309237817, + "loss": 1.6063, + "step": 17779 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016583414031714604, + "loss": 1.524, + "step": 17780 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016582184960300527, + "loss": 1.5382, + "step": 17781 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016580955878144288, + "loss": 1.5602, + "step": 17782 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016579726785254234, + "loss": 1.5449, + "step": 17783 + }, + { + "epoch": 1.4, + "learning_rate": 0.000165784976816387, + "loss": 1.5068, + "step": 17784 + }, + { + "epoch": 1.4, + "learning_rate": 0.0001657726856730605, + "loss": 1.555, + "step": 17785 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016576039442264606, + "loss": 1.5495, + "step": 17786 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016574810306522726, + "loss": 1.4981, + "step": 17787 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016573581160088754, + "loss": 1.547, + "step": 17788 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016572352002971037, + "loss": 1.556, + "step": 17789 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016571122835177914, + "loss": 1.504, + "step": 17790 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016569893656717737, + "loss": 1.5472, + "step": 17791 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016568664467598847, + "loss": 1.5291, + "step": 17792 + }, + { + "epoch": 1.4, + "learning_rate": 0.0001656743526782959, + "loss": 1.508, + "step": 17793 + }, + { + "epoch": 1.4, + "learning_rate": 0.0001656620605741831, + "loss": 1.5247, + "step": 17794 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016564976836373359, + "loss": 1.5337, + "step": 17795 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016563747604703076, + "loss": 1.5347, + "step": 17796 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016562518362415814, + "loss": 1.4746, + "step": 17797 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016561289109519913, + "loss": 1.5107, + "step": 17798 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016560059846023725, + "loss": 1.5381, + "step": 17799 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016558830571935582, + "loss": 1.5172, + "step": 17800 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016557601287263844, + "loss": 1.5339, + "step": 17801 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016556371992016856, + "loss": 1.446, + "step": 17802 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016555142686202953, + "loss": 1.5049, + "step": 17803 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016553913369830495, + "loss": 1.4869, + "step": 17804 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016552684042907823, + "loss": 1.5156, + "step": 17805 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016551454705443286, + "loss": 1.4509, + "step": 17806 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016550225357445222, + "loss": 1.5559, + "step": 17807 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016548995998921985, + "loss": 1.5252, + "step": 17808 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016547766629881923, + "loss": 1.5498, + "step": 17809 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016546537250333376, + "loss": 1.523, + "step": 17810 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016545307860284694, + "loss": 1.4884, + "step": 17811 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016544078459744226, + "loss": 1.5367, + "step": 17812 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016542849048720317, + "loss": 1.5366, + "step": 17813 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016541619627221318, + "loss": 1.576, + "step": 17814 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016540390195255564, + "loss": 1.521, + "step": 17815 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016539160752831423, + "loss": 1.5324, + "step": 17816 + }, + { + "epoch": 1.4, + "learning_rate": 0.0001653793129995722, + "loss": 1.5606, + "step": 17817 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016536701836641313, + "loss": 1.53, + "step": 17818 + }, + { + "epoch": 1.4, + "learning_rate": 0.0001653547236289205, + "loss": 1.5343, + "step": 17819 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016534242878717776, + "loss": 1.5441, + "step": 17820 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016533013384126844, + "loss": 1.5381, + "step": 17821 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016531783879127591, + "loss": 1.5287, + "step": 17822 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016530554363728377, + "loss": 1.5185, + "step": 17823 + }, + { + "epoch": 1.4, + "learning_rate": 0.0001652932483793754, + "loss": 1.5345, + "step": 17824 + }, + { + "epoch": 1.4, + "learning_rate": 0.0001652809530176343, + "loss": 1.5548, + "step": 17825 + }, + { + "epoch": 1.4, + "learning_rate": 0.000165268657552144, + "loss": 1.5583, + "step": 17826 + }, + { + "epoch": 1.4, + "learning_rate": 0.0001652563619829879, + "loss": 1.5628, + "step": 17827 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016524406631024955, + "loss": 1.5419, + "step": 17828 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016523177053401239, + "loss": 1.5493, + "step": 17829 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016521947465435993, + "loss": 1.535, + "step": 17830 + }, + { + "epoch": 1.4, + "learning_rate": 0.0001652071786713756, + "loss": 1.4931, + "step": 17831 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016519488258514293, + "loss": 1.5399, + "step": 17832 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016518258639574546, + "loss": 1.5807, + "step": 17833 + }, + { + "epoch": 1.4, + "learning_rate": 0.0001651702901032665, + "loss": 1.4953, + "step": 17834 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016515799370778972, + "loss": 1.5375, + "step": 17835 + }, + { + "epoch": 1.4, + "learning_rate": 0.0001651456972093985, + "loss": 1.5701, + "step": 17836 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016513340060817633, + "loss": 1.5419, + "step": 17837 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016512110390420675, + "loss": 1.5334, + "step": 17838 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016510880709757323, + "loss": 1.5005, + "step": 17839 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016509651018835922, + "loss": 1.5476, + "step": 17840 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016508421317664826, + "loss": 1.4998, + "step": 17841 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016507191606252378, + "loss": 1.5244, + "step": 17842 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016505961884606934, + "loss": 1.5675, + "step": 17843 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016504732152736838, + "loss": 1.5314, + "step": 17844 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016503502410650445, + "loss": 1.533, + "step": 17845 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016502272658356097, + "loss": 1.505, + "step": 17846 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016501042895862147, + "loss": 1.5114, + "step": 17847 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016499813123176942, + "loss": 1.508, + "step": 17848 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016498583340308838, + "loss": 1.5202, + "step": 17849 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016497353547266177, + "loss": 1.5023, + "step": 17850 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016496123744057313, + "loss": 1.5569, + "step": 17851 + }, + { + "epoch": 1.4, + "learning_rate": 0.0001649489393069059, + "loss": 1.5299, + "step": 17852 + }, + { + "epoch": 1.4, + "learning_rate": 0.0001649366410717437, + "loss": 1.5084, + "step": 17853 + }, + { + "epoch": 1.4, + "learning_rate": 0.0001649243427351699, + "loss": 1.4912, + "step": 17854 + }, + { + "epoch": 1.4, + "learning_rate": 0.00016491204429726808, + "loss": 1.5459, + "step": 17855 + }, + { + "epoch": 1.4, + "learning_rate": 0.0001648997457581217, + "loss": 1.5043, + "step": 17856 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016488744711781424, + "loss": 1.5447, + "step": 17857 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016487514837642924, + "loss": 1.5229, + "step": 17858 + }, + { + "epoch": 1.41, + "learning_rate": 0.0001648628495340502, + "loss": 1.5091, + "step": 17859 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016485055059076064, + "loss": 1.5032, + "step": 17860 + }, + { + "epoch": 1.41, + "learning_rate": 0.000164838251546644, + "loss": 1.5107, + "step": 17861 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016482595240178383, + "loss": 1.4618, + "step": 17862 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016481365315626362, + "loss": 1.5024, + "step": 17863 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016480135381016686, + "loss": 1.5168, + "step": 17864 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016478905436357713, + "loss": 1.5071, + "step": 17865 + }, + { + "epoch": 1.41, + "learning_rate": 0.0001647767548165778, + "loss": 1.5558, + "step": 17866 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016476445516925255, + "loss": 1.5141, + "step": 17867 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016475215542168477, + "loss": 1.5115, + "step": 17868 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016473985557395796, + "loss": 1.515, + "step": 17869 + }, + { + "epoch": 1.41, + "learning_rate": 0.0001647275556261557, + "loss": 1.5137, + "step": 17870 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016471525557836144, + "loss": 1.4616, + "step": 17871 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016470295543065877, + "loss": 1.5569, + "step": 17872 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016469065518313108, + "loss": 1.5379, + "step": 17873 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016467835483586197, + "loss": 1.5526, + "step": 17874 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016466605438893492, + "loss": 1.5346, + "step": 17875 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016465375384243347, + "loss": 1.4748, + "step": 17876 + }, + { + "epoch": 1.41, + "learning_rate": 0.0001646414531964411, + "loss": 1.5469, + "step": 17877 + }, + { + "epoch": 1.41, + "learning_rate": 0.0001646291524510414, + "loss": 1.5632, + "step": 17878 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016461685160631774, + "loss": 1.5036, + "step": 17879 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016460455066235382, + "loss": 1.5238, + "step": 17880 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016459224961923297, + "loss": 1.4855, + "step": 17881 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016457994847703884, + "loss": 1.4829, + "step": 17882 + }, + { + "epoch": 1.41, + "learning_rate": 0.0001645676472358549, + "loss": 1.4841, + "step": 17883 + }, + { + "epoch": 1.41, + "learning_rate": 0.0001645553458957647, + "loss": 1.4838, + "step": 17884 + }, + { + "epoch": 1.41, + "learning_rate": 0.0001645430444568517, + "loss": 1.5752, + "step": 17885 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016453074291919946, + "loss": 1.5069, + "step": 17886 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016451844128289152, + "loss": 1.5307, + "step": 17887 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016450613954801138, + "loss": 1.4894, + "step": 17888 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016449383771464249, + "loss": 1.4983, + "step": 17889 + }, + { + "epoch": 1.41, + "learning_rate": 0.0001644815357828685, + "loss": 1.5483, + "step": 17890 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016446923375277285, + "loss": 1.5061, + "step": 17891 + }, + { + "epoch": 1.41, + "learning_rate": 0.0001644569316244391, + "loss": 1.4869, + "step": 17892 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016444462939795075, + "loss": 1.519, + "step": 17893 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016443232707339137, + "loss": 1.5212, + "step": 17894 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016442002465084444, + "loss": 1.521, + "step": 17895 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016440772213039347, + "loss": 1.529, + "step": 17896 + }, + { + "epoch": 1.41, + "learning_rate": 0.000164395419512122, + "loss": 1.4673, + "step": 17897 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016438311679611362, + "loss": 1.4759, + "step": 17898 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016437081398245184, + "loss": 1.5137, + "step": 17899 + }, + { + "epoch": 1.41, + "learning_rate": 0.0001643585110712201, + "loss": 1.5071, + "step": 17900 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016434620806250207, + "loss": 1.5076, + "step": 17901 + }, + { + "epoch": 1.41, + "learning_rate": 0.0001643339049563811, + "loss": 1.5405, + "step": 17902 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016432160175294092, + "loss": 1.4751, + "step": 17903 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016430929845226492, + "loss": 1.4663, + "step": 17904 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016429699505443666, + "loss": 1.5043, + "step": 17905 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016428469155953978, + "loss": 1.4971, + "step": 17906 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016427238796765762, + "loss": 1.53, + "step": 17907 + }, + { + "epoch": 1.41, + "learning_rate": 0.0001642600842788739, + "loss": 1.4734, + "step": 17908 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016424778049327205, + "loss": 1.5172, + "step": 17909 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016423547661093563, + "loss": 1.5166, + "step": 17910 + }, + { + "epoch": 1.41, + "learning_rate": 0.0001642231726319482, + "loss": 1.5459, + "step": 17911 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016421086855639326, + "loss": 1.5174, + "step": 17912 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016419856438435436, + "loss": 1.5131, + "step": 17913 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016418626011591503, + "loss": 1.4838, + "step": 17914 + }, + { + "epoch": 1.41, + "learning_rate": 0.0001641739557511588, + "loss": 1.5464, + "step": 17915 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016416165129016933, + "loss": 1.4939, + "step": 17916 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016414934673302997, + "loss": 1.5694, + "step": 17917 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016413704207982442, + "loss": 1.5155, + "step": 17918 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016412473733063614, + "loss": 1.5316, + "step": 17919 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016411243248554865, + "loss": 1.5142, + "step": 17920 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016410012754464553, + "loss": 1.4547, + "step": 17921 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016408782250801034, + "loss": 1.5323, + "step": 17922 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016407551737572667, + "loss": 1.5182, + "step": 17923 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016406321214787792, + "loss": 1.51, + "step": 17924 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016405090682454775, + "loss": 1.5081, + "step": 17925 + }, + { + "epoch": 1.41, + "learning_rate": 0.0001640386014058197, + "loss": 1.5066, + "step": 17926 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016402629589177726, + "loss": 1.5271, + "step": 17927 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016401399028250407, + "loss": 1.4333, + "step": 17928 + }, + { + "epoch": 1.41, + "learning_rate": 0.0001640016845780835, + "loss": 1.5216, + "step": 17929 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016398937877859932, + "loss": 1.5597, + "step": 17930 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016397707288413494, + "loss": 1.474, + "step": 17931 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016396476689477395, + "loss": 1.4478, + "step": 17932 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016395246081059994, + "loss": 1.5455, + "step": 17933 + }, + { + "epoch": 1.41, + "learning_rate": 0.0001639401546316964, + "loss": 1.5129, + "step": 17934 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016392784835814685, + "loss": 1.5635, + "step": 17935 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016391554199003493, + "loss": 1.5371, + "step": 17936 + }, + { + "epoch": 1.41, + "learning_rate": 0.0001639032355274442, + "loss": 1.559, + "step": 17937 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016389092897045815, + "loss": 1.4796, + "step": 17938 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016387862231916032, + "loss": 1.5294, + "step": 17939 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016386631557363434, + "loss": 1.5699, + "step": 17940 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016385400873396373, + "loss": 1.5134, + "step": 17941 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016384170180023202, + "loss": 1.5157, + "step": 17942 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016382939477252282, + "loss": 1.6142, + "step": 17943 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016381708765091964, + "loss": 1.5579, + "step": 17944 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016380478043550608, + "loss": 1.5161, + "step": 17945 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016379247312636567, + "loss": 1.4985, + "step": 17946 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016378016572358195, + "loss": 1.5347, + "step": 17947 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016376785822723856, + "loss": 1.5268, + "step": 17948 + }, + { + "epoch": 1.41, + "learning_rate": 0.000163755550637419, + "loss": 1.4809, + "step": 17949 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016374324295420685, + "loss": 1.528, + "step": 17950 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016373093517768562, + "loss": 1.5315, + "step": 17951 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016371862730793895, + "loss": 1.5681, + "step": 17952 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016370631934505036, + "loss": 1.5139, + "step": 17953 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016369401128910342, + "loss": 1.5488, + "step": 17954 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016368170314018173, + "loss": 1.5109, + "step": 17955 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016366939489836877, + "loss": 1.5453, + "step": 17956 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016365708656374822, + "loss": 1.5188, + "step": 17957 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016364477813640355, + "loss": 1.5198, + "step": 17958 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016363246961641838, + "loss": 1.4592, + "step": 17959 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016362016100387628, + "loss": 1.5217, + "step": 17960 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016360785229886074, + "loss": 1.536, + "step": 17961 + }, + { + "epoch": 1.41, + "learning_rate": 0.0001635955435014555, + "loss": 1.5417, + "step": 17962 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016358323461174393, + "loss": 1.4889, + "step": 17963 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016357092562980973, + "loss": 1.5123, + "step": 17964 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016355861655573643, + "loss": 1.5503, + "step": 17965 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016354630738960765, + "loss": 1.5804, + "step": 17966 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016353399813150686, + "loss": 1.5006, + "step": 17967 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016352168878151768, + "loss": 1.53, + "step": 17968 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016350937933972375, + "loss": 1.5629, + "step": 17969 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016349706980620855, + "loss": 1.5346, + "step": 17970 + }, + { + "epoch": 1.41, + "learning_rate": 0.0001634847601810557, + "loss": 1.501, + "step": 17971 + }, + { + "epoch": 1.41, + "learning_rate": 0.0001634724504643488, + "loss": 1.5079, + "step": 17972 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016346014065617135, + "loss": 1.5392, + "step": 17973 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016344783075660703, + "loss": 1.5597, + "step": 17974 + }, + { + "epoch": 1.41, + "learning_rate": 0.0001634355207657393, + "loss": 1.5536, + "step": 17975 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016342321068365178, + "loss": 1.5294, + "step": 17976 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016341090051042814, + "loss": 1.523, + "step": 17977 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016339859024615185, + "loss": 1.5405, + "step": 17978 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016338627989090652, + "loss": 1.5343, + "step": 17979 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016337396944477575, + "loss": 1.4578, + "step": 17980 + }, + { + "epoch": 1.41, + "learning_rate": 0.0001633616589078431, + "loss": 1.5396, + "step": 17981 + }, + { + "epoch": 1.41, + "learning_rate": 0.0001633493482801922, + "loss": 1.519, + "step": 17982 + }, + { + "epoch": 1.41, + "learning_rate": 0.00016333703756190655, + "loss": 1.5027, + "step": 17983 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016332472675306976, + "loss": 1.5273, + "step": 17984 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016331241585376544, + "loss": 1.5029, + "step": 17985 + }, + { + "epoch": 1.42, + "learning_rate": 0.0001633001048640772, + "loss": 1.5218, + "step": 17986 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016328779378408856, + "loss": 1.5636, + "step": 17987 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016327548261388315, + "loss": 1.5112, + "step": 17988 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016326317135354452, + "loss": 1.5881, + "step": 17989 + }, + { + "epoch": 1.42, + "learning_rate": 0.0001632508600031563, + "loss": 1.5075, + "step": 17990 + }, + { + "epoch": 1.42, + "learning_rate": 0.000163238548562802, + "loss": 1.5313, + "step": 17991 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016322623703256527, + "loss": 1.4912, + "step": 17992 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016321392541252973, + "loss": 1.515, + "step": 17993 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016320161370277894, + "loss": 1.5333, + "step": 17994 + }, + { + "epoch": 1.42, + "learning_rate": 0.0001631893019033964, + "loss": 1.4926, + "step": 17995 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016317699001446587, + "loss": 1.5126, + "step": 17996 + }, + { + "epoch": 1.42, + "learning_rate": 0.0001631646780360708, + "loss": 1.5221, + "step": 17997 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016315236596829483, + "loss": 1.5243, + "step": 17998 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016314005381122155, + "loss": 1.536, + "step": 17999 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016312774156493457, + "loss": 1.5241, + "step": 18000 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016311542922951746, + "loss": 1.5134, + "step": 18001 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016310311680505386, + "loss": 1.5492, + "step": 18002 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016309080429162726, + "loss": 1.5285, + "step": 18003 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016307849168932138, + "loss": 1.5442, + "step": 18004 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016306617899821974, + "loss": 1.5305, + "step": 18005 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016305386621840598, + "loss": 1.5252, + "step": 18006 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016304155334996361, + "loss": 1.5581, + "step": 18007 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016302924039297633, + "loss": 1.5699, + "step": 18008 + }, + { + "epoch": 1.42, + "learning_rate": 0.0001630169273475277, + "loss": 1.5246, + "step": 18009 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016300461421370132, + "loss": 1.513, + "step": 18010 + }, + { + "epoch": 1.42, + "learning_rate": 0.0001629923009915808, + "loss": 1.555, + "step": 18011 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016297998768124967, + "loss": 1.4721, + "step": 18012 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016296767428279163, + "loss": 1.5169, + "step": 18013 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016295536079629022, + "loss": 1.5519, + "step": 18014 + }, + { + "epoch": 1.42, + "learning_rate": 0.0001629430472218291, + "loss": 1.5392, + "step": 18015 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016293073355949178, + "loss": 1.5591, + "step": 18016 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016291841980936193, + "loss": 1.5302, + "step": 18017 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016290610597152316, + "loss": 1.5106, + "step": 18018 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016289379204605903, + "loss": 1.5555, + "step": 18019 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016288147803305314, + "loss": 1.5001, + "step": 18020 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016286916393258919, + "loss": 1.4957, + "step": 18021 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016285684974475068, + "loss": 1.523, + "step": 18022 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016284453546962124, + "loss": 1.4991, + "step": 18023 + }, + { + "epoch": 1.42, + "learning_rate": 0.0001628322211072845, + "loss": 1.5326, + "step": 18024 + }, + { + "epoch": 1.42, + "learning_rate": 0.0001628199066578241, + "loss": 1.5346, + "step": 18025 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016280759212132357, + "loss": 1.4949, + "step": 18026 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016279527749786657, + "loss": 1.522, + "step": 18027 + }, + { + "epoch": 1.42, + "learning_rate": 0.0001627829627875367, + "loss": 1.5507, + "step": 18028 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016277064799041752, + "loss": 1.5348, + "step": 18029 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016275833310659275, + "loss": 1.5247, + "step": 18030 + }, + { + "epoch": 1.42, + "learning_rate": 0.0001627460181361459, + "loss": 1.49, + "step": 18031 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016273370307916062, + "loss": 1.5105, + "step": 18032 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016272138793572058, + "loss": 1.5615, + "step": 18033 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016270907270590928, + "loss": 1.4887, + "step": 18034 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016269675738981042, + "loss": 1.5334, + "step": 18035 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016268444198750756, + "loss": 1.5445, + "step": 18036 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016267212649908434, + "loss": 1.5265, + "step": 18037 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016265981092462444, + "loss": 1.5309, + "step": 18038 + }, + { + "epoch": 1.42, + "learning_rate": 0.0001626474952642113, + "loss": 1.5443, + "step": 18039 + }, + { + "epoch": 1.42, + "learning_rate": 0.0001626351795179287, + "loss": 1.512, + "step": 18040 + }, + { + "epoch": 1.42, + "learning_rate": 0.0001626228636858602, + "loss": 1.5762, + "step": 18041 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016261054776808945, + "loss": 1.5445, + "step": 18042 + }, + { + "epoch": 1.42, + "learning_rate": 0.0001625982317647, + "loss": 1.5516, + "step": 18043 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016258591567577552, + "loss": 1.5705, + "step": 18044 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016257359950139967, + "loss": 1.5048, + "step": 18045 + }, + { + "epoch": 1.42, + "learning_rate": 0.0001625612832416559, + "loss": 1.4822, + "step": 18046 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016254896689662805, + "loss": 1.5103, + "step": 18047 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016253665046639962, + "loss": 1.5257, + "step": 18048 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016252433395105422, + "loss": 1.4912, + "step": 18049 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016251201735067555, + "loss": 1.5816, + "step": 18050 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016249970066534714, + "loss": 1.4976, + "step": 18051 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016248738389515273, + "loss": 1.5127, + "step": 18052 + }, + { + "epoch": 1.42, + "learning_rate": 0.0001624750670401758, + "loss": 1.5483, + "step": 18053 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016246275010050007, + "loss": 1.5189, + "step": 18054 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016245043307620914, + "loss": 1.4668, + "step": 18055 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016243811596738662, + "loss": 1.5117, + "step": 18056 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016242579877411625, + "loss": 1.6033, + "step": 18057 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016241348149648144, + "loss": 1.5431, + "step": 18058 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016240116413456602, + "loss": 1.532, + "step": 18059 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016238884668845355, + "loss": 1.5132, + "step": 18060 + }, + { + "epoch": 1.42, + "learning_rate": 0.0001623765291582276, + "loss": 1.5637, + "step": 18061 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016236421154397187, + "loss": 1.5839, + "step": 18062 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016235189384576992, + "loss": 1.5085, + "step": 18063 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016233957606370548, + "loss": 1.5302, + "step": 18064 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016232725819786213, + "loss": 1.5084, + "step": 18065 + }, + { + "epoch": 1.42, + "learning_rate": 0.0001623149402483235, + "loss": 1.5117, + "step": 18066 + }, + { + "epoch": 1.42, + "learning_rate": 0.0001623026222151732, + "loss": 1.4963, + "step": 18067 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016229030409849489, + "loss": 1.5456, + "step": 18068 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016227798589837222, + "loss": 1.4714, + "step": 18069 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016226566761488875, + "loss": 1.535, + "step": 18070 + }, + { + "epoch": 1.42, + "learning_rate": 0.0001622533492481282, + "loss": 1.4948, + "step": 18071 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016224103079817419, + "loss": 1.4804, + "step": 18072 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016222871226511027, + "loss": 1.5199, + "step": 18073 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016221639364902022, + "loss": 1.5129, + "step": 18074 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016220407494998756, + "loss": 1.5556, + "step": 18075 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016219175616809595, + "loss": 1.5904, + "step": 18076 + }, + { + "epoch": 1.42, + "learning_rate": 0.0001621794373034291, + "loss": 1.5117, + "step": 18077 + }, + { + "epoch": 1.42, + "learning_rate": 0.0001621671183560705, + "loss": 1.4538, + "step": 18078 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016215479932610397, + "loss": 1.4816, + "step": 18079 + }, + { + "epoch": 1.42, + "learning_rate": 0.000162142480213613, + "loss": 1.556, + "step": 18080 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016213016101868135, + "loss": 1.5105, + "step": 18081 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016211784174139255, + "loss": 1.5108, + "step": 18082 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016210552238183032, + "loss": 1.567, + "step": 18083 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016209320294007827, + "loss": 1.5303, + "step": 18084 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016208088341622003, + "loss": 1.5312, + "step": 18085 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016206856381033926, + "loss": 1.5181, + "step": 18086 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016205624412251958, + "loss": 1.5665, + "step": 18087 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016204392435284468, + "loss": 1.5549, + "step": 18088 + }, + { + "epoch": 1.42, + "learning_rate": 0.0001620316045013982, + "loss": 1.5216, + "step": 18089 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016201928456826374, + "loss": 1.5467, + "step": 18090 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016200696455352502, + "loss": 1.4764, + "step": 18091 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016199464445726557, + "loss": 1.5297, + "step": 18092 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016198232427956915, + "loss": 1.5387, + "step": 18093 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016197000402051932, + "loss": 1.5692, + "step": 18094 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016195768368019976, + "loss": 1.517, + "step": 18095 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016194536325869418, + "loss": 1.5426, + "step": 18096 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016193304275608612, + "loss": 1.5522, + "step": 18097 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016192072217245936, + "loss": 1.5226, + "step": 18098 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016190840150789743, + "loss": 1.5558, + "step": 18099 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016189608076248402, + "loss": 1.5449, + "step": 18100 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016188375993630278, + "loss": 1.5519, + "step": 18101 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016187143902943735, + "loss": 1.5134, + "step": 18102 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016185911804197147, + "loss": 1.4988, + "step": 18103 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016184679697398867, + "loss": 1.4935, + "step": 18104 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016183447582557265, + "loss": 1.5327, + "step": 18105 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016182215459680711, + "loss": 1.5117, + "step": 18106 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016180983328777562, + "loss": 1.5146, + "step": 18107 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016179751189856193, + "loss": 1.4741, + "step": 18108 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016178519042924958, + "loss": 1.5158, + "step": 18109 + }, + { + "epoch": 1.42, + "learning_rate": 0.00016177286887992235, + "loss": 1.481, + "step": 18110 + }, + { + "epoch": 1.42, + "learning_rate": 0.0001617605472506638, + "loss": 1.4964, + "step": 18111 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016174822554155765, + "loss": 1.5199, + "step": 18112 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016173590375268755, + "loss": 1.5429, + "step": 18113 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016172358188413708, + "loss": 1.5291, + "step": 18114 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016171125993598998, + "loss": 1.5396, + "step": 18115 + }, + { + "epoch": 1.43, + "learning_rate": 0.0001616989379083299, + "loss": 1.4699, + "step": 18116 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016168661580124048, + "loss": 1.5617, + "step": 18117 + }, + { + "epoch": 1.43, + "learning_rate": 0.0001616742936148054, + "loss": 1.5212, + "step": 18118 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016166197134910828, + "loss": 1.4964, + "step": 18119 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016164964900423285, + "loss": 1.5749, + "step": 18120 + }, + { + "epoch": 1.43, + "learning_rate": 0.0001616373265802627, + "loss": 1.5337, + "step": 18121 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016162500407728155, + "loss": 1.5339, + "step": 18122 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016161268149537304, + "loss": 1.4823, + "step": 18123 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016160035883462081, + "loss": 1.5517, + "step": 18124 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016158803609510854, + "loss": 1.4869, + "step": 18125 + }, + { + "epoch": 1.43, + "learning_rate": 0.0001615757132769199, + "loss": 1.5179, + "step": 18126 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016156339038013857, + "loss": 1.524, + "step": 18127 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016155106740484824, + "loss": 1.5582, + "step": 18128 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016153874435113246, + "loss": 1.5462, + "step": 18129 + }, + { + "epoch": 1.43, + "learning_rate": 0.000161526421219075, + "loss": 1.4984, + "step": 18130 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016151409800875953, + "loss": 1.604, + "step": 18131 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016150177472026966, + "loss": 1.5653, + "step": 18132 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016148945135368908, + "loss": 1.53, + "step": 18133 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016147712790910145, + "loss": 1.4409, + "step": 18134 + }, + { + "epoch": 1.43, + "learning_rate": 0.0001614648043865905, + "loss": 1.5302, + "step": 18135 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016145248078623987, + "loss": 1.5586, + "step": 18136 + }, + { + "epoch": 1.43, + "learning_rate": 0.0001614401571081332, + "loss": 1.5014, + "step": 18137 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016142783335235412, + "loss": 1.6021, + "step": 18138 + }, + { + "epoch": 1.43, + "learning_rate": 0.0001614155095189864, + "loss": 1.5256, + "step": 18139 + }, + { + "epoch": 1.43, + "learning_rate": 0.0001614031856081137, + "loss": 1.498, + "step": 18140 + }, + { + "epoch": 1.43, + "learning_rate": 0.0001613908616198196, + "loss": 1.5037, + "step": 18141 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016137853755418787, + "loss": 1.5684, + "step": 18142 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016136621341130214, + "loss": 1.5393, + "step": 18143 + }, + { + "epoch": 1.43, + "learning_rate": 0.0001613538891912461, + "loss": 1.5646, + "step": 18144 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016134156489410343, + "loss": 1.5486, + "step": 18145 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016132924051995778, + "loss": 1.5544, + "step": 18146 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016131691606889286, + "loss": 1.5228, + "step": 18147 + }, + { + "epoch": 1.43, + "learning_rate": 0.0001613045915409923, + "loss": 1.5119, + "step": 18148 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016129226693633979, + "loss": 1.521, + "step": 18149 + }, + { + "epoch": 1.43, + "learning_rate": 0.000161279942255019, + "loss": 1.5208, + "step": 18150 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016126761749711368, + "loss": 1.5461, + "step": 18151 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016125529266270745, + "loss": 1.4802, + "step": 18152 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016124296775188394, + "loss": 1.5758, + "step": 18153 + }, + { + "epoch": 1.43, + "learning_rate": 0.000161230642764727, + "loss": 1.4978, + "step": 18154 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016121831770132009, + "loss": 1.5425, + "step": 18155 + }, + { + "epoch": 1.43, + "learning_rate": 0.000161205992561747, + "loss": 1.5304, + "step": 18156 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016119366734609143, + "loss": 1.526, + "step": 18157 + }, + { + "epoch": 1.43, + "learning_rate": 0.000161181342054437, + "loss": 1.5109, + "step": 18158 + }, + { + "epoch": 1.43, + "learning_rate": 0.0001611690166868675, + "loss": 1.5731, + "step": 18159 + }, + { + "epoch": 1.43, + "learning_rate": 0.0001611566912434665, + "loss": 1.5047, + "step": 18160 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016114436572431772, + "loss": 1.498, + "step": 18161 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016113204012950486, + "loss": 1.4861, + "step": 18162 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016111971445911157, + "loss": 1.5575, + "step": 18163 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016110738871322156, + "loss": 1.5183, + "step": 18164 + }, + { + "epoch": 1.43, + "learning_rate": 0.0001610950628919185, + "loss": 1.5162, + "step": 18165 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016108273699528612, + "loss": 1.506, + "step": 18166 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016107041102340805, + "loss": 1.5037, + "step": 18167 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016105808497636799, + "loss": 1.4851, + "step": 18168 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016104575885424966, + "loss": 1.535, + "step": 18169 + }, + { + "epoch": 1.43, + "learning_rate": 0.0001610334326571367, + "loss": 1.5403, + "step": 18170 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016102110638511284, + "loss": 1.5356, + "step": 18171 + }, + { + "epoch": 1.43, + "learning_rate": 0.0001610087800382617, + "loss": 1.507, + "step": 18172 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016099645361666707, + "loss": 1.5578, + "step": 18173 + }, + { + "epoch": 1.43, + "learning_rate": 0.0001609841271204126, + "loss": 1.5187, + "step": 18174 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016097180054958193, + "loss": 1.5365, + "step": 18175 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016095947390425884, + "loss": 1.5027, + "step": 18176 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016094714718452693, + "loss": 1.5093, + "step": 18177 + }, + { + "epoch": 1.43, + "learning_rate": 0.0001609348203904699, + "loss": 1.4697, + "step": 18178 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016092249352217156, + "loss": 1.5371, + "step": 18179 + }, + { + "epoch": 1.43, + "learning_rate": 0.0001609101665797154, + "loss": 1.5951, + "step": 18180 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016089783956318535, + "loss": 1.5544, + "step": 18181 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016088551247266488, + "loss": 1.4883, + "step": 18182 + }, + { + "epoch": 1.43, + "learning_rate": 0.0001608731853082379, + "loss": 1.5357, + "step": 18183 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016086085806998792, + "loss": 1.4837, + "step": 18184 + }, + { + "epoch": 1.43, + "learning_rate": 0.0001608485307579987, + "loss": 1.5129, + "step": 18185 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016083620337235398, + "loss": 1.5201, + "step": 18186 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016082387591313737, + "loss": 1.4947, + "step": 18187 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016081154838043266, + "loss": 1.4996, + "step": 18188 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016079922077432348, + "loss": 1.5884, + "step": 18189 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016078689309489353, + "loss": 1.4987, + "step": 18190 + }, + { + "epoch": 1.43, + "learning_rate": 0.0001607745653422266, + "loss": 1.5661, + "step": 18191 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016076223751640626, + "loss": 1.4776, + "step": 18192 + }, + { + "epoch": 1.43, + "learning_rate": 0.0001607499096175163, + "loss": 1.4784, + "step": 18193 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016073758164564033, + "loss": 1.5772, + "step": 18194 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016072525360086214, + "loss": 1.5419, + "step": 18195 + }, + { + "epoch": 1.43, + "learning_rate": 0.0001607129254832654, + "loss": 1.4795, + "step": 18196 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016070059729293378, + "loss": 1.4601, + "step": 18197 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016068826902995107, + "loss": 1.5245, + "step": 18198 + }, + { + "epoch": 1.43, + "learning_rate": 0.0001606759406944009, + "loss": 1.5005, + "step": 18199 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016066361228636692, + "loss": 1.5211, + "step": 18200 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016065128380593298, + "loss": 1.504, + "step": 18201 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016063895525318263, + "loss": 1.5804, + "step": 18202 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016062662662819972, + "loss": 1.5222, + "step": 18203 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016061429793106776, + "loss": 1.4743, + "step": 18204 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016060196916187067, + "loss": 1.6002, + "step": 18205 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016058964032069205, + "loss": 1.5704, + "step": 18206 + }, + { + "epoch": 1.43, + "learning_rate": 0.0001605773114076156, + "loss": 1.5039, + "step": 18207 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016056498242272504, + "loss": 1.5555, + "step": 18208 + }, + { + "epoch": 1.43, + "learning_rate": 0.0001605526533661041, + "loss": 1.4598, + "step": 18209 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016054032423783648, + "loss": 1.4721, + "step": 18210 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016052799503800578, + "loss": 1.4736, + "step": 18211 + }, + { + "epoch": 1.43, + "learning_rate": 0.0001605156657666959, + "loss": 1.513, + "step": 18212 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016050333642399044, + "loss": 1.4814, + "step": 18213 + }, + { + "epoch": 1.43, + "learning_rate": 0.0001604910070099731, + "loss": 1.4774, + "step": 18214 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016047867752472765, + "loss": 1.5372, + "step": 18215 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016046634796833772, + "loss": 1.5248, + "step": 18216 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016045401834088703, + "loss": 1.5564, + "step": 18217 + }, + { + "epoch": 1.43, + "learning_rate": 0.0001604416886424594, + "loss": 1.5166, + "step": 18218 + }, + { + "epoch": 1.43, + "learning_rate": 0.0001604293588731384, + "loss": 1.5444, + "step": 18219 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016041702903300787, + "loss": 1.4943, + "step": 18220 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016040469912215142, + "loss": 1.4876, + "step": 18221 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016039236914065284, + "loss": 1.5203, + "step": 18222 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016038003908859576, + "loss": 1.5411, + "step": 18223 + }, + { + "epoch": 1.43, + "learning_rate": 0.000160367708966064, + "loss": 1.5446, + "step": 18224 + }, + { + "epoch": 1.43, + "learning_rate": 0.0001603553787731412, + "loss": 1.5477, + "step": 18225 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016034304850991106, + "loss": 1.5555, + "step": 18226 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016033071817645735, + "loss": 1.5256, + "step": 18227 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016031838777286377, + "loss": 1.6021, + "step": 18228 + }, + { + "epoch": 1.43, + "learning_rate": 0.000160306057299214, + "loss": 1.5348, + "step": 18229 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016029372675559184, + "loss": 1.5798, + "step": 18230 + }, + { + "epoch": 1.43, + "learning_rate": 0.0001602813961420809, + "loss": 1.4998, + "step": 18231 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016026906545876503, + "loss": 1.4936, + "step": 18232 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016025673470572782, + "loss": 1.5366, + "step": 18233 + }, + { + "epoch": 1.43, + "learning_rate": 0.000160244403883053, + "loss": 1.4507, + "step": 18234 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016023207299082438, + "loss": 1.5251, + "step": 18235 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016021974202912564, + "loss": 1.5448, + "step": 18236 + }, + { + "epoch": 1.43, + "learning_rate": 0.0001602074109980405, + "loss": 1.5494, + "step": 18237 + }, + { + "epoch": 1.43, + "learning_rate": 0.00016019507989765261, + "loss": 1.5501, + "step": 18238 + }, + { + "epoch": 1.44, + "learning_rate": 0.00016018274872804585, + "loss": 1.5355, + "step": 18239 + }, + { + "epoch": 1.44, + "learning_rate": 0.0001601704174893038, + "loss": 1.5767, + "step": 18240 + }, + { + "epoch": 1.44, + "learning_rate": 0.00016015808618151018, + "loss": 1.5325, + "step": 18241 + }, + { + "epoch": 1.44, + "learning_rate": 0.00016014575480474883, + "loss": 1.5685, + "step": 18242 + }, + { + "epoch": 1.44, + "learning_rate": 0.00016013342335910333, + "loss": 1.5301, + "step": 18243 + }, + { + "epoch": 1.44, + "learning_rate": 0.00016012109184465755, + "loss": 1.4817, + "step": 18244 + }, + { + "epoch": 1.44, + "learning_rate": 0.0001601087602614951, + "loss": 1.5511, + "step": 18245 + }, + { + "epoch": 1.44, + "learning_rate": 0.00016009642860969974, + "loss": 1.5371, + "step": 18246 + }, + { + "epoch": 1.44, + "learning_rate": 0.00016008409688935524, + "loss": 1.4936, + "step": 18247 + }, + { + "epoch": 1.44, + "learning_rate": 0.00016007176510054528, + "loss": 1.522, + "step": 18248 + }, + { + "epoch": 1.44, + "learning_rate": 0.0001600594332433536, + "loss": 1.5744, + "step": 18249 + }, + { + "epoch": 1.44, + "learning_rate": 0.0001600471013178639, + "loss": 1.5666, + "step": 18250 + }, + { + "epoch": 1.44, + "learning_rate": 0.0001600347693241599, + "loss": 1.5009, + "step": 18251 + }, + { + "epoch": 1.44, + "learning_rate": 0.00016002243726232537, + "loss": 1.499, + "step": 18252 + }, + { + "epoch": 1.44, + "learning_rate": 0.00016001010513244405, + "loss": 1.4907, + "step": 18253 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015999777293459962, + "loss": 1.5355, + "step": 18254 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015998544066887584, + "loss": 1.5465, + "step": 18255 + }, + { + "epoch": 1.44, + "learning_rate": 0.0001599731083353564, + "loss": 1.4528, + "step": 18256 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015996077593412512, + "loss": 1.4916, + "step": 18257 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015994844346526557, + "loss": 1.5139, + "step": 18258 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015993611092886167, + "loss": 1.5104, + "step": 18259 + }, + { + "epoch": 1.44, + "learning_rate": 0.000159923778324997, + "loss": 1.5134, + "step": 18260 + }, + { + "epoch": 1.44, + "learning_rate": 0.0001599114456537554, + "loss": 1.5124, + "step": 18261 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015989911291522052, + "loss": 1.5257, + "step": 18262 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015988678010947613, + "loss": 1.5103, + "step": 18263 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015987444723660597, + "loss": 1.5215, + "step": 18264 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015986211429669375, + "loss": 1.5098, + "step": 18265 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015984978128982322, + "loss": 1.5341, + "step": 18266 + }, + { + "epoch": 1.44, + "learning_rate": 0.0001598374482160781, + "loss": 1.5112, + "step": 18267 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015982511507554214, + "loss": 1.5398, + "step": 18268 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015981278186829912, + "loss": 1.4462, + "step": 18269 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015980044859443269, + "loss": 1.5259, + "step": 18270 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015978811525402663, + "loss": 1.5091, + "step": 18271 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015977578184716464, + "loss": 1.5084, + "step": 18272 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015976344837393048, + "loss": 1.487, + "step": 18273 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015975111483440793, + "loss": 1.5205, + "step": 18274 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015973878122868066, + "loss": 1.5164, + "step": 18275 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015972644755683248, + "loss": 1.5241, + "step": 18276 + }, + { + "epoch": 1.44, + "learning_rate": 0.0001597141138189471, + "loss": 1.5361, + "step": 18277 + }, + { + "epoch": 1.44, + "learning_rate": 0.0001597017800151082, + "loss": 1.5736, + "step": 18278 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015968944614539956, + "loss": 1.4561, + "step": 18279 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015967711220990494, + "loss": 1.5149, + "step": 18280 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015966477820870812, + "loss": 1.5356, + "step": 18281 + }, + { + "epoch": 1.44, + "learning_rate": 0.0001596524441418927, + "loss": 1.4704, + "step": 18282 + }, + { + "epoch": 1.44, + "learning_rate": 0.0001596401100095426, + "loss": 1.4897, + "step": 18283 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015962777581174142, + "loss": 1.5498, + "step": 18284 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015961544154857293, + "loss": 1.5769, + "step": 18285 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015960310722012096, + "loss": 1.467, + "step": 18286 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015959077282646917, + "loss": 1.5439, + "step": 18287 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015957843836770136, + "loss": 1.5664, + "step": 18288 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015956610384390118, + "loss": 1.4974, + "step": 18289 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015955376925515244, + "loss": 1.5422, + "step": 18290 + }, + { + "epoch": 1.44, + "learning_rate": 0.0001595414346015389, + "loss": 1.4635, + "step": 18291 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015952909988314426, + "loss": 1.5003, + "step": 18292 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015951676510005233, + "loss": 1.5555, + "step": 18293 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015950443025234678, + "loss": 1.5508, + "step": 18294 + }, + { + "epoch": 1.44, + "learning_rate": 0.0001594920953401114, + "loss": 1.513, + "step": 18295 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015947976036342996, + "loss": 1.5119, + "step": 18296 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015946742532238617, + "loss": 1.4915, + "step": 18297 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015945509021706377, + "loss": 1.5352, + "step": 18298 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015944275504754652, + "loss": 1.5344, + "step": 18299 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015943041981391818, + "loss": 1.4539, + "step": 18300 + }, + { + "epoch": 1.44, + "learning_rate": 0.0001594180845162625, + "loss": 1.5189, + "step": 18301 + }, + { + "epoch": 1.44, + "learning_rate": 0.0001594057491546632, + "loss": 1.5021, + "step": 18302 + }, + { + "epoch": 1.44, + "learning_rate": 0.0001593934137292041, + "loss": 1.5041, + "step": 18303 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015938107823996886, + "loss": 1.455, + "step": 18304 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015936874268704135, + "loss": 1.5012, + "step": 18305 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015935640707050514, + "loss": 1.5443, + "step": 18306 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015934407139044416, + "loss": 1.4868, + "step": 18307 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015933173564694207, + "loss": 1.5086, + "step": 18308 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015931939984008262, + "loss": 1.4964, + "step": 18309 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015930706396994964, + "loss": 1.5494, + "step": 18310 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015929472803662682, + "loss": 1.5113, + "step": 18311 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015928239204019792, + "loss": 1.5683, + "step": 18312 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015927005598074672, + "loss": 1.561, + "step": 18313 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015925771985835687, + "loss": 1.5105, + "step": 18314 + }, + { + "epoch": 1.44, + "learning_rate": 0.0001592453836731123, + "loss": 1.5882, + "step": 18315 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015923304742509664, + "loss": 1.4719, + "step": 18316 + }, + { + "epoch": 1.44, + "learning_rate": 0.0001592207111143937, + "loss": 1.5264, + "step": 18317 + }, + { + "epoch": 1.44, + "learning_rate": 0.0001592083747410872, + "loss": 1.5489, + "step": 18318 + }, + { + "epoch": 1.44, + "learning_rate": 0.0001591960383052609, + "loss": 1.5316, + "step": 18319 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015918370180699863, + "loss": 1.5094, + "step": 18320 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015917136524638405, + "loss": 1.5548, + "step": 18321 + }, + { + "epoch": 1.44, + "learning_rate": 0.000159159028623501, + "loss": 1.5511, + "step": 18322 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015914669193843316, + "loss": 1.554, + "step": 18323 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015913435519126435, + "loss": 1.5284, + "step": 18324 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015912201838207832, + "loss": 1.5427, + "step": 18325 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015910968151095878, + "loss": 1.4935, + "step": 18326 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015909734457798957, + "loss": 1.5239, + "step": 18327 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015908500758325442, + "loss": 1.5106, + "step": 18328 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015907267052683703, + "loss": 1.5101, + "step": 18329 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015906033340882123, + "loss": 1.5172, + "step": 18330 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015904799622929076, + "loss": 1.554, + "step": 18331 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015903565898832942, + "loss": 1.5144, + "step": 18332 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015902332168602095, + "loss": 1.5006, + "step": 18333 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015901098432244908, + "loss": 1.5364, + "step": 18334 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015899864689769758, + "loss": 1.5238, + "step": 18335 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015898630941185027, + "loss": 1.4959, + "step": 18336 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015897397186499083, + "loss": 1.5736, + "step": 18337 + }, + { + "epoch": 1.44, + "learning_rate": 0.0001589616342572031, + "loss": 1.5033, + "step": 18338 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015894929658857087, + "loss": 1.4745, + "step": 18339 + }, + { + "epoch": 1.44, + "learning_rate": 0.0001589369588591778, + "loss": 1.5898, + "step": 18340 + }, + { + "epoch": 1.44, + "learning_rate": 0.0001589246210691077, + "loss": 1.5147, + "step": 18341 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015891228321844437, + "loss": 1.5294, + "step": 18342 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015889994530727156, + "loss": 1.5262, + "step": 18343 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015888760733567307, + "loss": 1.5077, + "step": 18344 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015887526930373253, + "loss": 1.5599, + "step": 18345 + }, + { + "epoch": 1.44, + "learning_rate": 0.0001588629312115339, + "loss": 1.4666, + "step": 18346 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015885059305916082, + "loss": 1.5386, + "step": 18347 + }, + { + "epoch": 1.44, + "learning_rate": 0.0001588382548466971, + "loss": 1.5233, + "step": 18348 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015882591657422654, + "loss": 1.5366, + "step": 18349 + }, + { + "epoch": 1.44, + "learning_rate": 0.0001588135782418328, + "loss": 1.4977, + "step": 18350 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015880123984959982, + "loss": 1.4853, + "step": 18351 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015878890139761121, + "loss": 1.5634, + "step": 18352 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015877656288595078, + "loss": 1.495, + "step": 18353 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015876422431470243, + "loss": 1.4737, + "step": 18354 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015875188568394976, + "loss": 1.5278, + "step": 18355 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015873954699377666, + "loss": 1.5395, + "step": 18356 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015872720824426683, + "loss": 1.5662, + "step": 18357 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015871486943550407, + "loss": 1.5348, + "step": 18358 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015870253056757223, + "loss": 1.5271, + "step": 18359 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015869019164055492, + "loss": 1.5123, + "step": 18360 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015867785265453603, + "loss": 1.552, + "step": 18361 + }, + { + "epoch": 1.44, + "learning_rate": 0.0001586655136095993, + "loss": 1.5236, + "step": 18362 + }, + { + "epoch": 1.44, + "learning_rate": 0.00015865317450582854, + "loss": 1.5505, + "step": 18363 + }, + { + "epoch": 1.44, + "learning_rate": 0.0001586408353433075, + "loss": 1.5589, + "step": 18364 + }, + { + "epoch": 1.44, + "learning_rate": 0.0001586284961221199, + "loss": 1.5331, + "step": 18365 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015861615684234964, + "loss": 1.5027, + "step": 18366 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015860381750408043, + "loss": 1.5066, + "step": 18367 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015859147810739599, + "loss": 1.5208, + "step": 18368 + }, + { + "epoch": 1.45, + "learning_rate": 0.0001585791386523802, + "loss": 1.5124, + "step": 18369 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015856679913911676, + "loss": 1.499, + "step": 18370 + }, + { + "epoch": 1.45, + "learning_rate": 0.0001585544595676895, + "loss": 1.4659, + "step": 18371 + }, + { + "epoch": 1.45, + "learning_rate": 0.0001585421199381822, + "loss": 1.5514, + "step": 18372 + }, + { + "epoch": 1.45, + "learning_rate": 0.0001585297802506786, + "loss": 1.5361, + "step": 18373 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015851744050526253, + "loss": 1.5277, + "step": 18374 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015850510070201766, + "loss": 1.5434, + "step": 18375 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015849276084102792, + "loss": 1.5471, + "step": 18376 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015848042092237696, + "loss": 1.5412, + "step": 18377 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015846808094614872, + "loss": 1.528, + "step": 18378 + }, + { + "epoch": 1.45, + "learning_rate": 0.0001584557409124268, + "loss": 1.4718, + "step": 18379 + }, + { + "epoch": 1.45, + "learning_rate": 0.0001584434008212951, + "loss": 1.5059, + "step": 18380 + }, + { + "epoch": 1.45, + "learning_rate": 0.0001584310606728374, + "loss": 1.5476, + "step": 18381 + }, + { + "epoch": 1.45, + "learning_rate": 0.0001584187204671374, + "loss": 1.5422, + "step": 18382 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015840638020427896, + "loss": 1.5065, + "step": 18383 + }, + { + "epoch": 1.45, + "learning_rate": 0.0001583940398843458, + "loss": 1.5497, + "step": 18384 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015838169950742177, + "loss": 1.5303, + "step": 18385 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015836935907359058, + "loss": 1.5821, + "step": 18386 + }, + { + "epoch": 1.45, + "learning_rate": 0.0001583570185829361, + "loss": 1.4968, + "step": 18387 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015834467803554211, + "loss": 1.5369, + "step": 18388 + }, + { + "epoch": 1.45, + "learning_rate": 0.0001583323374314923, + "loss": 1.5282, + "step": 18389 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015831999677087057, + "loss": 1.5335, + "step": 18390 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015830765605376063, + "loss": 1.5448, + "step": 18391 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015829531528024627, + "loss": 1.5249, + "step": 18392 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015828297445041133, + "loss": 1.5552, + "step": 18393 + }, + { + "epoch": 1.45, + "learning_rate": 0.0001582706335643395, + "loss": 1.5694, + "step": 18394 + }, + { + "epoch": 1.45, + "learning_rate": 0.0001582582926221147, + "loss": 1.5194, + "step": 18395 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015824595162382062, + "loss": 1.5426, + "step": 18396 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015823361056954108, + "loss": 1.5219, + "step": 18397 + }, + { + "epoch": 1.45, + "learning_rate": 0.0001582212694593599, + "loss": 1.538, + "step": 18398 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015820892829336081, + "loss": 1.5479, + "step": 18399 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015819658707162763, + "loss": 1.5045, + "step": 18400 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015818424579424413, + "loss": 1.5251, + "step": 18401 + }, + { + "epoch": 1.45, + "learning_rate": 0.0001581719044612942, + "loss": 1.5016, + "step": 18402 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015815956307286145, + "loss": 1.5382, + "step": 18403 + }, + { + "epoch": 1.45, + "learning_rate": 0.0001581472216290298, + "loss": 1.5605, + "step": 18404 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015813488012988302, + "loss": 1.4537, + "step": 18405 + }, + { + "epoch": 1.45, + "learning_rate": 0.0001581225385755049, + "loss": 1.5217, + "step": 18406 + }, + { + "epoch": 1.45, + "learning_rate": 0.0001581101969659792, + "loss": 1.5176, + "step": 18407 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015809785530138972, + "loss": 1.5417, + "step": 18408 + }, + { + "epoch": 1.45, + "learning_rate": 0.0001580855135818203, + "loss": 1.4983, + "step": 18409 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015807317180735472, + "loss": 1.5643, + "step": 18410 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015806082997807676, + "loss": 1.5653, + "step": 18411 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015804848809407022, + "loss": 1.4866, + "step": 18412 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015803614615541884, + "loss": 1.5215, + "step": 18413 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015802380416220647, + "loss": 1.4794, + "step": 18414 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015801146211451696, + "loss": 1.5618, + "step": 18415 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015799912001243397, + "loss": 1.5264, + "step": 18416 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015798677785604142, + "loss": 1.5325, + "step": 18417 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015797443564542304, + "loss": 1.5, + "step": 18418 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015796209338066265, + "loss": 1.5277, + "step": 18419 + }, + { + "epoch": 1.45, + "learning_rate": 0.000157949751061844, + "loss": 1.5011, + "step": 18420 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015793740868905095, + "loss": 1.5034, + "step": 18421 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015792506626236731, + "loss": 1.4961, + "step": 18422 + }, + { + "epoch": 1.45, + "learning_rate": 0.0001579127237818768, + "loss": 1.4607, + "step": 18423 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015790038124766328, + "loss": 1.5298, + "step": 18424 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015788803865981053, + "loss": 1.5173, + "step": 18425 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015787569601840234, + "loss": 1.5528, + "step": 18426 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015786335332352251, + "loss": 1.5607, + "step": 18427 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015785101057525487, + "loss": 1.5008, + "step": 18428 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015783866777368323, + "loss": 1.4762, + "step": 18429 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015782632491889132, + "loss": 1.5158, + "step": 18430 + }, + { + "epoch": 1.45, + "learning_rate": 0.000157813982010963, + "loss": 1.5353, + "step": 18431 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015780163904998204, + "loss": 1.5412, + "step": 18432 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015778929603603225, + "loss": 1.5146, + "step": 18433 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015777695296919747, + "loss": 1.5214, + "step": 18434 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015776460984956144, + "loss": 1.5287, + "step": 18435 + }, + { + "epoch": 1.45, + "learning_rate": 0.000157752266677208, + "loss": 1.534, + "step": 18436 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015773992345222094, + "loss": 1.4948, + "step": 18437 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015772758017468412, + "loss": 1.4976, + "step": 18438 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015771523684468124, + "loss": 1.4924, + "step": 18439 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015770289346229616, + "loss": 1.5534, + "step": 18440 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015769055002761272, + "loss": 1.5112, + "step": 18441 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015767820654071467, + "loss": 1.5149, + "step": 18442 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015766586300168582, + "loss": 1.509, + "step": 18443 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015765351941061004, + "loss": 1.499, + "step": 18444 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015764117576757105, + "loss": 1.5159, + "step": 18445 + }, + { + "epoch": 1.45, + "learning_rate": 0.0001576288320726527, + "loss": 1.5331, + "step": 18446 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015761648832593878, + "loss": 1.5105, + "step": 18447 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015760414452751313, + "loss": 1.5321, + "step": 18448 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015759180067745948, + "loss": 1.5286, + "step": 18449 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015757945677586174, + "loss": 1.5066, + "step": 18450 + }, + { + "epoch": 1.45, + "learning_rate": 0.0001575671128228037, + "loss": 1.5256, + "step": 18451 + }, + { + "epoch": 1.45, + "learning_rate": 0.0001575547688183691, + "loss": 1.5347, + "step": 18452 + }, + { + "epoch": 1.45, + "learning_rate": 0.0001575424247626418, + "loss": 1.5588, + "step": 18453 + }, + { + "epoch": 1.45, + "learning_rate": 0.0001575300806557056, + "loss": 1.6047, + "step": 18454 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015751773649764423, + "loss": 1.543, + "step": 18455 + }, + { + "epoch": 1.45, + "learning_rate": 0.0001575053922885417, + "loss": 1.606, + "step": 18456 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015749304802848164, + "loss": 1.5577, + "step": 18457 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015748070371754793, + "loss": 1.5063, + "step": 18458 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015746835935582436, + "loss": 1.5642, + "step": 18459 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015745601494339477, + "loss": 1.5076, + "step": 18460 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015744367048034293, + "loss": 1.4982, + "step": 18461 + }, + { + "epoch": 1.45, + "learning_rate": 0.0001574313259667527, + "loss": 1.4818, + "step": 18462 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015741898140270781, + "loss": 1.5317, + "step": 18463 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015740663678829217, + "loss": 1.5202, + "step": 18464 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015739429212358955, + "loss": 1.4894, + "step": 18465 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015738194740868382, + "loss": 1.5871, + "step": 18466 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015736960264365867, + "loss": 1.5646, + "step": 18467 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015735725782859802, + "loss": 1.5523, + "step": 18468 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015734491296358563, + "loss": 1.5031, + "step": 18469 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015733256804870534, + "loss": 1.5602, + "step": 18470 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015732022308404095, + "loss": 1.5565, + "step": 18471 + }, + { + "epoch": 1.45, + "learning_rate": 0.0001573078780696763, + "loss": 1.5585, + "step": 18472 + }, + { + "epoch": 1.45, + "learning_rate": 0.0001572955330056952, + "loss": 1.4931, + "step": 18473 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015728318789218142, + "loss": 1.4949, + "step": 18474 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015727084272921886, + "loss": 1.4412, + "step": 18475 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015725849751689126, + "loss": 1.5552, + "step": 18476 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015724615225528248, + "loss": 1.5569, + "step": 18477 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015723380694447636, + "loss": 1.5176, + "step": 18478 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015722146158455658, + "loss": 1.5143, + "step": 18479 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015720911617560714, + "loss": 1.5146, + "step": 18480 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015719677071771176, + "loss": 1.4939, + "step": 18481 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015718442521095427, + "loss": 1.5439, + "step": 18482 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015717207965541854, + "loss": 1.5528, + "step": 18483 + }, + { + "epoch": 1.45, + "learning_rate": 0.0001571597340511883, + "loss": 1.52, + "step": 18484 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015714738839834745, + "loss": 1.5077, + "step": 18485 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015713504269697972, + "loss": 1.5077, + "step": 18486 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015712269694716905, + "loss": 1.5845, + "step": 18487 + }, + { + "epoch": 1.45, + "learning_rate": 0.0001571103511489992, + "loss": 1.489, + "step": 18488 + }, + { + "epoch": 1.45, + "learning_rate": 0.0001570980053025539, + "loss": 1.5477, + "step": 18489 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015708565940791716, + "loss": 1.529, + "step": 18490 + }, + { + "epoch": 1.45, + "learning_rate": 0.0001570733134651727, + "loss": 1.5188, + "step": 18491 + }, + { + "epoch": 1.45, + "learning_rate": 0.00015706096747440426, + "loss": 1.4948, + "step": 18492 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015704862143569584, + "loss": 1.5042, + "step": 18493 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015703627534913107, + "loss": 1.5349, + "step": 18494 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015702392921479398, + "loss": 1.5329, + "step": 18495 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015701158303276823, + "loss": 1.492, + "step": 18496 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015699923680313773, + "loss": 1.4873, + "step": 18497 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015698689052598625, + "loss": 1.4954, + "step": 18498 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015697454420139767, + "loss": 1.5047, + "step": 18499 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015696219782945574, + "loss": 1.5044, + "step": 18500 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015694985141024434, + "loss": 1.515, + "step": 18501 + }, + { + "epoch": 1.46, + "learning_rate": 0.0001569375049438473, + "loss": 1.5381, + "step": 18502 + }, + { + "epoch": 1.46, + "learning_rate": 0.0001569251584303484, + "loss": 1.5139, + "step": 18503 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015691281186983158, + "loss": 1.511, + "step": 18504 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015690046526238048, + "loss": 1.5242, + "step": 18505 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015688811860807908, + "loss": 1.4829, + "step": 18506 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015687577190701113, + "loss": 1.5428, + "step": 18507 + }, + { + "epoch": 1.46, + "learning_rate": 0.0001568634251592605, + "loss": 1.5203, + "step": 18508 + }, + { + "epoch": 1.46, + "learning_rate": 0.000156851078364911, + "loss": 1.4561, + "step": 18509 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015683873152404646, + "loss": 1.5367, + "step": 18510 + }, + { + "epoch": 1.46, + "learning_rate": 0.0001568263846367507, + "loss": 1.5207, + "step": 18511 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015681403770310756, + "loss": 1.4962, + "step": 18512 + }, + { + "epoch": 1.46, + "learning_rate": 0.0001568016907232009, + "loss": 1.5193, + "step": 18513 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015678934369711448, + "loss": 1.5195, + "step": 18514 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015677699662493212, + "loss": 1.63, + "step": 18515 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015676464950673772, + "loss": 1.5364, + "step": 18516 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015675230234261513, + "loss": 1.5323, + "step": 18517 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015673995513264808, + "loss": 1.4884, + "step": 18518 + }, + { + "epoch": 1.46, + "learning_rate": 0.0001567276078769205, + "loss": 1.5124, + "step": 18519 + }, + { + "epoch": 1.46, + "learning_rate": 0.0001567152605755161, + "loss": 1.4992, + "step": 18520 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015670291322851884, + "loss": 1.5429, + "step": 18521 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015669056583601253, + "loss": 1.4732, + "step": 18522 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015667821839808092, + "loss": 1.5495, + "step": 18523 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015666587091480791, + "loss": 1.5366, + "step": 18524 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015665352338627733, + "loss": 1.5251, + "step": 18525 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015664117581257295, + "loss": 1.5215, + "step": 18526 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015662882819377866, + "loss": 1.5734, + "step": 18527 + }, + { + "epoch": 1.46, + "learning_rate": 0.0001566164805299783, + "loss": 1.5296, + "step": 18528 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015660413282125575, + "loss": 1.5198, + "step": 18529 + }, + { + "epoch": 1.46, + "learning_rate": 0.0001565917850676947, + "loss": 1.5249, + "step": 18530 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015657943726937913, + "loss": 1.4983, + "step": 18531 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015656708942639276, + "loss": 1.5473, + "step": 18532 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015655474153881946, + "loss": 1.4946, + "step": 18533 + }, + { + "epoch": 1.46, + "learning_rate": 0.0001565423936067431, + "loss": 1.5369, + "step": 18534 + }, + { + "epoch": 1.46, + "learning_rate": 0.0001565300456302475, + "loss": 1.5488, + "step": 18535 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015651769760941656, + "loss": 1.5582, + "step": 18536 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015650534954433397, + "loss": 1.506, + "step": 18537 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015649300143508367, + "loss": 1.5748, + "step": 18538 + }, + { + "epoch": 1.46, + "learning_rate": 0.0001564806532817495, + "loss": 1.5279, + "step": 18539 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015646830508441522, + "loss": 1.5013, + "step": 18540 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015645595684316474, + "loss": 1.4827, + "step": 18541 + }, + { + "epoch": 1.46, + "learning_rate": 0.0001564436085580819, + "loss": 1.5226, + "step": 18542 + }, + { + "epoch": 1.46, + "learning_rate": 0.0001564312602292505, + "loss": 1.5047, + "step": 18543 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015641891185675438, + "loss": 1.4942, + "step": 18544 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015640656344067738, + "loss": 1.5462, + "step": 18545 + }, + { + "epoch": 1.46, + "learning_rate": 0.0001563942149811034, + "loss": 1.5109, + "step": 18546 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015638186647811618, + "loss": 1.52, + "step": 18547 + }, + { + "epoch": 1.46, + "learning_rate": 0.0001563695179317996, + "loss": 1.535, + "step": 18548 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015635716934223753, + "loss": 1.5147, + "step": 18549 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015634482070951377, + "loss": 1.5568, + "step": 18550 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015633247203371221, + "loss": 1.5636, + "step": 18551 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015632012331491668, + "loss": 1.5634, + "step": 18552 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015630777455321096, + "loss": 1.501, + "step": 18553 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015629542574867894, + "loss": 1.57, + "step": 18554 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015628307690140441, + "loss": 1.5235, + "step": 18555 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015627072801147133, + "loss": 1.5404, + "step": 18556 + }, + { + "epoch": 1.46, + "learning_rate": 0.0001562583790789634, + "loss": 1.5753, + "step": 18557 + }, + { + "epoch": 1.46, + "learning_rate": 0.0001562460301039646, + "loss": 1.5417, + "step": 18558 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015623368108655866, + "loss": 1.5163, + "step": 18559 + }, + { + "epoch": 1.46, + "learning_rate": 0.0001562213320268295, + "loss": 1.4863, + "step": 18560 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015620898292486088, + "loss": 1.4899, + "step": 18561 + }, + { + "epoch": 1.46, + "learning_rate": 0.0001561966337807367, + "loss": 1.4857, + "step": 18562 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015618428459454085, + "loss": 1.4977, + "step": 18563 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015617193536635707, + "loss": 1.5166, + "step": 18564 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015615958609626926, + "loss": 1.5337, + "step": 18565 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015614723678436125, + "loss": 1.5019, + "step": 18566 + }, + { + "epoch": 1.46, + "learning_rate": 0.0001561348874307169, + "loss": 1.5334, + "step": 18567 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015612253803542008, + "loss": 1.5942, + "step": 18568 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015611018859855457, + "loss": 1.5074, + "step": 18569 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015609783912020432, + "loss": 1.5037, + "step": 18570 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015608548960045304, + "loss": 1.5278, + "step": 18571 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015607314003938464, + "loss": 1.5471, + "step": 18572 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015606079043708297, + "loss": 1.5342, + "step": 18573 + }, + { + "epoch": 1.46, + "learning_rate": 0.0001560484407936319, + "loss": 1.4888, + "step": 18574 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015603609110911526, + "loss": 1.4603, + "step": 18575 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015602374138361689, + "loss": 1.5451, + "step": 18576 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015601139161722062, + "loss": 1.5411, + "step": 18577 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015599904181001035, + "loss": 1.473, + "step": 18578 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015598669196206988, + "loss": 1.5198, + "step": 18579 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015597434207348309, + "loss": 1.5052, + "step": 18580 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015596199214433376, + "loss": 1.4874, + "step": 18581 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015594964217470583, + "loss": 1.4482, + "step": 18582 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015593729216468313, + "loss": 1.5694, + "step": 18583 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015592494211434947, + "loss": 1.5321, + "step": 18584 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015591259202378874, + "loss": 1.5608, + "step": 18585 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015590024189308474, + "loss": 1.4458, + "step": 18586 + }, + { + "epoch": 1.46, + "learning_rate": 0.0001558878917223214, + "loss": 1.5578, + "step": 18587 + }, + { + "epoch": 1.46, + "learning_rate": 0.0001558755415115825, + "loss": 1.5731, + "step": 18588 + }, + { + "epoch": 1.46, + "learning_rate": 0.0001558631912609519, + "loss": 1.4784, + "step": 18589 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015585084097051346, + "loss": 1.4835, + "step": 18590 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015583849064035107, + "loss": 1.5097, + "step": 18591 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015582614027054856, + "loss": 1.5711, + "step": 18592 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015581378986118975, + "loss": 1.5442, + "step": 18593 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015580143941235853, + "loss": 1.5194, + "step": 18594 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015578908892413873, + "loss": 1.5162, + "step": 18595 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015577673839661416, + "loss": 1.5182, + "step": 18596 + }, + { + "epoch": 1.46, + "learning_rate": 0.0001557643878298688, + "loss": 1.58, + "step": 18597 + }, + { + "epoch": 1.46, + "learning_rate": 0.0001557520372239864, + "loss": 1.4901, + "step": 18598 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015573968657905086, + "loss": 1.5889, + "step": 18599 + }, + { + "epoch": 1.46, + "learning_rate": 0.000155727335895146, + "loss": 1.5716, + "step": 18600 + }, + { + "epoch": 1.46, + "learning_rate": 0.0001557149851723557, + "loss": 1.4895, + "step": 18601 + }, + { + "epoch": 1.46, + "learning_rate": 0.0001557026344107638, + "loss": 1.4913, + "step": 18602 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015569028361045413, + "loss": 1.5669, + "step": 18603 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015567793277151056, + "loss": 1.52, + "step": 18604 + }, + { + "epoch": 1.46, + "learning_rate": 0.000155665581894017, + "loss": 1.4739, + "step": 18605 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015565323097805727, + "loss": 1.4933, + "step": 18606 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015564088002371524, + "loss": 1.5128, + "step": 18607 + }, + { + "epoch": 1.46, + "learning_rate": 0.0001556285290310747, + "loss": 1.5845, + "step": 18608 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015561617800021957, + "loss": 1.5622, + "step": 18609 + }, + { + "epoch": 1.46, + "learning_rate": 0.0001556038269312337, + "loss": 1.5431, + "step": 18610 + }, + { + "epoch": 1.46, + "learning_rate": 0.0001555914758242009, + "loss": 1.4713, + "step": 18611 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015557912467920512, + "loss": 1.5174, + "step": 18612 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015556677349633013, + "loss": 1.4884, + "step": 18613 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015555442227565983, + "loss": 1.5114, + "step": 18614 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015554207101727807, + "loss": 1.5431, + "step": 18615 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015552971972126873, + "loss": 1.4914, + "step": 18616 + }, + { + "epoch": 1.46, + "learning_rate": 0.00015551736838771558, + "loss": 1.5145, + "step": 18617 + }, + { + "epoch": 1.46, + "learning_rate": 0.0001555050170167026, + "loss": 1.5241, + "step": 18618 + }, + { + "epoch": 1.46, + "learning_rate": 0.0001554926656083136, + "loss": 1.4862, + "step": 18619 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015548031416263235, + "loss": 1.5621, + "step": 18620 + }, + { + "epoch": 1.47, + "learning_rate": 0.0001554679626797429, + "loss": 1.5073, + "step": 18621 + }, + { + "epoch": 1.47, + "learning_rate": 0.0001554556111597289, + "loss": 1.5225, + "step": 18622 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015544325960267435, + "loss": 1.4954, + "step": 18623 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015543090800866313, + "loss": 1.5183, + "step": 18624 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015541855637777897, + "loss": 1.4942, + "step": 18625 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015540620471010582, + "loss": 1.4675, + "step": 18626 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015539385300572753, + "loss": 1.5118, + "step": 18627 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015538150126472795, + "loss": 1.5242, + "step": 18628 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015536914948719095, + "loss": 1.5169, + "step": 18629 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015535679767320035, + "loss": 1.4842, + "step": 18630 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015534444582284015, + "loss": 1.4854, + "step": 18631 + }, + { + "epoch": 1.47, + "learning_rate": 0.000155332093936194, + "loss": 1.5372, + "step": 18632 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015531974201334593, + "loss": 1.569, + "step": 18633 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015530739005437975, + "loss": 1.566, + "step": 18634 + }, + { + "epoch": 1.47, + "learning_rate": 0.0001552950380593793, + "loss": 1.4973, + "step": 18635 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015528268602842848, + "loss": 1.5255, + "step": 18636 + }, + { + "epoch": 1.47, + "learning_rate": 0.0001552703339616111, + "loss": 1.4667, + "step": 18637 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015525798185901112, + "loss": 1.5172, + "step": 18638 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015524562972071232, + "loss": 1.5007, + "step": 18639 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015523327754679857, + "loss": 1.4981, + "step": 18640 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015522092533735377, + "loss": 1.4664, + "step": 18641 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015520857309246177, + "loss": 1.479, + "step": 18642 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015519622081220643, + "loss": 1.5245, + "step": 18643 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015518386849667162, + "loss": 1.5344, + "step": 18644 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015517151614594118, + "loss": 1.4651, + "step": 18645 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015515916376009902, + "loss": 1.4933, + "step": 18646 + }, + { + "epoch": 1.47, + "learning_rate": 0.000155146811339229, + "loss": 1.5644, + "step": 18647 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015513445888341499, + "loss": 1.5079, + "step": 18648 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015512210639274078, + "loss": 1.5315, + "step": 18649 + }, + { + "epoch": 1.47, + "learning_rate": 0.0001551097538672903, + "loss": 1.5152, + "step": 18650 + }, + { + "epoch": 1.47, + "learning_rate": 0.0001550974013071474, + "loss": 1.4831, + "step": 18651 + }, + { + "epoch": 1.47, + "learning_rate": 0.000155085048712396, + "loss": 1.5458, + "step": 18652 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015507269608311996, + "loss": 1.5106, + "step": 18653 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015506034341940305, + "loss": 1.531, + "step": 18654 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015504799072132923, + "loss": 1.498, + "step": 18655 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015503563798898232, + "loss": 1.5371, + "step": 18656 + }, + { + "epoch": 1.47, + "learning_rate": 0.0001550232852224462, + "loss": 1.4416, + "step": 18657 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015501093242180477, + "loss": 1.5272, + "step": 18658 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015499857958714184, + "loss": 1.4876, + "step": 18659 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015498622671854134, + "loss": 1.4853, + "step": 18660 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015497387381608712, + "loss": 1.475, + "step": 18661 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015496152087986301, + "loss": 1.5227, + "step": 18662 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015494916790995293, + "loss": 1.5135, + "step": 18663 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015493681490644074, + "loss": 1.5745, + "step": 18664 + }, + { + "epoch": 1.47, + "learning_rate": 0.0001549244618694103, + "loss": 1.5262, + "step": 18665 + }, + { + "epoch": 1.47, + "learning_rate": 0.0001549121087989455, + "loss": 1.5424, + "step": 18666 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015489975569513015, + "loss": 1.512, + "step": 18667 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015488740255804816, + "loss": 1.5418, + "step": 18668 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015487504938778342, + "loss": 1.5175, + "step": 18669 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015486269618441981, + "loss": 1.5158, + "step": 18670 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015485034294804116, + "loss": 1.5153, + "step": 18671 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015483798967873136, + "loss": 1.5335, + "step": 18672 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015482563637657425, + "loss": 1.5227, + "step": 18673 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015481328304165376, + "loss": 1.5509, + "step": 18674 + }, + { + "epoch": 1.47, + "learning_rate": 0.0001548009296740537, + "loss": 1.5293, + "step": 18675 + }, + { + "epoch": 1.47, + "learning_rate": 0.000154788576273858, + "loss": 1.4979, + "step": 18676 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015477622284115053, + "loss": 1.5313, + "step": 18677 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015476386937601512, + "loss": 1.5393, + "step": 18678 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015475151587853565, + "loss": 1.5466, + "step": 18679 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015473916234879607, + "loss": 1.5644, + "step": 18680 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015472680878688013, + "loss": 1.5228, + "step": 18681 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015471445519287184, + "loss": 1.5318, + "step": 18682 + }, + { + "epoch": 1.47, + "learning_rate": 0.0001547021015668549, + "loss": 1.4697, + "step": 18683 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015468974790891336, + "loss": 1.5769, + "step": 18684 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015467739421913098, + "loss": 1.5023, + "step": 18685 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015466504049759167, + "loss": 1.5121, + "step": 18686 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015465268674437938, + "loss": 1.4844, + "step": 18687 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015464033295957785, + "loss": 1.5357, + "step": 18688 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015462797914327106, + "loss": 1.509, + "step": 18689 + }, + { + "epoch": 1.47, + "learning_rate": 0.0001546156252955428, + "loss": 1.5052, + "step": 18690 + }, + { + "epoch": 1.47, + "learning_rate": 0.000154603271416477, + "loss": 1.5093, + "step": 18691 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015459091750615755, + "loss": 1.505, + "step": 18692 + }, + { + "epoch": 1.47, + "learning_rate": 0.0001545785635646683, + "loss": 1.551, + "step": 18693 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015456620959209314, + "loss": 1.518, + "step": 18694 + }, + { + "epoch": 1.47, + "learning_rate": 0.0001545538555885159, + "loss": 1.5318, + "step": 18695 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015454150155402052, + "loss": 1.4931, + "step": 18696 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015452914748869087, + "loss": 1.5311, + "step": 18697 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015451679339261077, + "loss": 1.5501, + "step": 18698 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015450443926586413, + "loss": 1.5472, + "step": 18699 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015449208510853485, + "loss": 1.5511, + "step": 18700 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015447973092070678, + "loss": 1.5199, + "step": 18701 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015446737670246386, + "loss": 1.5515, + "step": 18702 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015445502245388983, + "loss": 1.5, + "step": 18703 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015444266817506876, + "loss": 1.5362, + "step": 18704 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015443031386608435, + "loss": 1.5319, + "step": 18705 + }, + { + "epoch": 1.47, + "learning_rate": 0.0001544179595270206, + "loss": 1.5423, + "step": 18706 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015440560515796127, + "loss": 1.5129, + "step": 18707 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015439325075899035, + "loss": 1.4887, + "step": 18708 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015438089633019173, + "loss": 1.5701, + "step": 18709 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015436854187164916, + "loss": 1.4749, + "step": 18710 + }, + { + "epoch": 1.47, + "learning_rate": 0.0001543561873834467, + "loss": 1.5257, + "step": 18711 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015434383286566807, + "loss": 1.5223, + "step": 18712 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015433147831839722, + "loss": 1.5698, + "step": 18713 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015431912374171797, + "loss": 1.5027, + "step": 18714 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015430676913571432, + "loss": 1.5503, + "step": 18715 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015429441450047008, + "loss": 1.5118, + "step": 18716 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015428205983606912, + "loss": 1.5407, + "step": 18717 + }, + { + "epoch": 1.47, + "learning_rate": 0.0001542697051425953, + "loss": 1.507, + "step": 18718 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015425735042013262, + "loss": 1.5054, + "step": 18719 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015424499566876485, + "loss": 1.4848, + "step": 18720 + }, + { + "epoch": 1.47, + "learning_rate": 0.0001542326408885759, + "loss": 1.4745, + "step": 18721 + }, + { + "epoch": 1.47, + "learning_rate": 0.0001542202860796496, + "loss": 1.5408, + "step": 18722 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015420793124206996, + "loss": 1.5437, + "step": 18723 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015419557637592074, + "loss": 1.5006, + "step": 18724 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015418322148128588, + "loss": 1.5566, + "step": 18725 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015417086655824928, + "loss": 1.4912, + "step": 18726 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015415851160689478, + "loss": 1.5143, + "step": 18727 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015414615662730634, + "loss": 1.5133, + "step": 18728 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015413380161956766, + "loss": 1.4866, + "step": 18729 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015412144658376282, + "loss": 1.5435, + "step": 18730 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015410909151997564, + "loss": 1.5553, + "step": 18731 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015409673642828998, + "loss": 1.512, + "step": 18732 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015408438130878977, + "loss": 1.5068, + "step": 18733 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015407202616155884, + "loss": 1.5389, + "step": 18734 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015405967098668108, + "loss": 1.4694, + "step": 18735 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015404731578424046, + "loss": 1.5331, + "step": 18736 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015403496055432073, + "loss": 1.4915, + "step": 18737 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015402260529700585, + "loss": 1.4881, + "step": 18738 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015401025001237972, + "loss": 1.5502, + "step": 18739 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015399789470052621, + "loss": 1.4938, + "step": 18740 + }, + { + "epoch": 1.47, + "learning_rate": 0.0001539855393615292, + "loss": 1.5229, + "step": 18741 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015397318399547257, + "loss": 1.5251, + "step": 18742 + }, + { + "epoch": 1.47, + "learning_rate": 0.0001539608286024402, + "loss": 1.5404, + "step": 18743 + }, + { + "epoch": 1.47, + "learning_rate": 0.000153948473182516, + "loss": 1.5029, + "step": 18744 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015393611773578385, + "loss": 1.5715, + "step": 18745 + }, + { + "epoch": 1.47, + "learning_rate": 0.00015392376226232762, + "loss": 1.5162, + "step": 18746 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015391140676223122, + "loss": 1.5232, + "step": 18747 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015389905123557856, + "loss": 1.5321, + "step": 18748 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015388669568245345, + "loss": 1.502, + "step": 18749 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015387434010293987, + "loss": 1.5396, + "step": 18750 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015386198449712158, + "loss": 1.5425, + "step": 18751 + }, + { + "epoch": 1.48, + "learning_rate": 0.0001538496288650826, + "loss": 1.5405, + "step": 18752 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015383727320690676, + "loss": 1.4937, + "step": 18753 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015382491752267792, + "loss": 1.5331, + "step": 18754 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015381256181248005, + "loss": 1.5057, + "step": 18755 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015380020607639694, + "loss": 1.5152, + "step": 18756 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015378785031451258, + "loss": 1.4946, + "step": 18757 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015377549452691078, + "loss": 1.499, + "step": 18758 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015376313871367546, + "loss": 1.5454, + "step": 18759 + }, + { + "epoch": 1.48, + "learning_rate": 0.0001537507828748905, + "loss": 1.5292, + "step": 18760 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015373842701063976, + "loss": 1.4765, + "step": 18761 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015372607112100722, + "loss": 1.4846, + "step": 18762 + }, + { + "epoch": 1.48, + "learning_rate": 0.0001537137152060767, + "loss": 1.5723, + "step": 18763 + }, + { + "epoch": 1.48, + "learning_rate": 0.0001537013592659321, + "loss": 1.5154, + "step": 18764 + }, + { + "epoch": 1.48, + "learning_rate": 0.0001536890033006573, + "loss": 1.5288, + "step": 18765 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015367664731033622, + "loss": 1.5391, + "step": 18766 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015366429129505275, + "loss": 1.5238, + "step": 18767 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015365193525489071, + "loss": 1.5834, + "step": 18768 + }, + { + "epoch": 1.48, + "learning_rate": 0.0001536395791899341, + "loss": 1.5027, + "step": 18769 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015362722310026673, + "loss": 1.5088, + "step": 18770 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015361486698597249, + "loss": 1.4959, + "step": 18771 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015360251084713537, + "loss": 1.513, + "step": 18772 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015359015468383914, + "loss": 1.5192, + "step": 18773 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015357779849616772, + "loss": 1.5347, + "step": 18774 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015356544228420507, + "loss": 1.5, + "step": 18775 + }, + { + "epoch": 1.48, + "learning_rate": 0.000153553086048035, + "loss": 1.4913, + "step": 18776 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015354072978774144, + "loss": 1.5776, + "step": 18777 + }, + { + "epoch": 1.48, + "learning_rate": 0.0001535283735034083, + "loss": 1.4522, + "step": 18778 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015351601719511943, + "loss": 1.5955, + "step": 18779 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015350366086295874, + "loss": 1.5522, + "step": 18780 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015349130450701014, + "loss": 1.5428, + "step": 18781 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015347894812735755, + "loss": 1.566, + "step": 18782 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015346659172408477, + "loss": 1.4537, + "step": 18783 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015345423529727572, + "loss": 1.5274, + "step": 18784 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015344187884701438, + "loss": 1.4982, + "step": 18785 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015342952237338452, + "loss": 1.5222, + "step": 18786 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015341716587647015, + "loss": 1.4943, + "step": 18787 + }, + { + "epoch": 1.48, + "learning_rate": 0.0001534048093563551, + "loss": 1.5136, + "step": 18788 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015339245281312329, + "loss": 1.5473, + "step": 18789 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015338009624685857, + "loss": 1.5211, + "step": 18790 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015336773965764482, + "loss": 1.4549, + "step": 18791 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015335538304556606, + "loss": 1.5352, + "step": 18792 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015334302641070602, + "loss": 1.4732, + "step": 18793 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015333066975314877, + "loss": 1.5119, + "step": 18794 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015331831307297802, + "loss": 1.4907, + "step": 18795 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015330595637027782, + "loss": 1.4949, + "step": 18796 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015329359964513195, + "loss": 1.5064, + "step": 18797 + }, + { + "epoch": 1.48, + "learning_rate": 0.0001532812428976244, + "loss": 1.4889, + "step": 18798 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015326888612783902, + "loss": 1.4947, + "step": 18799 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015325652933585965, + "loss": 1.481, + "step": 18800 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015324417252177028, + "loss": 1.5114, + "step": 18801 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015323181568565475, + "loss": 1.4846, + "step": 18802 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015321945882759702, + "loss": 1.5144, + "step": 18803 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015320710194768091, + "loss": 1.5215, + "step": 18804 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015319474504599037, + "loss": 1.537, + "step": 18805 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015318238812260927, + "loss": 1.5812, + "step": 18806 + }, + { + "epoch": 1.48, + "learning_rate": 0.0001531700311776215, + "loss": 1.5279, + "step": 18807 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015315767421111092, + "loss": 1.5649, + "step": 18808 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015314531722316151, + "loss": 1.5196, + "step": 18809 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015313296021385715, + "loss": 1.5287, + "step": 18810 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015312060318328172, + "loss": 1.4942, + "step": 18811 + }, + { + "epoch": 1.48, + "learning_rate": 0.0001531082461315191, + "loss": 1.523, + "step": 18812 + }, + { + "epoch": 1.48, + "learning_rate": 0.0001530958890586532, + "loss": 1.4953, + "step": 18813 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015308353196476796, + "loss": 1.4731, + "step": 18814 + }, + { + "epoch": 1.48, + "learning_rate": 0.0001530711748499472, + "loss": 1.5341, + "step": 18815 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015305881771427487, + "loss": 1.4921, + "step": 18816 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015304646055783487, + "loss": 1.4886, + "step": 18817 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015303410338071108, + "loss": 1.5189, + "step": 18818 + }, + { + "epoch": 1.48, + "learning_rate": 0.0001530217461829874, + "loss": 1.4811, + "step": 18819 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015300938896474768, + "loss": 1.5299, + "step": 18820 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015299703172607593, + "loss": 1.4689, + "step": 18821 + }, + { + "epoch": 1.48, + "learning_rate": 0.000152984674467056, + "loss": 1.5491, + "step": 18822 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015297231718777176, + "loss": 1.4636, + "step": 18823 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015295995988830706, + "loss": 1.541, + "step": 18824 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015294760256874594, + "loss": 1.5524, + "step": 18825 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015293524522917219, + "loss": 1.4928, + "step": 18826 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015292288786966976, + "loss": 1.4907, + "step": 18827 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015291053049032257, + "loss": 1.5266, + "step": 18828 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015289817309121446, + "loss": 1.4845, + "step": 18829 + }, + { + "epoch": 1.48, + "learning_rate": 0.0001528858156724293, + "loss": 1.5212, + "step": 18830 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015287345823405114, + "loss": 1.5156, + "step": 18831 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015286110077616369, + "loss": 1.48, + "step": 18832 + }, + { + "epoch": 1.48, + "learning_rate": 0.000152848743298851, + "loss": 1.4918, + "step": 18833 + }, + { + "epoch": 1.48, + "learning_rate": 0.0001528363858021969, + "loss": 1.4945, + "step": 18834 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015282402828628531, + "loss": 1.4896, + "step": 18835 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015281167075120014, + "loss": 1.5639, + "step": 18836 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015279931319702527, + "loss": 1.5718, + "step": 18837 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015278695562384457, + "loss": 1.5311, + "step": 18838 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015277459803174205, + "loss": 1.5497, + "step": 18839 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015276224042080146, + "loss": 1.5162, + "step": 18840 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015274988279110683, + "loss": 1.4989, + "step": 18841 + }, + { + "epoch": 1.48, + "learning_rate": 0.000152737525142742, + "loss": 1.4681, + "step": 18842 + }, + { + "epoch": 1.48, + "learning_rate": 0.0001527251674757909, + "loss": 1.5568, + "step": 18843 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015271280979033738, + "loss": 1.527, + "step": 18844 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015270045208646543, + "loss": 1.5067, + "step": 18845 + }, + { + "epoch": 1.48, + "learning_rate": 0.0001526880943642589, + "loss": 1.5569, + "step": 18846 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015267573662380163, + "loss": 1.5169, + "step": 18847 + }, + { + "epoch": 1.48, + "learning_rate": 0.0001526633788651776, + "loss": 1.4862, + "step": 18848 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015265102108847074, + "loss": 1.5289, + "step": 18849 + }, + { + "epoch": 1.48, + "learning_rate": 0.0001526386632937649, + "loss": 1.5268, + "step": 18850 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015262630548114396, + "loss": 1.542, + "step": 18851 + }, + { + "epoch": 1.48, + "learning_rate": 0.0001526139476506919, + "loss": 1.4921, + "step": 18852 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015260158980249256, + "loss": 1.4521, + "step": 18853 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015258923193662983, + "loss": 1.4814, + "step": 18854 + }, + { + "epoch": 1.48, + "learning_rate": 0.0001525768740531877, + "loss": 1.5388, + "step": 18855 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015256451615224993, + "loss": 1.5405, + "step": 18856 + }, + { + "epoch": 1.48, + "learning_rate": 0.0001525521582339006, + "loss": 1.5213, + "step": 18857 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015253980029822348, + "loss": 1.5028, + "step": 18858 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015252744234530254, + "loss": 1.5052, + "step": 18859 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015251508437522164, + "loss": 1.549, + "step": 18860 + }, + { + "epoch": 1.48, + "learning_rate": 0.0001525027263880647, + "loss": 1.5042, + "step": 18861 + }, + { + "epoch": 1.48, + "learning_rate": 0.0001524903683839157, + "loss": 1.5726, + "step": 18862 + }, + { + "epoch": 1.48, + "learning_rate": 0.0001524780103628584, + "loss": 1.5506, + "step": 18863 + }, + { + "epoch": 1.48, + "learning_rate": 0.0001524656523249768, + "loss": 1.508, + "step": 18864 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015245329427035476, + "loss": 1.5335, + "step": 18865 + }, + { + "epoch": 1.48, + "learning_rate": 0.0001524409361990762, + "loss": 1.4732, + "step": 18866 + }, + { + "epoch": 1.48, + "learning_rate": 0.0001524285781112251, + "loss": 1.4634, + "step": 18867 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015241622000688524, + "loss": 1.5246, + "step": 18868 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015240386188614057, + "loss": 1.4851, + "step": 18869 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015239150374907504, + "loss": 1.4728, + "step": 18870 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015237914559577246, + "loss": 1.4819, + "step": 18871 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015236678742631686, + "loss": 1.5154, + "step": 18872 + }, + { + "epoch": 1.48, + "learning_rate": 0.00015235442924079202, + "loss": 1.5164, + "step": 18873 + }, + { + "epoch": 1.49, + "learning_rate": 0.000152342071039282, + "loss": 1.4833, + "step": 18874 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015232971282187052, + "loss": 1.5143, + "step": 18875 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015231735458864158, + "loss": 1.5101, + "step": 18876 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015230499633967916, + "loss": 1.5171, + "step": 18877 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015229263807506698, + "loss": 1.523, + "step": 18878 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015228027979488913, + "loss": 1.5197, + "step": 18879 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015226792149922942, + "loss": 1.504, + "step": 18880 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015225556318817178, + "loss": 1.538, + "step": 18881 + }, + { + "epoch": 1.49, + "learning_rate": 0.0001522432048618001, + "loss": 1.527, + "step": 18882 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015223084652019828, + "loss": 1.5743, + "step": 18883 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015221848816345025, + "loss": 1.5521, + "step": 18884 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015220612979163992, + "loss": 1.5308, + "step": 18885 + }, + { + "epoch": 1.49, + "learning_rate": 0.0001521937714048512, + "loss": 1.5629, + "step": 18886 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015218141300316795, + "loss": 1.5847, + "step": 18887 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015216905458667412, + "loss": 1.558, + "step": 18888 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015215669615545365, + "loss": 1.5527, + "step": 18889 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015214433770959033, + "loss": 1.4879, + "step": 18890 + }, + { + "epoch": 1.49, + "learning_rate": 0.0001521319792491682, + "loss": 1.5797, + "step": 18891 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015211962077427106, + "loss": 1.493, + "step": 18892 + }, + { + "epoch": 1.49, + "learning_rate": 0.0001521072622849829, + "loss": 1.5495, + "step": 18893 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015209490378138762, + "loss": 1.4694, + "step": 18894 + }, + { + "epoch": 1.49, + "learning_rate": 0.000152082545263569, + "loss": 1.5198, + "step": 18895 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015207018673161113, + "loss": 1.5058, + "step": 18896 + }, + { + "epoch": 1.49, + "learning_rate": 0.0001520578281855978, + "loss": 1.5034, + "step": 18897 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015204546962561296, + "loss": 1.5348, + "step": 18898 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015203311105174052, + "loss": 1.5272, + "step": 18899 + }, + { + "epoch": 1.49, + "learning_rate": 0.0001520207524640644, + "loss": 1.5116, + "step": 18900 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015200839386266847, + "loss": 1.5168, + "step": 18901 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015199603524763662, + "loss": 1.5071, + "step": 18902 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015198367661905282, + "loss": 1.4791, + "step": 18903 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015197131797700092, + "loss": 1.4887, + "step": 18904 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015195895932156487, + "loss": 1.5082, + "step": 18905 + }, + { + "epoch": 1.49, + "learning_rate": 0.0001519466006528286, + "loss": 1.5403, + "step": 18906 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015193424197087598, + "loss": 1.5118, + "step": 18907 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015192188327579093, + "loss": 1.5523, + "step": 18908 + }, + { + "epoch": 1.49, + "learning_rate": 0.0001519095245676573, + "loss": 1.496, + "step": 18909 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015189716584655907, + "loss": 1.482, + "step": 18910 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015188480711258016, + "loss": 1.4868, + "step": 18911 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015187244836580442, + "loss": 1.5177, + "step": 18912 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015186008960631586, + "loss": 1.4621, + "step": 18913 + }, + { + "epoch": 1.49, + "learning_rate": 0.0001518477308341982, + "loss": 1.5026, + "step": 18914 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015183537204953556, + "loss": 1.4869, + "step": 18915 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015182301325241174, + "loss": 1.5326, + "step": 18916 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015181065444291064, + "loss": 1.5294, + "step": 18917 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015179829562111624, + "loss": 1.5487, + "step": 18918 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015178593678711233, + "loss": 1.5112, + "step": 18919 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015177357794098295, + "loss": 1.4723, + "step": 18920 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015176121908281196, + "loss": 1.5087, + "step": 18921 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015174886021268323, + "loss": 1.5002, + "step": 18922 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015173650133068074, + "loss": 1.5113, + "step": 18923 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015172414243688835, + "loss": 1.5073, + "step": 18924 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015171178353138993, + "loss": 1.5387, + "step": 18925 + }, + { + "epoch": 1.49, + "learning_rate": 0.0001516994246142695, + "loss": 1.5315, + "step": 18926 + }, + { + "epoch": 1.49, + "learning_rate": 0.0001516870656856109, + "loss": 1.5035, + "step": 18927 + }, + { + "epoch": 1.49, + "learning_rate": 0.0001516747067454981, + "loss": 1.5538, + "step": 18928 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015166234779401494, + "loss": 1.5652, + "step": 18929 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015164998883124536, + "loss": 1.5341, + "step": 18930 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015163762985727323, + "loss": 1.5379, + "step": 18931 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015162527087218253, + "loss": 1.5028, + "step": 18932 + }, + { + "epoch": 1.49, + "learning_rate": 0.0001516129118760571, + "loss": 1.5142, + "step": 18933 + }, + { + "epoch": 1.49, + "learning_rate": 0.0001516005528689809, + "loss": 1.5404, + "step": 18934 + }, + { + "epoch": 1.49, + "learning_rate": 0.0001515881938510379, + "loss": 1.5811, + "step": 18935 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015157583482231185, + "loss": 1.4957, + "step": 18936 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015156347578288682, + "loss": 1.447, + "step": 18937 + }, + { + "epoch": 1.49, + "learning_rate": 0.0001515511167328466, + "loss": 1.5872, + "step": 18938 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015153875767227515, + "loss": 1.5817, + "step": 18939 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015152639860125644, + "loss": 1.5095, + "step": 18940 + }, + { + "epoch": 1.49, + "learning_rate": 0.0001515140395198743, + "loss": 1.4815, + "step": 18941 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015150168042821265, + "loss": 1.5278, + "step": 18942 + }, + { + "epoch": 1.49, + "learning_rate": 0.0001514893213263554, + "loss": 1.5138, + "step": 18943 + }, + { + "epoch": 1.49, + "learning_rate": 0.0001514769622143865, + "loss": 1.5037, + "step": 18944 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015146460309238988, + "loss": 1.5074, + "step": 18945 + }, + { + "epoch": 1.49, + "learning_rate": 0.0001514522439604494, + "loss": 1.4646, + "step": 18946 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015143988481864897, + "loss": 1.5085, + "step": 18947 + }, + { + "epoch": 1.49, + "learning_rate": 0.0001514275256670725, + "loss": 1.55, + "step": 18948 + }, + { + "epoch": 1.49, + "learning_rate": 0.0001514151665058039, + "loss": 1.5217, + "step": 18949 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015140280733492713, + "loss": 1.5216, + "step": 18950 + }, + { + "epoch": 1.49, + "learning_rate": 0.0001513904481545261, + "loss": 1.5041, + "step": 18951 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015137808896468469, + "loss": 1.485, + "step": 18952 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015136572976548677, + "loss": 1.5367, + "step": 18953 + }, + { + "epoch": 1.49, + "learning_rate": 0.0001513533705570163, + "loss": 1.5191, + "step": 18954 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015134101133935726, + "loss": 1.5704, + "step": 18955 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015132865211259342, + "loss": 1.4991, + "step": 18956 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015131629287680882, + "loss": 1.5054, + "step": 18957 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015130393363208726, + "loss": 1.506, + "step": 18958 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015129157437851278, + "loss": 1.4986, + "step": 18959 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015127921511616914, + "loss": 1.5231, + "step": 18960 + }, + { + "epoch": 1.49, + "learning_rate": 0.0001512668558451404, + "loss": 1.4824, + "step": 18961 + }, + { + "epoch": 1.49, + "learning_rate": 0.0001512544965655104, + "loss": 1.5252, + "step": 18962 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015124213727736303, + "loss": 1.4634, + "step": 18963 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015122977798078227, + "loss": 1.4874, + "step": 18964 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015121741867585198, + "loss": 1.5231, + "step": 18965 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015120505936265608, + "loss": 1.5015, + "step": 18966 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015119270004127847, + "loss": 1.5545, + "step": 18967 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015118034071180312, + "loss": 1.5378, + "step": 18968 + }, + { + "epoch": 1.49, + "learning_rate": 0.0001511679813743139, + "loss": 1.5439, + "step": 18969 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015115562202889474, + "loss": 1.4786, + "step": 18970 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015114326267562952, + "loss": 1.508, + "step": 18971 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015113090331460223, + "loss": 1.5631, + "step": 18972 + }, + { + "epoch": 1.49, + "learning_rate": 0.0001511185439458967, + "loss": 1.4882, + "step": 18973 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015110618456959686, + "loss": 1.5879, + "step": 18974 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015109382518578663, + "loss": 1.5319, + "step": 18975 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015108146579454997, + "loss": 1.5107, + "step": 18976 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015106910639597074, + "loss": 1.5428, + "step": 18977 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015105674699013283, + "loss": 1.4833, + "step": 18978 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015104438757712022, + "loss": 1.5184, + "step": 18979 + }, + { + "epoch": 1.49, + "learning_rate": 0.0001510320281570168, + "loss": 1.517, + "step": 18980 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015101966872990648, + "loss": 1.4944, + "step": 18981 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015100730929587313, + "loss": 1.5305, + "step": 18982 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015099494985500075, + "loss": 1.4759, + "step": 18983 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015098259040737322, + "loss": 1.5025, + "step": 18984 + }, + { + "epoch": 1.49, + "learning_rate": 0.0001509702309530744, + "loss": 1.5579, + "step": 18985 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015095787149218832, + "loss": 1.5226, + "step": 18986 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015094551202479874, + "loss": 1.5273, + "step": 18987 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015093315255098968, + "loss": 1.4878, + "step": 18988 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015092079307084502, + "loss": 1.4995, + "step": 18989 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015090843358444867, + "loss": 1.4746, + "step": 18990 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015089607409188465, + "loss": 1.5024, + "step": 18991 + }, + { + "epoch": 1.49, + "learning_rate": 0.0001508837145932367, + "loss": 1.5319, + "step": 18992 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015087135508858886, + "loss": 1.5242, + "step": 18993 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015085899557802497, + "loss": 1.528, + "step": 18994 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015084663606162896, + "loss": 1.519, + "step": 18995 + }, + { + "epoch": 1.49, + "learning_rate": 0.0001508342765394848, + "loss": 1.5544, + "step": 18996 + }, + { + "epoch": 1.49, + "learning_rate": 0.0001508219170116763, + "loss": 1.6043, + "step": 18997 + }, + { + "epoch": 1.49, + "learning_rate": 0.0001508095574782875, + "loss": 1.5623, + "step": 18998 + }, + { + "epoch": 1.49, + "learning_rate": 0.00015079719793940221, + "loss": 1.525, + "step": 18999 + }, + { + "epoch": 1.49, + "learning_rate": 0.0001507848383951044, + "loss": 1.5038, + "step": 19000 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015077247884547797, + "loss": 1.5071, + "step": 19001 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015076011929060683, + "loss": 1.5283, + "step": 19002 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015074775973057493, + "loss": 1.4588, + "step": 19003 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015073540016546612, + "loss": 1.5523, + "step": 19004 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015072304059536435, + "loss": 1.5246, + "step": 19005 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015071068102035355, + "loss": 1.5534, + "step": 19006 + }, + { + "epoch": 1.5, + "learning_rate": 0.0001506983214405176, + "loss": 1.4636, + "step": 19007 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015068596185594047, + "loss": 1.5091, + "step": 19008 + }, + { + "epoch": 1.5, + "learning_rate": 0.000150673602266706, + "loss": 1.5022, + "step": 19009 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015066124267289817, + "loss": 1.5276, + "step": 19010 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015064888307460086, + "loss": 1.5316, + "step": 19011 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015063652347189796, + "loss": 1.5045, + "step": 19012 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015062416386487344, + "loss": 1.4937, + "step": 19013 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015061180425361118, + "loss": 1.5083, + "step": 19014 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015059944463819515, + "loss": 1.4937, + "step": 19015 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015058708501870918, + "loss": 1.5263, + "step": 19016 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015057472539523723, + "loss": 1.4435, + "step": 19017 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015056236576786324, + "loss": 1.544, + "step": 19018 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015055000613667106, + "loss": 1.5399, + "step": 19019 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015053764650174468, + "loss": 1.5196, + "step": 19020 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015052528686316792, + "loss": 1.5137, + "step": 19021 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015051292722102476, + "loss": 1.5155, + "step": 19022 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015050056757539917, + "loss": 1.5595, + "step": 19023 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015048820792637498, + "loss": 1.4853, + "step": 19024 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015047584827403612, + "loss": 1.5101, + "step": 19025 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015046348861846647, + "loss": 1.4827, + "step": 19026 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015045112895975, + "loss": 1.5008, + "step": 19027 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015043876929797068, + "loss": 1.4316, + "step": 19028 + }, + { + "epoch": 1.5, + "learning_rate": 0.0001504264096332123, + "loss": 1.4498, + "step": 19029 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015041404996555887, + "loss": 1.5157, + "step": 19030 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015040169029509424, + "loss": 1.5331, + "step": 19031 + }, + { + "epoch": 1.5, + "learning_rate": 0.0001503893306219024, + "loss": 1.5468, + "step": 19032 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015037697094606717, + "loss": 1.5189, + "step": 19033 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015036461126767252, + "loss": 1.476, + "step": 19034 + }, + { + "epoch": 1.5, + "learning_rate": 0.0001503522515868024, + "loss": 1.5774, + "step": 19035 + }, + { + "epoch": 1.5, + "learning_rate": 0.0001503398919035406, + "loss": 1.4961, + "step": 19036 + }, + { + "epoch": 1.5, + "learning_rate": 0.0001503275322179712, + "loss": 1.5175, + "step": 19037 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015031517253017798, + "loss": 1.5397, + "step": 19038 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015030281284024495, + "loss": 1.5105, + "step": 19039 + }, + { + "epoch": 1.5, + "learning_rate": 0.000150290453148256, + "loss": 1.4931, + "step": 19040 + }, + { + "epoch": 1.5, + "learning_rate": 0.000150278093454295, + "loss": 1.4824, + "step": 19041 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015026573375844597, + "loss": 1.4967, + "step": 19042 + }, + { + "epoch": 1.5, + "learning_rate": 0.0001502533740607927, + "loss": 1.4956, + "step": 19043 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015024101436141916, + "loss": 1.5657, + "step": 19044 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015022865466040924, + "loss": 1.5218, + "step": 19045 + }, + { + "epoch": 1.5, + "learning_rate": 0.0001502162949578469, + "loss": 1.5274, + "step": 19046 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015020393525381608, + "loss": 1.5312, + "step": 19047 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015019157554840062, + "loss": 1.5989, + "step": 19048 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015017921584168446, + "loss": 1.566, + "step": 19049 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015016685613375154, + "loss": 1.5108, + "step": 19050 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015015449642468573, + "loss": 1.5426, + "step": 19051 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015014213671457098, + "loss": 1.4715, + "step": 19052 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015012977700349118, + "loss": 1.5303, + "step": 19053 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015011741729153036, + "loss": 1.5107, + "step": 19054 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015010505757877225, + "loss": 1.4993, + "step": 19055 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015009269786530086, + "loss": 1.5484, + "step": 19056 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015008033815120016, + "loss": 1.5363, + "step": 19057 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015006797843655396, + "loss": 1.5065, + "step": 19058 + }, + { + "epoch": 1.5, + "learning_rate": 0.0001500556187214463, + "loss": 1.5283, + "step": 19059 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015004325900596087, + "loss": 1.4938, + "step": 19060 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015003089929018187, + "loss": 1.4865, + "step": 19061 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015001853957419302, + "loss": 1.5632, + "step": 19062 + }, + { + "epoch": 1.5, + "learning_rate": 0.00015000617985807833, + "loss": 1.4762, + "step": 19063 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014999382014192167, + "loss": 1.5393, + "step": 19064 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014998146042580695, + "loss": 1.4436, + "step": 19065 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014996910070981813, + "loss": 1.5043, + "step": 19066 + }, + { + "epoch": 1.5, + "learning_rate": 0.0001499567409940391, + "loss": 1.5417, + "step": 19067 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014994438127855376, + "loss": 1.5541, + "step": 19068 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014993202156344604, + "loss": 1.5034, + "step": 19069 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014991966184879984, + "loss": 1.5224, + "step": 19070 + }, + { + "epoch": 1.5, + "learning_rate": 0.0001499073021346991, + "loss": 1.4906, + "step": 19071 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014989494242122772, + "loss": 1.5738, + "step": 19072 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014988258270846966, + "loss": 1.5579, + "step": 19073 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014987022299650876, + "loss": 1.4705, + "step": 19074 + }, + { + "epoch": 1.5, + "learning_rate": 0.000149857863285429, + "loss": 1.4954, + "step": 19075 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014984550357531427, + "loss": 1.4792, + "step": 19076 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014983314386624846, + "loss": 1.5894, + "step": 19077 + }, + { + "epoch": 1.5, + "learning_rate": 0.0001498207841583155, + "loss": 1.5433, + "step": 19078 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014980842445159938, + "loss": 1.5369, + "step": 19079 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014979606474618392, + "loss": 1.5648, + "step": 19080 + }, + { + "epoch": 1.5, + "learning_rate": 0.0001497837050421531, + "loss": 1.5249, + "step": 19081 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014977134533959073, + "loss": 1.5014, + "step": 19082 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014975898563858084, + "loss": 1.4575, + "step": 19083 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014974662593920734, + "loss": 1.5474, + "step": 19084 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014973426624155406, + "loss": 1.4691, + "step": 19085 + }, + { + "epoch": 1.5, + "learning_rate": 0.000149721906545705, + "loss": 1.5073, + "step": 19086 + }, + { + "epoch": 1.5, + "learning_rate": 0.000149709546851744, + "loss": 1.5603, + "step": 19087 + }, + { + "epoch": 1.5, + "learning_rate": 0.000149697187159755, + "loss": 1.5277, + "step": 19088 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014968482746982196, + "loss": 1.4673, + "step": 19089 + }, + { + "epoch": 1.5, + "learning_rate": 0.0001496724677820288, + "loss": 1.5117, + "step": 19090 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014966010809645936, + "loss": 1.5687, + "step": 19091 + }, + { + "epoch": 1.5, + "learning_rate": 0.0001496477484131976, + "loss": 1.5106, + "step": 19092 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014963538873232748, + "loss": 1.5254, + "step": 19093 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014962302905393283, + "loss": 1.5328, + "step": 19094 + }, + { + "epoch": 1.5, + "learning_rate": 0.0001496106693780976, + "loss": 1.5293, + "step": 19095 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014959830970490576, + "loss": 1.5527, + "step": 19096 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014958595003444113, + "loss": 1.5232, + "step": 19097 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014957359036678772, + "loss": 1.5201, + "step": 19098 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014956123070202933, + "loss": 1.5963, + "step": 19099 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014954887104024996, + "loss": 1.5726, + "step": 19100 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014953651138153353, + "loss": 1.5161, + "step": 19101 + }, + { + "epoch": 1.5, + "learning_rate": 0.0001495241517259639, + "loss": 1.5194, + "step": 19102 + }, + { + "epoch": 1.5, + "learning_rate": 0.000149511792073625, + "loss": 1.5298, + "step": 19103 + }, + { + "epoch": 1.5, + "learning_rate": 0.0001494994324246008, + "loss": 1.4467, + "step": 19104 + }, + { + "epoch": 1.5, + "learning_rate": 0.0001494870727789752, + "loss": 1.5118, + "step": 19105 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014947471313683203, + "loss": 1.5502, + "step": 19106 + }, + { + "epoch": 1.5, + "learning_rate": 0.0001494623534982553, + "loss": 1.5393, + "step": 19107 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014944999386332891, + "loss": 1.5207, + "step": 19108 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014943763423213677, + "loss": 1.5014, + "step": 19109 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014942527460476277, + "loss": 1.5075, + "step": 19110 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014941291498129082, + "loss": 1.4759, + "step": 19111 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014940055536180486, + "loss": 1.52, + "step": 19112 + }, + { + "epoch": 1.5, + "learning_rate": 0.0001493881957463888, + "loss": 1.4968, + "step": 19113 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014937583613512656, + "loss": 1.4925, + "step": 19114 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014936347652810207, + "loss": 1.4879, + "step": 19115 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014935111692539917, + "loss": 1.5341, + "step": 19116 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014933875732710185, + "loss": 1.5129, + "step": 19117 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014932639773329403, + "loss": 1.5083, + "step": 19118 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014931403814405953, + "loss": 1.511, + "step": 19119 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014930167855948235, + "loss": 1.4676, + "step": 19120 + }, + { + "epoch": 1.5, + "learning_rate": 0.0001492893189796464, + "loss": 1.5101, + "step": 19121 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014927695940463562, + "loss": 1.5244, + "step": 19122 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014926459983453385, + "loss": 1.5912, + "step": 19123 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014925224026942504, + "loss": 1.5083, + "step": 19124 + }, + { + "epoch": 1.5, + "learning_rate": 0.00014923988070939315, + "loss": 1.4873, + "step": 19125 + }, + { + "epoch": 1.5, + "learning_rate": 0.000149227521154522, + "loss": 1.4708, + "step": 19126 + }, + { + "epoch": 1.5, + "learning_rate": 0.0001492151616048956, + "loss": 1.4841, + "step": 19127 + }, + { + "epoch": 1.51, + "learning_rate": 0.0001492028020605978, + "loss": 1.4726, + "step": 19128 + }, + { + "epoch": 1.51, + "learning_rate": 0.0001491904425217125, + "loss": 1.5169, + "step": 19129 + }, + { + "epoch": 1.51, + "learning_rate": 0.0001491780829883237, + "loss": 1.5283, + "step": 19130 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014916572346051522, + "loss": 1.5387, + "step": 19131 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014915336393837107, + "loss": 1.4836, + "step": 19132 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014914100442197506, + "loss": 1.4332, + "step": 19133 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014912864491141117, + "loss": 1.5575, + "step": 19134 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014911628540676327, + "loss": 1.533, + "step": 19135 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014910392590811533, + "loss": 1.5375, + "step": 19136 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014909156641555125, + "loss": 1.5596, + "step": 19137 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014907920692915492, + "loss": 1.4701, + "step": 19138 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014906684744901032, + "loss": 1.5552, + "step": 19139 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014905448797520123, + "loss": 1.5314, + "step": 19140 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014904212850781168, + "loss": 1.4894, + "step": 19141 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014902976904692557, + "loss": 1.4592, + "step": 19142 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014901740959262678, + "loss": 1.4919, + "step": 19143 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014900505014499925, + "loss": 1.492, + "step": 19144 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014899269070412687, + "loss": 1.4822, + "step": 19145 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014898033127009352, + "loss": 1.5344, + "step": 19146 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014896797184298322, + "loss": 1.5053, + "step": 19147 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014895561242287978, + "loss": 1.5347, + "step": 19148 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014894325300986717, + "loss": 1.5243, + "step": 19149 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014893089360402923, + "loss": 1.5139, + "step": 19150 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014891853420545003, + "loss": 1.5446, + "step": 19151 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014890617481421334, + "loss": 1.5624, + "step": 19152 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014889381543040312, + "loss": 1.4794, + "step": 19153 + }, + { + "epoch": 1.51, + "learning_rate": 0.0001488814560541033, + "loss": 1.5487, + "step": 19154 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014886909668539777, + "loss": 1.5252, + "step": 19155 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014885673732437045, + "loss": 1.5019, + "step": 19156 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014884437797110523, + "loss": 1.5469, + "step": 19157 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014883201862568606, + "loss": 1.5409, + "step": 19158 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014881965928819686, + "loss": 1.5194, + "step": 19159 + }, + { + "epoch": 1.51, + "learning_rate": 0.0001488072999587215, + "loss": 1.507, + "step": 19160 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014879494063734392, + "loss": 1.5462, + "step": 19161 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014878258132414803, + "loss": 1.5149, + "step": 19162 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014877022201921776, + "loss": 1.577, + "step": 19163 + }, + { + "epoch": 1.51, + "learning_rate": 0.000148757862722637, + "loss": 1.4926, + "step": 19164 + }, + { + "epoch": 1.51, + "learning_rate": 0.0001487455034344896, + "loss": 1.531, + "step": 19165 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014873314415485959, + "loss": 1.4956, + "step": 19166 + }, + { + "epoch": 1.51, + "learning_rate": 0.0001487207848838308, + "loss": 1.5054, + "step": 19167 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014870842562148725, + "loss": 1.5222, + "step": 19168 + }, + { + "epoch": 1.51, + "learning_rate": 0.0001486960663679127, + "loss": 1.5355, + "step": 19169 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014868370712319118, + "loss": 1.5226, + "step": 19170 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014867134788740656, + "loss": 1.5365, + "step": 19171 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014865898866064275, + "loss": 1.5105, + "step": 19172 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014864662944298368, + "loss": 1.5059, + "step": 19173 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014863427023451323, + "loss": 1.4926, + "step": 19174 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014862191103531532, + "loss": 1.5041, + "step": 19175 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014860955184547393, + "loss": 1.5072, + "step": 19176 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014859719266507285, + "loss": 1.5365, + "step": 19177 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014858483349419608, + "loss": 1.4891, + "step": 19178 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014857247433292754, + "loss": 1.5268, + "step": 19179 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014856011518135106, + "loss": 1.4437, + "step": 19180 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014854775603955067, + "loss": 1.5358, + "step": 19181 + }, + { + "epoch": 1.51, + "learning_rate": 0.0001485353969076101, + "loss": 1.4884, + "step": 19182 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014852303778561347, + "loss": 1.4835, + "step": 19183 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014851067867364454, + "loss": 1.5472, + "step": 19184 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014849831957178735, + "loss": 1.5336, + "step": 19185 + }, + { + "epoch": 1.51, + "learning_rate": 0.0001484859604801257, + "loss": 1.4988, + "step": 19186 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014847360139874354, + "loss": 1.4776, + "step": 19187 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014846124232772482, + "loss": 1.493, + "step": 19188 + }, + { + "epoch": 1.51, + "learning_rate": 0.0001484488832671534, + "loss": 1.5501, + "step": 19189 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014843652421711319, + "loss": 1.5174, + "step": 19190 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014842416517768815, + "loss": 1.5283, + "step": 19191 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014841180614896213, + "loss": 1.5175, + "step": 19192 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014839944713101907, + "loss": 1.4995, + "step": 19193 + }, + { + "epoch": 1.51, + "learning_rate": 0.0001483870881239429, + "loss": 1.5643, + "step": 19194 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014837472912781748, + "loss": 1.4743, + "step": 19195 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014836237014272677, + "loss": 1.5414, + "step": 19196 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014835001116875467, + "loss": 1.5139, + "step": 19197 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014833765220598503, + "loss": 1.5306, + "step": 19198 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014832529325450186, + "loss": 1.4989, + "step": 19199 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014831293431438904, + "loss": 1.5241, + "step": 19200 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014830057538573046, + "loss": 1.4655, + "step": 19201 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014828821646861005, + "loss": 1.4918, + "step": 19202 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014827585756311165, + "loss": 1.4984, + "step": 19203 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014826349866931926, + "loss": 1.5195, + "step": 19204 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014825113978731677, + "loss": 1.4935, + "step": 19205 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014823878091718804, + "loss": 1.4868, + "step": 19206 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014822642205901702, + "loss": 1.5009, + "step": 19207 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014821406321288767, + "loss": 1.4405, + "step": 19208 + }, + { + "epoch": 1.51, + "learning_rate": 0.0001482017043788838, + "loss": 1.4808, + "step": 19209 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014818934555708939, + "loss": 1.4688, + "step": 19210 + }, + { + "epoch": 1.51, + "learning_rate": 0.0001481769867475883, + "loss": 1.5277, + "step": 19211 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014816462795046444, + "loss": 1.5727, + "step": 19212 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014815226916580174, + "loss": 1.4937, + "step": 19213 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014813991039368417, + "loss": 1.5568, + "step": 19214 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014812755163419553, + "loss": 1.4794, + "step": 19215 + }, + { + "epoch": 1.51, + "learning_rate": 0.0001481151928874198, + "loss": 1.5165, + "step": 19216 + }, + { + "epoch": 1.51, + "learning_rate": 0.0001481028341534409, + "loss": 1.4444, + "step": 19217 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014809047543234266, + "loss": 1.5378, + "step": 19218 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014807811672420908, + "loss": 1.5018, + "step": 19219 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014806575802912402, + "loss": 1.5448, + "step": 19220 + }, + { + "epoch": 1.51, + "learning_rate": 0.0001480533993471714, + "loss": 1.5247, + "step": 19221 + }, + { + "epoch": 1.51, + "learning_rate": 0.0001480410406784351, + "loss": 1.5079, + "step": 19222 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014802868202299906, + "loss": 1.4962, + "step": 19223 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014801632338094718, + "loss": 1.519, + "step": 19224 + }, + { + "epoch": 1.51, + "learning_rate": 0.0001480039647523634, + "loss": 1.5178, + "step": 19225 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014799160613733156, + "loss": 1.4873, + "step": 19226 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014797924753593567, + "loss": 1.5156, + "step": 19227 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014796688894825948, + "loss": 1.5124, + "step": 19228 + }, + { + "epoch": 1.51, + "learning_rate": 0.000147954530374387, + "loss": 1.5229, + "step": 19229 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014794217181440214, + "loss": 1.4696, + "step": 19230 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014792981326838887, + "loss": 1.4845, + "step": 19231 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014791745473643095, + "loss": 1.5048, + "step": 19232 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014790509621861238, + "loss": 1.5185, + "step": 19233 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014789273771501708, + "loss": 1.5265, + "step": 19234 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014788037922572892, + "loss": 1.5154, + "step": 19235 + }, + { + "epoch": 1.51, + "learning_rate": 0.0001478680207508318, + "loss": 1.4914, + "step": 19236 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014785566229040965, + "loss": 1.5218, + "step": 19237 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014784330384454638, + "loss": 1.498, + "step": 19238 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014783094541332589, + "loss": 1.5644, + "step": 19239 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014781858699683206, + "loss": 1.5206, + "step": 19240 + }, + { + "epoch": 1.51, + "learning_rate": 0.0001478062285951488, + "loss": 1.5163, + "step": 19241 + }, + { + "epoch": 1.51, + "learning_rate": 0.0001477938702083601, + "loss": 1.5009, + "step": 19242 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014778151183654975, + "loss": 1.5026, + "step": 19243 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014776915347980177, + "loss": 1.5052, + "step": 19244 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014775679513819988, + "loss": 1.496, + "step": 19245 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014774443681182822, + "loss": 1.5205, + "step": 19246 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014773207850077056, + "loss": 1.5537, + "step": 19247 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014771972020511084, + "loss": 1.5181, + "step": 19248 + }, + { + "epoch": 1.51, + "learning_rate": 0.000147707361924933, + "loss": 1.5346, + "step": 19249 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014769500366032084, + "loss": 1.4899, + "step": 19250 + }, + { + "epoch": 1.51, + "learning_rate": 0.0001476826454113584, + "loss": 1.459, + "step": 19251 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014767028717812948, + "loss": 1.4946, + "step": 19252 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014765792896071801, + "loss": 1.4695, + "step": 19253 + }, + { + "epoch": 1.51, + "learning_rate": 0.00014764557075920795, + "loss": 1.4942, + "step": 19254 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014763321257368314, + "loss": 1.51, + "step": 19255 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014762085440422754, + "loss": 1.4939, + "step": 19256 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014760849625092498, + "loss": 1.4581, + "step": 19257 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014759613811385943, + "loss": 1.4912, + "step": 19258 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014758377999311481, + "loss": 1.4984, + "step": 19259 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014757142188877485, + "loss": 1.5233, + "step": 19260 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014755906380092373, + "loss": 1.5208, + "step": 19261 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014754670572964521, + "loss": 1.5007, + "step": 19262 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014753434767502318, + "loss": 1.505, + "step": 19263 + }, + { + "epoch": 1.52, + "learning_rate": 0.0001475219896371416, + "loss": 1.5252, + "step": 19264 + }, + { + "epoch": 1.52, + "learning_rate": 0.0001475096316160843, + "loss": 1.546, + "step": 19265 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014749727361193526, + "loss": 1.5275, + "step": 19266 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014748491562477833, + "loss": 1.5313, + "step": 19267 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014747255765469746, + "loss": 1.5362, + "step": 19268 + }, + { + "epoch": 1.52, + "learning_rate": 0.0001474601997017765, + "loss": 1.5168, + "step": 19269 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014744784176609938, + "loss": 1.5132, + "step": 19270 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014743548384775005, + "loss": 1.5989, + "step": 19271 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014742312594681232, + "loss": 1.5675, + "step": 19272 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014741076806337015, + "loss": 1.4883, + "step": 19273 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014739841019750747, + "loss": 1.4992, + "step": 19274 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014738605234930813, + "loss": 1.5505, + "step": 19275 + }, + { + "epoch": 1.52, + "learning_rate": 0.000147373694518856, + "loss": 1.5171, + "step": 19276 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014736133670623506, + "loss": 1.5194, + "step": 19277 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014734897891152923, + "loss": 1.5397, + "step": 19278 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014733662113482234, + "loss": 1.4948, + "step": 19279 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014732426337619835, + "loss": 1.5299, + "step": 19280 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014731190563574114, + "loss": 1.5726, + "step": 19281 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014729954791353454, + "loss": 1.5433, + "step": 19282 + }, + { + "epoch": 1.52, + "learning_rate": 0.0001472871902096626, + "loss": 1.4741, + "step": 19283 + }, + { + "epoch": 1.52, + "learning_rate": 0.0001472748325242091, + "loss": 1.4551, + "step": 19284 + }, + { + "epoch": 1.52, + "learning_rate": 0.000147262474857258, + "loss": 1.5103, + "step": 19285 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014725011720889317, + "loss": 1.5102, + "step": 19286 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014723775957919852, + "loss": 1.5113, + "step": 19287 + }, + { + "epoch": 1.52, + "learning_rate": 0.000147225401968258, + "loss": 1.5138, + "step": 19288 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014721304437615543, + "loss": 1.5266, + "step": 19289 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014720068680297476, + "loss": 1.5156, + "step": 19290 + }, + { + "epoch": 1.52, + "learning_rate": 0.0001471883292487999, + "loss": 1.5229, + "step": 19291 + }, + { + "epoch": 1.52, + "learning_rate": 0.0001471759717137147, + "loss": 1.5307, + "step": 19292 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014716361419780306, + "loss": 1.4993, + "step": 19293 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014715125670114896, + "loss": 1.5122, + "step": 19294 + }, + { + "epoch": 1.52, + "learning_rate": 0.0001471388992238363, + "loss": 1.5311, + "step": 19295 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014712654176594886, + "loss": 1.5254, + "step": 19296 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014711418432757068, + "loss": 1.491, + "step": 19297 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014710182690878554, + "loss": 1.4971, + "step": 19298 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014708946950967743, + "loss": 1.5046, + "step": 19299 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014707711213033024, + "loss": 1.478, + "step": 19300 + }, + { + "epoch": 1.52, + "learning_rate": 0.0001470647547708278, + "loss": 1.5194, + "step": 19301 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014705239743125406, + "loss": 1.5639, + "step": 19302 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014704004011169294, + "loss": 1.5081, + "step": 19303 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014702768281222827, + "loss": 1.5523, + "step": 19304 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014701532553294404, + "loss": 1.4986, + "step": 19305 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014700296827392407, + "loss": 1.5124, + "step": 19306 + }, + { + "epoch": 1.52, + "learning_rate": 0.0001469906110352523, + "loss": 1.4979, + "step": 19307 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014697825381701257, + "loss": 1.4556, + "step": 19308 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014696589661928892, + "loss": 1.5228, + "step": 19309 + }, + { + "epoch": 1.52, + "learning_rate": 0.0001469535394421651, + "loss": 1.4751, + "step": 19310 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014694118228572508, + "loss": 1.4955, + "step": 19311 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014692882515005278, + "loss": 1.5584, + "step": 19312 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014691646803523202, + "loss": 1.4896, + "step": 19313 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014690411094134677, + "loss": 1.4632, + "step": 19314 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014689175386848087, + "loss": 1.5399, + "step": 19315 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014687939681671825, + "loss": 1.54, + "step": 19316 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014686703978614285, + "loss": 1.5021, + "step": 19317 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014685468277683846, + "loss": 1.5261, + "step": 19318 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014684232578888906, + "loss": 1.5416, + "step": 19319 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014682996882237856, + "loss": 1.5642, + "step": 19320 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014681761187739078, + "loss": 1.4934, + "step": 19321 + }, + { + "epoch": 1.52, + "learning_rate": 0.0001468052549540097, + "loss": 1.5684, + "step": 19322 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014679289805231906, + "loss": 1.5028, + "step": 19323 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014678054117240295, + "loss": 1.4795, + "step": 19324 + }, + { + "epoch": 1.52, + "learning_rate": 0.0001467681843143452, + "loss": 1.4773, + "step": 19325 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014675582747822972, + "loss": 1.5175, + "step": 19326 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014674347066414033, + "loss": 1.5307, + "step": 19327 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014673111387216098, + "loss": 1.4626, + "step": 19328 + }, + { + "epoch": 1.52, + "learning_rate": 0.0001467187571023756, + "loss": 1.5125, + "step": 19329 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014670640035486802, + "loss": 1.5055, + "step": 19330 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014669404362972218, + "loss": 1.5252, + "step": 19331 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014668168692702198, + "loss": 1.4882, + "step": 19332 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014666933024685126, + "loss": 1.5149, + "step": 19333 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014665697358929396, + "loss": 1.5285, + "step": 19334 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014664461695443397, + "loss": 1.4891, + "step": 19335 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014663226034235515, + "loss": 1.5544, + "step": 19336 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014661990375314148, + "loss": 1.4946, + "step": 19337 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014660754718687674, + "loss": 1.5204, + "step": 19338 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014659519064364487, + "loss": 1.5391, + "step": 19339 + }, + { + "epoch": 1.52, + "learning_rate": 0.0001465828341235298, + "loss": 1.5304, + "step": 19340 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014657047762661542, + "loss": 1.5734, + "step": 19341 + }, + { + "epoch": 1.52, + "learning_rate": 0.0001465581211529856, + "loss": 1.4996, + "step": 19342 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014654576470272425, + "loss": 1.5212, + "step": 19343 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014653340827591523, + "loss": 1.5265, + "step": 19344 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014652105187264245, + "loss": 1.5134, + "step": 19345 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014650869549298983, + "loss": 1.5314, + "step": 19346 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014649633913704123, + "loss": 1.5408, + "step": 19347 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014648398280488054, + "loss": 1.4926, + "step": 19348 + }, + { + "epoch": 1.52, + "learning_rate": 0.0001464716264965917, + "loss": 1.5472, + "step": 19349 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014645927021225856, + "loss": 1.5159, + "step": 19350 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014644691395196503, + "loss": 1.5199, + "step": 19351 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014643455771579496, + "loss": 1.618, + "step": 19352 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014642220150383229, + "loss": 1.4983, + "step": 19353 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014640984531616091, + "loss": 1.5274, + "step": 19354 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014639748915286463, + "loss": 1.5445, + "step": 19355 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014638513301402746, + "loss": 1.4645, + "step": 19356 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014637277689973324, + "loss": 1.5673, + "step": 19357 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014636042081006589, + "loss": 1.4919, + "step": 19358 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014634806474510926, + "loss": 1.5069, + "step": 19359 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014633570870494723, + "loss": 1.5499, + "step": 19360 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014632335268966376, + "loss": 1.5259, + "step": 19361 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014631099669934266, + "loss": 1.4573, + "step": 19362 + }, + { + "epoch": 1.52, + "learning_rate": 0.0001462986407340679, + "loss": 1.505, + "step": 19363 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014628628479392328, + "loss": 1.4669, + "step": 19364 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014627392887899275, + "loss": 1.4977, + "step": 19365 + }, + { + "epoch": 1.52, + "learning_rate": 0.0001462615729893602, + "loss": 1.5501, + "step": 19366 + }, + { + "epoch": 1.52, + "learning_rate": 0.0001462492171251095, + "loss": 1.5148, + "step": 19367 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014623686128632457, + "loss": 1.524, + "step": 19368 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014622450547308922, + "loss": 1.5084, + "step": 19369 + }, + { + "epoch": 1.52, + "learning_rate": 0.0001462121496854874, + "loss": 1.485, + "step": 19370 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014619979392360298, + "loss": 1.4842, + "step": 19371 + }, + { + "epoch": 1.52, + "learning_rate": 0.0001461874381875199, + "loss": 1.5668, + "step": 19372 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014617508247732203, + "loss": 1.4685, + "step": 19373 + }, + { + "epoch": 1.52, + "learning_rate": 0.0001461627267930932, + "loss": 1.4755, + "step": 19374 + }, + { + "epoch": 1.52, + "learning_rate": 0.0001461503711349174, + "loss": 1.4851, + "step": 19375 + }, + { + "epoch": 1.52, + "learning_rate": 0.0001461380155028784, + "loss": 1.489, + "step": 19376 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014612565989706013, + "loss": 1.5194, + "step": 19377 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014611330431754655, + "loss": 1.5211, + "step": 19378 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014610094876442144, + "loss": 1.5376, + "step": 19379 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014608859323776875, + "loss": 1.56, + "step": 19380 + }, + { + "epoch": 1.52, + "learning_rate": 0.00014607623773767235, + "loss": 1.5038, + "step": 19381 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014606388226421615, + "loss": 1.5149, + "step": 19382 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014605152681748402, + "loss": 1.4958, + "step": 19383 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014603917139755982, + "loss": 1.4601, + "step": 19384 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014602681600452746, + "loss": 1.5464, + "step": 19385 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014601446063847078, + "loss": 1.5338, + "step": 19386 + }, + { + "epoch": 1.53, + "learning_rate": 0.0001460021052994738, + "loss": 1.5711, + "step": 19387 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014598974998762025, + "loss": 1.4817, + "step": 19388 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014597739470299413, + "loss": 1.5122, + "step": 19389 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014596503944567927, + "loss": 1.5668, + "step": 19390 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014595268421575957, + "loss": 1.5493, + "step": 19391 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014594032901331892, + "loss": 1.5447, + "step": 19392 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014592797383844116, + "loss": 1.4873, + "step": 19393 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014591561869121023, + "loss": 1.5465, + "step": 19394 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014590326357171002, + "loss": 1.5707, + "step": 19395 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014589090848002434, + "loss": 1.5484, + "step": 19396 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014587855341623718, + "loss": 1.5795, + "step": 19397 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014586619838043234, + "loss": 1.4819, + "step": 19398 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014585384337269372, + "loss": 1.5595, + "step": 19399 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014584148839310524, + "loss": 1.5355, + "step": 19400 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014582913344175075, + "loss": 1.4462, + "step": 19401 + }, + { + "epoch": 1.53, + "learning_rate": 0.0001458167785187141, + "loss": 1.5831, + "step": 19402 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014580442362407923, + "loss": 1.4851, + "step": 19403 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014579206875793004, + "loss": 1.4435, + "step": 19404 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014577971392035037, + "loss": 1.5055, + "step": 19405 + }, + { + "epoch": 1.53, + "learning_rate": 0.0001457673591114241, + "loss": 1.4851, + "step": 19406 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014575500433123515, + "loss": 1.533, + "step": 19407 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014574264957986735, + "loss": 1.4826, + "step": 19408 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014573029485740466, + "loss": 1.557, + "step": 19409 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014571794016393088, + "loss": 1.5149, + "step": 19410 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014570558549952992, + "loss": 1.4848, + "step": 19411 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014569323086428569, + "loss": 1.5023, + "step": 19412 + }, + { + "epoch": 1.53, + "learning_rate": 0.000145680876258282, + "loss": 1.506, + "step": 19413 + }, + { + "epoch": 1.53, + "learning_rate": 0.0001456685216816028, + "loss": 1.4849, + "step": 19414 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014565616713433196, + "loss": 1.4276, + "step": 19415 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014564381261655333, + "loss": 1.4888, + "step": 19416 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014563145812835084, + "loss": 1.545, + "step": 19417 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014561910366980824, + "loss": 1.5595, + "step": 19418 + }, + { + "epoch": 1.53, + "learning_rate": 0.0001456067492410096, + "loss": 1.5172, + "step": 19419 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014559439484203868, + "loss": 1.496, + "step": 19420 + }, + { + "epoch": 1.53, + "learning_rate": 0.0001455820404729794, + "loss": 1.5337, + "step": 19421 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014556968613391565, + "loss": 1.4929, + "step": 19422 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014555733182493124, + "loss": 1.5428, + "step": 19423 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014554497754611014, + "loss": 1.5452, + "step": 19424 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014553262329753614, + "loss": 1.5145, + "step": 19425 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014552026907929322, + "loss": 1.5515, + "step": 19426 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014550791489146515, + "loss": 1.544, + "step": 19427 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014549556073413587, + "loss": 1.5324, + "step": 19428 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014548320660738925, + "loss": 1.4834, + "step": 19429 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014547085251130916, + "loss": 1.5007, + "step": 19430 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014545849844597948, + "loss": 1.4805, + "step": 19431 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014544614441148413, + "loss": 1.4888, + "step": 19432 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014543379040790687, + "loss": 1.4802, + "step": 19433 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014542143643533168, + "loss": 1.4789, + "step": 19434 + }, + { + "epoch": 1.53, + "learning_rate": 0.0001454090824938424, + "loss": 1.4974, + "step": 19435 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014539672858352297, + "loss": 1.5679, + "step": 19436 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014538437470445716, + "loss": 1.48, + "step": 19437 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014537202085672894, + "loss": 1.4508, + "step": 19438 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014535966704042213, + "loss": 1.5347, + "step": 19439 + }, + { + "epoch": 1.53, + "learning_rate": 0.0001453473132556206, + "loss": 1.5714, + "step": 19440 + }, + { + "epoch": 1.53, + "learning_rate": 0.0001453349595024083, + "loss": 1.5006, + "step": 19441 + }, + { + "epoch": 1.53, + "learning_rate": 0.000145322605780869, + "loss": 1.5225, + "step": 19442 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014531025209108662, + "loss": 1.5042, + "step": 19443 + }, + { + "epoch": 1.53, + "learning_rate": 0.0001452978984331451, + "loss": 1.535, + "step": 19444 + }, + { + "epoch": 1.53, + "learning_rate": 0.0001452855448071282, + "loss": 1.5077, + "step": 19445 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014527319121311987, + "loss": 1.5488, + "step": 19446 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014526083765120394, + "loss": 1.4865, + "step": 19447 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014524848412146433, + "loss": 1.5136, + "step": 19448 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014523613062398483, + "loss": 1.5294, + "step": 19449 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014522377715884947, + "loss": 1.5116, + "step": 19450 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014521142372614197, + "loss": 1.4962, + "step": 19451 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014519907032594626, + "loss": 1.5258, + "step": 19452 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014518671695834624, + "loss": 1.4995, + "step": 19453 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014517436362342572, + "loss": 1.5302, + "step": 19454 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014516201032126864, + "loss": 1.4823, + "step": 19455 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014514965705195886, + "loss": 1.5216, + "step": 19456 + }, + { + "epoch": 1.53, + "learning_rate": 0.0001451373038155802, + "loss": 1.5033, + "step": 19457 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014512495061221658, + "loss": 1.5228, + "step": 19458 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014511259744195184, + "loss": 1.535, + "step": 19459 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014510024430486985, + "loss": 1.5845, + "step": 19460 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014508789120105454, + "loss": 1.5116, + "step": 19461 + }, + { + "epoch": 1.53, + "learning_rate": 0.0001450755381305897, + "loss": 1.4998, + "step": 19462 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014506318509355928, + "loss": 1.5303, + "step": 19463 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014505083209004707, + "loss": 1.462, + "step": 19464 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014503847912013696, + "loss": 1.5006, + "step": 19465 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014502612618391285, + "loss": 1.5174, + "step": 19466 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014501377328145863, + "loss": 1.5292, + "step": 19467 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014500142041285813, + "loss": 1.5187, + "step": 19468 + }, + { + "epoch": 1.53, + "learning_rate": 0.0001449890675781952, + "loss": 1.504, + "step": 19469 + }, + { + "epoch": 1.53, + "learning_rate": 0.0001449767147775538, + "loss": 1.517, + "step": 19470 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014496436201101768, + "loss": 1.4732, + "step": 19471 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014495200927867074, + "loss": 1.533, + "step": 19472 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014493965658059696, + "loss": 1.5061, + "step": 19473 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014492730391688004, + "loss": 1.5205, + "step": 19474 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014491495128760398, + "loss": 1.4943, + "step": 19475 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014490259869285257, + "loss": 1.4927, + "step": 19476 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014489024613270968, + "loss": 1.4844, + "step": 19477 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014487789360725925, + "loss": 1.5692, + "step": 19478 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014486554111658507, + "loss": 1.5528, + "step": 19479 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014485318866077097, + "loss": 1.5094, + "step": 19480 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014484083623990092, + "loss": 1.5056, + "step": 19481 + }, + { + "epoch": 1.53, + "learning_rate": 0.0001448284838540588, + "loss": 1.5089, + "step": 19482 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014481613150332836, + "loss": 1.5389, + "step": 19483 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014480377918779354, + "loss": 1.4538, + "step": 19484 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014479142690753823, + "loss": 1.5655, + "step": 19485 + }, + { + "epoch": 1.53, + "learning_rate": 0.0001447790746626462, + "loss": 1.5235, + "step": 19486 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014476672245320143, + "loss": 1.5039, + "step": 19487 + }, + { + "epoch": 1.53, + "learning_rate": 0.0001447543702792877, + "loss": 1.4414, + "step": 19488 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014474201814098888, + "loss": 1.525, + "step": 19489 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014472966603838887, + "loss": 1.4997, + "step": 19490 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014471731397157152, + "loss": 1.5147, + "step": 19491 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014470496194062072, + "loss": 1.5129, + "step": 19492 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014469260994562027, + "loss": 1.5829, + "step": 19493 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014468025798665407, + "loss": 1.5244, + "step": 19494 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014466790606380603, + "loss": 1.4833, + "step": 19495 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014465555417715988, + "loss": 1.4729, + "step": 19496 + }, + { + "epoch": 1.53, + "learning_rate": 0.0001446432023267996, + "loss": 1.5599, + "step": 19497 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014463085051280903, + "loss": 1.5283, + "step": 19498 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014461849873527205, + "loss": 1.4774, + "step": 19499 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014460614699427247, + "loss": 1.5233, + "step": 19500 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014459379528989415, + "loss": 1.538, + "step": 19501 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014458144362222103, + "loss": 1.5403, + "step": 19502 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014456909199133688, + "loss": 1.4873, + "step": 19503 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014455674039732562, + "loss": 1.5162, + "step": 19504 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014454438884027107, + "loss": 1.5135, + "step": 19505 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014453203732025713, + "loss": 1.4816, + "step": 19506 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014451968583736763, + "loss": 1.5198, + "step": 19507 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014450733439168642, + "loss": 1.4883, + "step": 19508 + }, + { + "epoch": 1.53, + "learning_rate": 0.00014449498298329744, + "loss": 1.473, + "step": 19509 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014448263161228442, + "loss": 1.4953, + "step": 19510 + }, + { + "epoch": 1.54, + "learning_rate": 0.0001444702802787313, + "loss": 1.5208, + "step": 19511 + }, + { + "epoch": 1.54, + "learning_rate": 0.0001444579289827219, + "loss": 1.5018, + "step": 19512 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014444557772434012, + "loss": 1.5043, + "step": 19513 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014443322650366984, + "loss": 1.5062, + "step": 19514 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014442087532079485, + "loss": 1.4715, + "step": 19515 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014440852417579907, + "loss": 1.4909, + "step": 19516 + }, + { + "epoch": 1.54, + "learning_rate": 0.0001443961730687663, + "loss": 1.4576, + "step": 19517 + }, + { + "epoch": 1.54, + "learning_rate": 0.0001443838219997804, + "loss": 1.5188, + "step": 19518 + }, + { + "epoch": 1.54, + "learning_rate": 0.0001443714709689253, + "loss": 1.5605, + "step": 19519 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014435911997628478, + "loss": 1.4794, + "step": 19520 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014434676902194275, + "loss": 1.5352, + "step": 19521 + }, + { + "epoch": 1.54, + "learning_rate": 0.000144334418105983, + "loss": 1.539, + "step": 19522 + }, + { + "epoch": 1.54, + "learning_rate": 0.0001443220672284894, + "loss": 1.524, + "step": 19523 + }, + { + "epoch": 1.54, + "learning_rate": 0.0001443097163895459, + "loss": 1.5138, + "step": 19524 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014429736558923626, + "loss": 1.4806, + "step": 19525 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014428501482764434, + "loss": 1.5132, + "step": 19526 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014427266410485404, + "loss": 1.5086, + "step": 19527 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014426031342094914, + "loss": 1.5171, + "step": 19528 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014424796277601355, + "loss": 1.508, + "step": 19529 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014423561217013115, + "loss": 1.5165, + "step": 19530 + }, + { + "epoch": 1.54, + "learning_rate": 0.0001442232616033858, + "loss": 1.4616, + "step": 19531 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014421091107586127, + "loss": 1.5491, + "step": 19532 + }, + { + "epoch": 1.54, + "learning_rate": 0.0001441985605876415, + "loss": 1.4918, + "step": 19533 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014418621013881025, + "loss": 1.5499, + "step": 19534 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014417385972945144, + "loss": 1.5382, + "step": 19535 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014416150935964893, + "loss": 1.517, + "step": 19536 + }, + { + "epoch": 1.54, + "learning_rate": 0.0001441491590294865, + "loss": 1.5244, + "step": 19537 + }, + { + "epoch": 1.54, + "learning_rate": 0.0001441368087390481, + "loss": 1.4942, + "step": 19538 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014412445848841754, + "loss": 1.5268, + "step": 19539 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014411210827767863, + "loss": 1.5047, + "step": 19540 + }, + { + "epoch": 1.54, + "learning_rate": 0.0001440997581069153, + "loss": 1.5215, + "step": 19541 + }, + { + "epoch": 1.54, + "learning_rate": 0.0001440874079762113, + "loss": 1.4872, + "step": 19542 + }, + { + "epoch": 1.54, + "learning_rate": 0.0001440750578856505, + "loss": 1.456, + "step": 19543 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014406270783531684, + "loss": 1.5648, + "step": 19544 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014405035782529417, + "loss": 1.4804, + "step": 19545 + }, + { + "epoch": 1.54, + "learning_rate": 0.0001440380078556662, + "loss": 1.4508, + "step": 19546 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014402565792651691, + "loss": 1.5486, + "step": 19547 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014401330803793014, + "loss": 1.5277, + "step": 19548 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014400095818998965, + "loss": 1.4356, + "step": 19549 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014398860838277938, + "loss": 1.4842, + "step": 19550 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014397625861638312, + "loss": 1.533, + "step": 19551 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014396390889088472, + "loss": 1.4756, + "step": 19552 + }, + { + "epoch": 1.54, + "learning_rate": 0.0001439515592063681, + "loss": 1.5471, + "step": 19553 + }, + { + "epoch": 1.54, + "learning_rate": 0.000143939209562917, + "loss": 1.5001, + "step": 19554 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014392685996061536, + "loss": 1.5208, + "step": 19555 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014391451039954699, + "loss": 1.53, + "step": 19556 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014390216087979574, + "loss": 1.4962, + "step": 19557 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014388981140144543, + "loss": 1.5134, + "step": 19558 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014387746196457986, + "loss": 1.4644, + "step": 19559 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014386511256928307, + "loss": 1.5006, + "step": 19560 + }, + { + "epoch": 1.54, + "learning_rate": 0.0001438527632156387, + "loss": 1.508, + "step": 19561 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014384041390373074, + "loss": 1.5075, + "step": 19562 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014382806463364293, + "loss": 1.5516, + "step": 19563 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014381571540545915, + "loss": 1.4862, + "step": 19564 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014380336621926327, + "loss": 1.5658, + "step": 19565 + }, + { + "epoch": 1.54, + "learning_rate": 0.0001437910170751391, + "loss": 1.5114, + "step": 19566 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014377866797317051, + "loss": 1.4733, + "step": 19567 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014376631891344134, + "loss": 1.4561, + "step": 19568 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014375396989603538, + "loss": 1.4609, + "step": 19569 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014374162092103658, + "loss": 1.5535, + "step": 19570 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014372927198852867, + "loss": 1.4637, + "step": 19571 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014371692309859556, + "loss": 1.4544, + "step": 19572 + }, + { + "epoch": 1.54, + "learning_rate": 0.0001437045742513211, + "loss": 1.5215, + "step": 19573 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014369222544678906, + "loss": 1.5337, + "step": 19574 + }, + { + "epoch": 1.54, + "learning_rate": 0.0001436798766850833, + "loss": 1.5464, + "step": 19575 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014366752796628773, + "loss": 1.5085, + "step": 19576 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014365517929048618, + "loss": 1.5199, + "step": 19577 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014364283065776244, + "loss": 1.5274, + "step": 19578 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014363048206820039, + "loss": 1.4823, + "step": 19579 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014361813352188382, + "loss": 1.5037, + "step": 19580 + }, + { + "epoch": 1.54, + "learning_rate": 0.0001436057850188966, + "loss": 1.5289, + "step": 19581 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014359343655932262, + "loss": 1.535, + "step": 19582 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014358108814324562, + "loss": 1.4872, + "step": 19583 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014356873977074952, + "loss": 1.4727, + "step": 19584 + }, + { + "epoch": 1.54, + "learning_rate": 0.0001435563914419181, + "loss": 1.5339, + "step": 19585 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014354404315683524, + "loss": 1.564, + "step": 19586 + }, + { + "epoch": 1.54, + "learning_rate": 0.0001435316949155848, + "loss": 1.5816, + "step": 19587 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014351934671825054, + "loss": 1.4402, + "step": 19588 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014350699856491633, + "loss": 1.52, + "step": 19589 + }, + { + "epoch": 1.54, + "learning_rate": 0.000143494650455666, + "loss": 1.5399, + "step": 19590 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014348230239058345, + "loss": 1.5321, + "step": 19591 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014346995436975243, + "loss": 1.4574, + "step": 19592 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014345760639325683, + "loss": 1.5582, + "step": 19593 + }, + { + "epoch": 1.54, + "learning_rate": 0.0001434452584611805, + "loss": 1.492, + "step": 19594 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014343291057360724, + "loss": 1.4939, + "step": 19595 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014342056273062087, + "loss": 1.5437, + "step": 19596 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014340821493230528, + "loss": 1.5022, + "step": 19597 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014339586717874425, + "loss": 1.5074, + "step": 19598 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014338351947002168, + "loss": 1.5133, + "step": 19599 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014337117180622132, + "loss": 1.5133, + "step": 19600 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014335882418742703, + "loss": 1.4646, + "step": 19601 + }, + { + "epoch": 1.54, + "learning_rate": 0.0001433464766137227, + "loss": 1.5025, + "step": 19602 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014333412908519211, + "loss": 1.5304, + "step": 19603 + }, + { + "epoch": 1.54, + "learning_rate": 0.0001433217816019191, + "loss": 1.5283, + "step": 19604 + }, + { + "epoch": 1.54, + "learning_rate": 0.0001433094341639875, + "loss": 1.5248, + "step": 19605 + }, + { + "epoch": 1.54, + "learning_rate": 0.0001432970867714811, + "loss": 1.5369, + "step": 19606 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014328473942448383, + "loss": 1.4667, + "step": 19607 + }, + { + "epoch": 1.54, + "learning_rate": 0.0001432723921230795, + "loss": 1.5183, + "step": 19608 + }, + { + "epoch": 1.54, + "learning_rate": 0.0001432600448673519, + "loss": 1.507, + "step": 19609 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014324769765738484, + "loss": 1.5426, + "step": 19610 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014323535049326225, + "loss": 1.5747, + "step": 19611 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014322300337506785, + "loss": 1.5283, + "step": 19612 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014321065630288552, + "loss": 1.4997, + "step": 19613 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014319830927679914, + "loss": 1.5409, + "step": 19614 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014318596229689242, + "loss": 1.5563, + "step": 19615 + }, + { + "epoch": 1.54, + "learning_rate": 0.0001431736153632493, + "loss": 1.5291, + "step": 19616 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014316126847595354, + "loss": 1.5319, + "step": 19617 + }, + { + "epoch": 1.54, + "learning_rate": 0.000143148921635089, + "loss": 1.5385, + "step": 19618 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014313657484073952, + "loss": 1.4553, + "step": 19619 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014312422809298887, + "loss": 1.5228, + "step": 19620 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014311188139192095, + "loss": 1.5213, + "step": 19621 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014309953473761947, + "loss": 1.4918, + "step": 19622 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014308718813016845, + "loss": 1.5566, + "step": 19623 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014307484156965154, + "loss": 1.4818, + "step": 19624 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014306249505615265, + "loss": 1.5151, + "step": 19625 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014305014858975563, + "loss": 1.4728, + "step": 19626 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014303780217054423, + "loss": 1.421, + "step": 19627 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014302545579860236, + "loss": 1.4676, + "step": 19628 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014301310947401372, + "loss": 1.5154, + "step": 19629 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014300076319686224, + "loss": 1.4935, + "step": 19630 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014298841696723175, + "loss": 1.4961, + "step": 19631 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014297607078520602, + "loss": 1.5334, + "step": 19632 + }, + { + "epoch": 1.54, + "learning_rate": 0.0001429637246508689, + "loss": 1.5388, + "step": 19633 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014295137856430417, + "loss": 1.55, + "step": 19634 + }, + { + "epoch": 1.54, + "learning_rate": 0.0001429390325255957, + "loss": 1.4931, + "step": 19635 + }, + { + "epoch": 1.54, + "learning_rate": 0.00014292668653482734, + "loss": 1.5064, + "step": 19636 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014291434059208284, + "loss": 1.5263, + "step": 19637 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014290199469744604, + "loss": 1.5173, + "step": 19638 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014288964885100078, + "loss": 1.4632, + "step": 19639 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014287730305283093, + "loss": 1.5585, + "step": 19640 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014286495730302023, + "loss": 1.5214, + "step": 19641 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014285261160165255, + "loss": 1.542, + "step": 19642 + }, + { + "epoch": 1.55, + "learning_rate": 0.0001428402659488117, + "loss": 1.4545, + "step": 19643 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014282792034458146, + "loss": 1.525, + "step": 19644 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014281557478904573, + "loss": 1.501, + "step": 19645 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014280322928228825, + "loss": 1.5233, + "step": 19646 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014279088382439286, + "loss": 1.5014, + "step": 19647 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014277853841544342, + "loss": 1.4633, + "step": 19648 + }, + { + "epoch": 1.55, + "learning_rate": 0.0001427661930555237, + "loss": 1.5081, + "step": 19649 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014275384774471752, + "loss": 1.4671, + "step": 19650 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014274150248310875, + "loss": 1.5331, + "step": 19651 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014272915727078114, + "loss": 1.4533, + "step": 19652 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014271681210781853, + "loss": 1.505, + "step": 19653 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014270446699430475, + "loss": 1.4908, + "step": 19654 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014269212193032368, + "loss": 1.5237, + "step": 19655 + }, + { + "epoch": 1.55, + "learning_rate": 0.000142679776915959, + "loss": 1.5032, + "step": 19656 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014266743195129466, + "loss": 1.5659, + "step": 19657 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014265508703641437, + "loss": 1.5154, + "step": 19658 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014264274217140195, + "loss": 1.5273, + "step": 19659 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014263039735634133, + "loss": 1.5531, + "step": 19660 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014261805259131619, + "loss": 1.497, + "step": 19661 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014260570787641045, + "loss": 1.557, + "step": 19662 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014259336321170783, + "loss": 1.5064, + "step": 19663 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014258101859729216, + "loss": 1.4892, + "step": 19664 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014256867403324736, + "loss": 1.4964, + "step": 19665 + }, + { + "epoch": 1.55, + "learning_rate": 0.0001425563295196571, + "loss": 1.5112, + "step": 19666 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014254398505660523, + "loss": 1.4873, + "step": 19667 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014253164064417567, + "loss": 1.4918, + "step": 19668 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014251929628245207, + "loss": 1.5319, + "step": 19669 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014250695197151833, + "loss": 1.5049, + "step": 19670 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014249460771145826, + "loss": 1.5729, + "step": 19671 + }, + { + "epoch": 1.55, + "learning_rate": 0.0001424822635023557, + "loss": 1.5009, + "step": 19672 + }, + { + "epoch": 1.55, + "learning_rate": 0.0001424699193442944, + "loss": 1.4975, + "step": 19673 + }, + { + "epoch": 1.55, + "learning_rate": 0.0001424575752373582, + "loss": 1.5057, + "step": 19674 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014244523118163088, + "loss": 1.5684, + "step": 19675 + }, + { + "epoch": 1.55, + "learning_rate": 0.0001424328871771963, + "loss": 1.4683, + "step": 19676 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014242054322413823, + "loss": 1.4989, + "step": 19677 + }, + { + "epoch": 1.55, + "learning_rate": 0.0001424081993225405, + "loss": 1.5092, + "step": 19678 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014239585547248687, + "loss": 1.5183, + "step": 19679 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014238351167406124, + "loss": 1.5114, + "step": 19680 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014237116792734732, + "loss": 1.4963, + "step": 19681 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014235882423242898, + "loss": 1.5385, + "step": 19682 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014234648058939, + "loss": 1.482, + "step": 19683 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014233413699831418, + "loss": 1.5263, + "step": 19684 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014232179345928528, + "loss": 1.5334, + "step": 19685 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014230944997238725, + "loss": 1.5039, + "step": 19686 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014229710653770379, + "loss": 1.4607, + "step": 19687 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014228476315531873, + "loss": 1.4867, + "step": 19688 + }, + { + "epoch": 1.55, + "learning_rate": 0.0001422724198253159, + "loss": 1.4858, + "step": 19689 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014226007654777903, + "loss": 1.5791, + "step": 19690 + }, + { + "epoch": 1.55, + "learning_rate": 0.000142247733322792, + "loss": 1.5312, + "step": 19691 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014223539015043856, + "loss": 1.4916, + "step": 19692 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014222304703080253, + "loss": 1.547, + "step": 19693 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014221070396396778, + "loss": 1.4892, + "step": 19694 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014219836095001799, + "loss": 1.4764, + "step": 19695 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014218601798903703, + "loss": 1.5752, + "step": 19696 + }, + { + "epoch": 1.55, + "learning_rate": 0.0001421736750811087, + "loss": 1.5322, + "step": 19697 + }, + { + "epoch": 1.55, + "learning_rate": 0.0001421613322263168, + "loss": 1.4856, + "step": 19698 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014214898942474513, + "loss": 1.5291, + "step": 19699 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014213664667647743, + "loss": 1.4905, + "step": 19700 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014212430398159763, + "loss": 1.4293, + "step": 19701 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014211196134018944, + "loss": 1.4661, + "step": 19702 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014209961875233672, + "loss": 1.4761, + "step": 19703 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014208727621812319, + "loss": 1.5156, + "step": 19704 + }, + { + "epoch": 1.55, + "learning_rate": 0.0001420749337376327, + "loss": 1.5225, + "step": 19705 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014206259131094903, + "loss": 1.4922, + "step": 19706 + }, + { + "epoch": 1.55, + "learning_rate": 0.000142050248938156, + "loss": 1.4741, + "step": 19707 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014203790661933735, + "loss": 1.5295, + "step": 19708 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014202556435457698, + "loss": 1.5719, + "step": 19709 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014201322214395858, + "loss": 1.5021, + "step": 19710 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014200087998756603, + "loss": 1.4928, + "step": 19711 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014198853788548307, + "loss": 1.5088, + "step": 19712 + }, + { + "epoch": 1.55, + "learning_rate": 0.0001419761958377935, + "loss": 1.5138, + "step": 19713 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014196385384458116, + "loss": 1.5597, + "step": 19714 + }, + { + "epoch": 1.55, + "learning_rate": 0.0001419515119059298, + "loss": 1.5253, + "step": 19715 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014193917002192321, + "loss": 1.4945, + "step": 19716 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014192682819264522, + "loss": 1.5414, + "step": 19717 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014191448641817964, + "loss": 1.5105, + "step": 19718 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014190214469861023, + "loss": 1.536, + "step": 19719 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014188980303402081, + "loss": 1.518, + "step": 19720 + }, + { + "epoch": 1.55, + "learning_rate": 0.0001418774614244951, + "loss": 1.5687, + "step": 19721 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014186511987011698, + "loss": 1.5023, + "step": 19722 + }, + { + "epoch": 1.55, + "learning_rate": 0.0001418527783709702, + "loss": 1.5342, + "step": 19723 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014184043692713855, + "loss": 1.4956, + "step": 19724 + }, + { + "epoch": 1.55, + "learning_rate": 0.0001418280955387058, + "loss": 1.5767, + "step": 19725 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014181575420575584, + "loss": 1.527, + "step": 19726 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014180341292837235, + "loss": 1.4887, + "step": 19727 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014179107170663921, + "loss": 1.4859, + "step": 19728 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014177873054064012, + "loss": 1.5247, + "step": 19729 + }, + { + "epoch": 1.55, + "learning_rate": 0.0001417663894304589, + "loss": 1.5303, + "step": 19730 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014175404837617938, + "loss": 1.479, + "step": 19731 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014174170737788527, + "loss": 1.5309, + "step": 19732 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014172936643566043, + "loss": 1.53, + "step": 19733 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014171702554958865, + "loss": 1.5433, + "step": 19734 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014170468471975373, + "loss": 1.5543, + "step": 19735 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014169234394623937, + "loss": 1.5231, + "step": 19736 + }, + { + "epoch": 1.55, + "learning_rate": 0.0001416800032291294, + "loss": 1.4594, + "step": 19737 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014166766256850768, + "loss": 1.4823, + "step": 19738 + }, + { + "epoch": 1.55, + "learning_rate": 0.0001416553219644579, + "loss": 1.5472, + "step": 19739 + }, + { + "epoch": 1.55, + "learning_rate": 0.0001416429814170639, + "loss": 1.4767, + "step": 19740 + }, + { + "epoch": 1.55, + "learning_rate": 0.0001416306409264094, + "loss": 1.4938, + "step": 19741 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014161830049257823, + "loss": 1.4995, + "step": 19742 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014160596011565421, + "loss": 1.5164, + "step": 19743 + }, + { + "epoch": 1.55, + "learning_rate": 0.0001415936197957211, + "loss": 1.4757, + "step": 19744 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014158127953286265, + "loss": 1.5439, + "step": 19745 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014156893932716267, + "loss": 1.5303, + "step": 19746 + }, + { + "epoch": 1.55, + "learning_rate": 0.0001415565991787049, + "loss": 1.5695, + "step": 19747 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014154425908757313, + "loss": 1.5108, + "step": 19748 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014153191905385125, + "loss": 1.5224, + "step": 19749 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014151957907762298, + "loss": 1.5206, + "step": 19750 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014150723915897206, + "loss": 1.5065, + "step": 19751 + }, + { + "epoch": 1.55, + "learning_rate": 0.0001414948992979823, + "loss": 1.5211, + "step": 19752 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014148255949473747, + "loss": 1.4639, + "step": 19753 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014147021974932137, + "loss": 1.5433, + "step": 19754 + }, + { + "epoch": 1.55, + "learning_rate": 0.0001414578800618178, + "loss": 1.5297, + "step": 19755 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014144554043231047, + "loss": 1.5612, + "step": 19756 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014143320086088324, + "loss": 1.5088, + "step": 19757 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014142086134761981, + "loss": 1.5027, + "step": 19758 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014140852189260401, + "loss": 1.5243, + "step": 19759 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014139618249591962, + "loss": 1.5034, + "step": 19760 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014138384315765039, + "loss": 1.4949, + "step": 19761 + }, + { + "epoch": 1.55, + "learning_rate": 0.0001413715038778801, + "loss": 1.5073, + "step": 19762 + }, + { + "epoch": 1.55, + "learning_rate": 0.00014135916465669247, + "loss": 1.5226, + "step": 19763 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014134682549417146, + "loss": 1.4705, + "step": 19764 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014133448639040068, + "loss": 1.4885, + "step": 19765 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014132214734546394, + "loss": 1.5278, + "step": 19766 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014130980835944508, + "loss": 1.586, + "step": 19767 + }, + { + "epoch": 1.56, + "learning_rate": 0.0001412974694324278, + "loss": 1.4953, + "step": 19768 + }, + { + "epoch": 1.56, + "learning_rate": 0.0001412851305644959, + "loss": 1.5431, + "step": 19769 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014127279175573315, + "loss": 1.5378, + "step": 19770 + }, + { + "epoch": 1.56, + "learning_rate": 0.0001412604530062233, + "loss": 1.5307, + "step": 19771 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014124811431605024, + "loss": 1.5088, + "step": 19772 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014123577568529757, + "loss": 1.5208, + "step": 19773 + }, + { + "epoch": 1.56, + "learning_rate": 0.0001412234371140492, + "loss": 1.5453, + "step": 19774 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014121109860238881, + "loss": 1.481, + "step": 19775 + }, + { + "epoch": 1.56, + "learning_rate": 0.0001411987601504002, + "loss": 1.4916, + "step": 19776 + }, + { + "epoch": 1.56, + "learning_rate": 0.0001411864217581672, + "loss": 1.4905, + "step": 19777 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014117408342577352, + "loss": 1.4696, + "step": 19778 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014116174515330288, + "loss": 1.5158, + "step": 19779 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014114940694083915, + "loss": 1.5699, + "step": 19780 + }, + { + "epoch": 1.56, + "learning_rate": 0.0001411370687884661, + "loss": 1.4689, + "step": 19781 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014112473069626742, + "loss": 1.4631, + "step": 19782 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014111239266432693, + "loss": 1.5724, + "step": 19783 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014110005469272842, + "loss": 1.4976, + "step": 19784 + }, + { + "epoch": 1.56, + "learning_rate": 0.0001410877167815556, + "loss": 1.5259, + "step": 19785 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014107537893089228, + "loss": 1.5101, + "step": 19786 + }, + { + "epoch": 1.56, + "learning_rate": 0.0001410630411408222, + "loss": 1.5275, + "step": 19787 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014105070341142913, + "loss": 1.5373, + "step": 19788 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014103836574279688, + "loss": 1.5051, + "step": 19789 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014102602813500915, + "loss": 1.5217, + "step": 19790 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014101369058814973, + "loss": 1.4891, + "step": 19791 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014100135310230244, + "loss": 1.5058, + "step": 19792 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014098901567755092, + "loss": 1.5013, + "step": 19793 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014097667831397908, + "loss": 1.4667, + "step": 19794 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014096434101167052, + "loss": 1.4393, + "step": 19795 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014095200377070918, + "loss": 1.5544, + "step": 19796 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014093966659117874, + "loss": 1.4662, + "step": 19797 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014092732947316297, + "loss": 1.5085, + "step": 19798 + }, + { + "epoch": 1.56, + "learning_rate": 0.0001409149924167456, + "loss": 1.5251, + "step": 19799 + }, + { + "epoch": 1.56, + "learning_rate": 0.0001409026554220104, + "loss": 1.4688, + "step": 19800 + }, + { + "epoch": 1.56, + "learning_rate": 0.0001408903184890412, + "loss": 1.5443, + "step": 19801 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014087798161792169, + "loss": 1.468, + "step": 19802 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014086564480873565, + "loss": 1.5475, + "step": 19803 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014085330806156684, + "loss": 1.475, + "step": 19804 + }, + { + "epoch": 1.56, + "learning_rate": 0.000140840971376499, + "loss": 1.49, + "step": 19805 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014082863475361595, + "loss": 1.5007, + "step": 19806 + }, + { + "epoch": 1.56, + "learning_rate": 0.0001408162981930014, + "loss": 1.4837, + "step": 19807 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014080396169473906, + "loss": 1.5176, + "step": 19808 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014079162525891282, + "loss": 1.5689, + "step": 19809 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014077928888560633, + "loss": 1.4885, + "step": 19810 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014076695257490333, + "loss": 1.5534, + "step": 19811 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014075461632688768, + "loss": 1.4764, + "step": 19812 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014074228014164308, + "loss": 1.5006, + "step": 19813 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014072994401925329, + "loss": 1.4822, + "step": 19814 + }, + { + "epoch": 1.56, + "learning_rate": 0.0001407176079598021, + "loss": 1.5183, + "step": 19815 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014070527196337318, + "loss": 1.5107, + "step": 19816 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014069293603005033, + "loss": 1.5223, + "step": 19817 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014068060015991736, + "loss": 1.5369, + "step": 19818 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014066826435305793, + "loss": 1.5356, + "step": 19819 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014065592860955584, + "loss": 1.5391, + "step": 19820 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014064359292949487, + "loss": 1.5264, + "step": 19821 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014063125731295868, + "loss": 1.5219, + "step": 19822 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014061892176003114, + "loss": 1.5439, + "step": 19823 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014060658627079592, + "loss": 1.5062, + "step": 19824 + }, + { + "epoch": 1.56, + "learning_rate": 0.0001405942508453368, + "loss": 1.5006, + "step": 19825 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014058191548373746, + "loss": 1.5406, + "step": 19826 + }, + { + "epoch": 1.56, + "learning_rate": 0.0001405695801860818, + "loss": 1.5227, + "step": 19827 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014055724495245345, + "loss": 1.5437, + "step": 19828 + }, + { + "epoch": 1.56, + "learning_rate": 0.0001405449097829362, + "loss": 1.5361, + "step": 19829 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014053257467761383, + "loss": 1.4856, + "step": 19830 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014052023963657002, + "loss": 1.5208, + "step": 19831 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014050790465988856, + "loss": 1.5505, + "step": 19832 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014049556974765322, + "loss": 1.4981, + "step": 19833 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014048323489994767, + "loss": 1.5334, + "step": 19834 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014047090011685574, + "loss": 1.4661, + "step": 19835 + }, + { + "epoch": 1.56, + "learning_rate": 0.0001404585653984611, + "loss": 1.4656, + "step": 19836 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014044623074484754, + "loss": 1.501, + "step": 19837 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014043389615609885, + "loss": 1.5369, + "step": 19838 + }, + { + "epoch": 1.56, + "learning_rate": 0.0001404215616322987, + "loss": 1.5136, + "step": 19839 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014040922717353086, + "loss": 1.4846, + "step": 19840 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014039689277987907, + "loss": 1.5485, + "step": 19841 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014038455845142702, + "loss": 1.4861, + "step": 19842 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014037222418825855, + "loss": 1.486, + "step": 19843 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014035988999045742, + "loss": 1.4935, + "step": 19844 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014034755585810727, + "loss": 1.461, + "step": 19845 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014033522179129188, + "loss": 1.5292, + "step": 19846 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014032288779009504, + "loss": 1.5483, + "step": 19847 + }, + { + "epoch": 1.56, + "learning_rate": 0.0001403105538546004, + "loss": 1.5473, + "step": 19848 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014029821998489178, + "loss": 1.5016, + "step": 19849 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014028588618105294, + "loss": 1.5017, + "step": 19850 + }, + { + "epoch": 1.56, + "learning_rate": 0.0001402735524431675, + "loss": 1.5455, + "step": 19851 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014026121877131932, + "loss": 1.5646, + "step": 19852 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014024888516559207, + "loss": 1.5168, + "step": 19853 + }, + { + "epoch": 1.56, + "learning_rate": 0.0001402365516260695, + "loss": 1.531, + "step": 19854 + }, + { + "epoch": 1.56, + "learning_rate": 0.0001402242181528354, + "loss": 1.4858, + "step": 19855 + }, + { + "epoch": 1.56, + "learning_rate": 0.0001402118847459734, + "loss": 1.5306, + "step": 19856 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014019955140556737, + "loss": 1.516, + "step": 19857 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014018721813170086, + "loss": 1.4886, + "step": 19858 + }, + { + "epoch": 1.56, + "learning_rate": 0.0001401748849244578, + "loss": 1.5624, + "step": 19859 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014016255178392185, + "loss": 1.5636, + "step": 19860 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014015021871017675, + "loss": 1.5292, + "step": 19861 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014013788570330625, + "loss": 1.4898, + "step": 19862 + }, + { + "epoch": 1.56, + "learning_rate": 0.000140125552763394, + "loss": 1.4399, + "step": 19863 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014011321989052387, + "loss": 1.4787, + "step": 19864 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014010088708477948, + "loss": 1.4874, + "step": 19865 + }, + { + "epoch": 1.56, + "learning_rate": 0.0001400885543462446, + "loss": 1.5511, + "step": 19866 + }, + { + "epoch": 1.56, + "learning_rate": 0.000140076221675003, + "loss": 1.4906, + "step": 19867 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014006388907113836, + "loss": 1.5222, + "step": 19868 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014005155653473443, + "loss": 1.5003, + "step": 19869 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014003922406587494, + "loss": 1.5007, + "step": 19870 + }, + { + "epoch": 1.56, + "learning_rate": 0.0001400268916646436, + "loss": 1.5332, + "step": 19871 + }, + { + "epoch": 1.56, + "learning_rate": 0.0001400145593311242, + "loss": 1.4357, + "step": 19872 + }, + { + "epoch": 1.56, + "learning_rate": 0.00014000222706540036, + "loss": 1.5496, + "step": 19873 + }, + { + "epoch": 1.56, + "learning_rate": 0.00013998989486755593, + "loss": 1.5037, + "step": 19874 + }, + { + "epoch": 1.56, + "learning_rate": 0.00013997756273767458, + "loss": 1.432, + "step": 19875 + }, + { + "epoch": 1.56, + "learning_rate": 0.0001399652306758401, + "loss": 1.5277, + "step": 19876 + }, + { + "epoch": 1.56, + "learning_rate": 0.0001399528986821361, + "loss": 1.5258, + "step": 19877 + }, + { + "epoch": 1.56, + "learning_rate": 0.0001399405667566464, + "loss": 1.4605, + "step": 19878 + }, + { + "epoch": 1.56, + "learning_rate": 0.00013992823489945472, + "loss": 1.5227, + "step": 19879 + }, + { + "epoch": 1.56, + "learning_rate": 0.00013991590311064473, + "loss": 1.5083, + "step": 19880 + }, + { + "epoch": 1.56, + "learning_rate": 0.00013990357139030023, + "loss": 1.4753, + "step": 19881 + }, + { + "epoch": 1.56, + "learning_rate": 0.00013989123973850488, + "loss": 1.5053, + "step": 19882 + }, + { + "epoch": 1.56, + "learning_rate": 0.00013987890815534245, + "loss": 1.5112, + "step": 19883 + }, + { + "epoch": 1.56, + "learning_rate": 0.00013986657664089667, + "loss": 1.4909, + "step": 19884 + }, + { + "epoch": 1.56, + "learning_rate": 0.0001398542451952512, + "loss": 1.4978, + "step": 19885 + }, + { + "epoch": 1.56, + "learning_rate": 0.00013984191381848985, + "loss": 1.4764, + "step": 19886 + }, + { + "epoch": 1.56, + "learning_rate": 0.00013982958251069626, + "loss": 1.5264, + "step": 19887 + }, + { + "epoch": 1.56, + "learning_rate": 0.00013981725127195418, + "loss": 1.5129, + "step": 19888 + }, + { + "epoch": 1.56, + "learning_rate": 0.0001398049201023473, + "loss": 1.5093, + "step": 19889 + }, + { + "epoch": 1.56, + "learning_rate": 0.00013979258900195948, + "loss": 1.528, + "step": 19890 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013978025797087434, + "loss": 1.5254, + "step": 19891 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013976792700917556, + "loss": 1.5219, + "step": 19892 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013975559611694696, + "loss": 1.4738, + "step": 19893 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013974326529427218, + "loss": 1.4937, + "step": 19894 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013973093454123497, + "loss": 1.5084, + "step": 19895 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013971860385791906, + "loss": 1.4874, + "step": 19896 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013970627324440816, + "loss": 1.5153, + "step": 19897 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013969394270078598, + "loss": 1.5037, + "step": 19898 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013968161222713624, + "loss": 1.4771, + "step": 19899 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013966928182354265, + "loss": 1.5521, + "step": 19900 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013965695149008894, + "loss": 1.5165, + "step": 19901 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013964462122685882, + "loss": 1.5073, + "step": 19902 + }, + { + "epoch": 1.57, + "learning_rate": 0.000139632291033936, + "loss": 1.5276, + "step": 19903 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013961996091140424, + "loss": 1.5173, + "step": 19904 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013960763085934714, + "loss": 1.4964, + "step": 19905 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013959530087784855, + "loss": 1.5, + "step": 19906 + }, + { + "epoch": 1.57, + "learning_rate": 0.0001395829709669921, + "loss": 1.5042, + "step": 19907 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013957064112686155, + "loss": 1.5055, + "step": 19908 + }, + { + "epoch": 1.57, + "learning_rate": 0.0001395583113575406, + "loss": 1.4993, + "step": 19909 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013954598165911294, + "loss": 1.5841, + "step": 19910 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013953365203166229, + "loss": 1.559, + "step": 19911 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013952132247527238, + "loss": 1.5258, + "step": 19912 + }, + { + "epoch": 1.57, + "learning_rate": 0.0001395089929900269, + "loss": 1.5192, + "step": 19913 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013949666357600956, + "loss": 1.5448, + "step": 19914 + }, + { + "epoch": 1.57, + "learning_rate": 0.0001394843342333041, + "loss": 1.5065, + "step": 19915 + }, + { + "epoch": 1.57, + "learning_rate": 0.0001394720049619942, + "loss": 1.5253, + "step": 19916 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013945967576216355, + "loss": 1.5802, + "step": 19917 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013944734663389594, + "loss": 1.4965, + "step": 19918 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013943501757727496, + "loss": 1.4608, + "step": 19919 + }, + { + "epoch": 1.57, + "learning_rate": 0.0001394226885923844, + "loss": 1.5305, + "step": 19920 + }, + { + "epoch": 1.57, + "learning_rate": 0.0001394103596793079, + "loss": 1.5217, + "step": 19921 + }, + { + "epoch": 1.57, + "learning_rate": 0.0001393980308381293, + "loss": 1.5465, + "step": 19922 + }, + { + "epoch": 1.57, + "learning_rate": 0.0001393857020689322, + "loss": 1.5178, + "step": 19923 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013937337337180028, + "loss": 1.5236, + "step": 19924 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013936104474681735, + "loss": 1.5034, + "step": 19925 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013934871619406705, + "loss": 1.5581, + "step": 19926 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013933638771363306, + "loss": 1.5159, + "step": 19927 + }, + { + "epoch": 1.57, + "learning_rate": 0.0001393240593055991, + "loss": 1.5026, + "step": 19928 + }, + { + "epoch": 1.57, + "learning_rate": 0.0001393117309700489, + "loss": 1.4631, + "step": 19929 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013929940270706622, + "loss": 1.5392, + "step": 19930 + }, + { + "epoch": 1.57, + "learning_rate": 0.0001392870745167346, + "loss": 1.6033, + "step": 19931 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013927474639913783, + "loss": 1.5565, + "step": 19932 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013926241835435967, + "loss": 1.4617, + "step": 19933 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013925009038248375, + "loss": 1.5481, + "step": 19934 + }, + { + "epoch": 1.57, + "learning_rate": 0.0001392377624835938, + "loss": 1.4626, + "step": 19935 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013922543465777338, + "loss": 1.4972, + "step": 19936 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013921310690510644, + "loss": 1.5276, + "step": 19937 + }, + { + "epoch": 1.57, + "learning_rate": 0.0001392007792256765, + "loss": 1.4261, + "step": 19938 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013918845161956734, + "loss": 1.5189, + "step": 19939 + }, + { + "epoch": 1.57, + "learning_rate": 0.0001391761240868626, + "loss": 1.5081, + "step": 19940 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013916379662764602, + "loss": 1.4815, + "step": 19941 + }, + { + "epoch": 1.57, + "learning_rate": 0.0001391514692420013, + "loss": 1.5456, + "step": 19942 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013913914193001208, + "loss": 1.5652, + "step": 19943 + }, + { + "epoch": 1.57, + "learning_rate": 0.0001391268146917621, + "loss": 1.4849, + "step": 19944 + }, + { + "epoch": 1.57, + "learning_rate": 0.0001391144875273351, + "loss": 1.5308, + "step": 19945 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013910216043681466, + "loss": 1.5293, + "step": 19946 + }, + { + "epoch": 1.57, + "learning_rate": 0.0001390898334202846, + "loss": 1.5136, + "step": 19947 + }, + { + "epoch": 1.57, + "learning_rate": 0.0001390775064778285, + "loss": 1.5898, + "step": 19948 + }, + { + "epoch": 1.57, + "learning_rate": 0.0001390651796095301, + "loss": 1.5036, + "step": 19949 + }, + { + "epoch": 1.57, + "learning_rate": 0.0001390528528154731, + "loss": 1.5581, + "step": 19950 + }, + { + "epoch": 1.57, + "learning_rate": 0.0001390405260957412, + "loss": 1.5217, + "step": 19951 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013902819945041804, + "loss": 1.4898, + "step": 19952 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013901587287958736, + "loss": 1.5517, + "step": 19953 + }, + { + "epoch": 1.57, + "learning_rate": 0.0001390035463833329, + "loss": 1.5431, + "step": 19954 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013899121996173823, + "loss": 1.4703, + "step": 19955 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013897889361488716, + "loss": 1.5774, + "step": 19956 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013896656734286328, + "loss": 1.5076, + "step": 19957 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013895424114575034, + "loss": 1.5309, + "step": 19958 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013894191502363202, + "loss": 1.4981, + "step": 19959 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013892958897659196, + "loss": 1.546, + "step": 19960 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013891726300471386, + "loss": 1.4556, + "step": 19961 + }, + { + "epoch": 1.57, + "learning_rate": 0.0001389049371080815, + "loss": 1.4888, + "step": 19962 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013889261128677844, + "loss": 1.5075, + "step": 19963 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013888028554088846, + "loss": 1.4914, + "step": 19964 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013886795987049516, + "loss": 1.5043, + "step": 19965 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013885563427568228, + "loss": 1.5071, + "step": 19966 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013884330875653354, + "loss": 1.5177, + "step": 19967 + }, + { + "epoch": 1.57, + "learning_rate": 0.0001388309833131325, + "loss": 1.4988, + "step": 19968 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013881865794556294, + "loss": 1.4815, + "step": 19969 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013880633265390854, + "loss": 1.4934, + "step": 19970 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013879400743825298, + "loss": 1.4802, + "step": 19971 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013878168229867991, + "loss": 1.4948, + "step": 19972 + }, + { + "epoch": 1.57, + "learning_rate": 0.000138769357235273, + "loss": 1.4631, + "step": 19973 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013875703224811603, + "loss": 1.4851, + "step": 19974 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013874470733729255, + "loss": 1.5138, + "step": 19975 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013873238250288632, + "loss": 1.5377, + "step": 19976 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013872005774498097, + "loss": 1.5132, + "step": 19977 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013870773306366022, + "loss": 1.465, + "step": 19978 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013869540845900773, + "loss": 1.5251, + "step": 19979 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013868308393110717, + "loss": 1.5691, + "step": 19980 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013867075948004225, + "loss": 1.512, + "step": 19981 + }, + { + "epoch": 1.57, + "learning_rate": 0.0001386584351058966, + "loss": 1.533, + "step": 19982 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013864611080875386, + "loss": 1.5256, + "step": 19983 + }, + { + "epoch": 1.57, + "learning_rate": 0.0001386337865886978, + "loss": 1.5179, + "step": 19984 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013862146244581213, + "loss": 1.5007, + "step": 19985 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013860913838018038, + "loss": 1.4624, + "step": 19986 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013859681439188628, + "loss": 1.5861, + "step": 19987 + }, + { + "epoch": 1.57, + "learning_rate": 0.0001385844904810136, + "loss": 1.456, + "step": 19988 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013857216664764585, + "loss": 1.4736, + "step": 19989 + }, + { + "epoch": 1.57, + "learning_rate": 0.0001385598428918668, + "loss": 1.4931, + "step": 19990 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013854751921376016, + "loss": 1.5306, + "step": 19991 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013853519561340946, + "loss": 1.5204, + "step": 19992 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013852287209089852, + "loss": 1.5393, + "step": 19993 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013851054864631092, + "loss": 1.5026, + "step": 19994 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013849822527973034, + "loss": 1.4899, + "step": 19995 + }, + { + "epoch": 1.57, + "learning_rate": 0.0001384859019912405, + "loss": 1.4731, + "step": 19996 + }, + { + "epoch": 1.57, + "learning_rate": 0.000138473578780925, + "loss": 1.5333, + "step": 19997 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013846125564886754, + "loss": 1.4772, + "step": 19998 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013844893259515174, + "loss": 1.5269, + "step": 19999 + }, + { + "epoch": 1.57, + "learning_rate": 0.0001384366096198614, + "loss": 1.4998, + "step": 20000 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013842428672308004, + "loss": 1.5544, + "step": 20001 + }, + { + "epoch": 1.57, + "learning_rate": 0.0001384119639048914, + "loss": 1.5374, + "step": 20002 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013839964116537919, + "loss": 1.4641, + "step": 20003 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013838731850462696, + "loss": 1.491, + "step": 20004 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013837499592271845, + "loss": 1.512, + "step": 20005 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013836267341973727, + "loss": 1.5049, + "step": 20006 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013835035099576712, + "loss": 1.4766, + "step": 20007 + }, + { + "epoch": 1.57, + "learning_rate": 0.0001383380286508917, + "loss": 1.4777, + "step": 20008 + }, + { + "epoch": 1.57, + "learning_rate": 0.0001383257063851946, + "loss": 1.4473, + "step": 20009 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013831338419875955, + "loss": 1.5324, + "step": 20010 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013830106209167012, + "loss": 1.5036, + "step": 20011 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013828874006401, + "loss": 1.5278, + "step": 20012 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013827641811586293, + "loss": 1.5292, + "step": 20013 + }, + { + "epoch": 1.57, + "learning_rate": 0.0001382640962473125, + "loss": 1.5714, + "step": 20014 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013825177445844232, + "loss": 1.5439, + "step": 20015 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013823945274933614, + "loss": 1.4567, + "step": 20016 + }, + { + "epoch": 1.57, + "learning_rate": 0.00013822713112007762, + "loss": 1.5504, + "step": 20017 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013821480957075036, + "loss": 1.5502, + "step": 20018 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013820248810143804, + "loss": 1.551, + "step": 20019 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013819016671222435, + "loss": 1.5131, + "step": 20020 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013817784540319286, + "loss": 1.5611, + "step": 20021 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013816552417442735, + "loss": 1.528, + "step": 20022 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013815320302601133, + "loss": 1.5035, + "step": 20023 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013814088195802853, + "loss": 1.5258, + "step": 20024 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013812856097056265, + "loss": 1.5553, + "step": 20025 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013811624006369722, + "loss": 1.4784, + "step": 20026 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013810391923751598, + "loss": 1.5193, + "step": 20027 + }, + { + "epoch": 1.58, + "learning_rate": 0.0001380915984921026, + "loss": 1.4537, + "step": 20028 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013807927782754067, + "loss": 1.458, + "step": 20029 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013806695724391388, + "loss": 1.5254, + "step": 20030 + }, + { + "epoch": 1.58, + "learning_rate": 0.0001380546367413058, + "loss": 1.4867, + "step": 20031 + }, + { + "epoch": 1.58, + "learning_rate": 0.0001380423163198002, + "loss": 1.5246, + "step": 20032 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013802999597948065, + "loss": 1.4774, + "step": 20033 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013801767572043085, + "loss": 1.4977, + "step": 20034 + }, + { + "epoch": 1.58, + "learning_rate": 0.0001380053555427344, + "loss": 1.5297, + "step": 20035 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013799303544647498, + "loss": 1.4892, + "step": 20036 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013798071543173624, + "loss": 1.5752, + "step": 20037 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013796839549860178, + "loss": 1.5224, + "step": 20038 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013795607564715532, + "loss": 1.5427, + "step": 20039 + }, + { + "epoch": 1.58, + "learning_rate": 0.0001379437558774804, + "loss": 1.5424, + "step": 20040 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013793143618966074, + "loss": 1.4934, + "step": 20041 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013791911658378, + "loss": 1.5355, + "step": 20042 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013790679705992176, + "loss": 1.5037, + "step": 20043 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013789447761816968, + "loss": 1.5126, + "step": 20044 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013788215825860748, + "loss": 1.4894, + "step": 20045 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013786983898131863, + "loss": 1.4777, + "step": 20046 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013785751978638697, + "loss": 1.5555, + "step": 20047 + }, + { + "epoch": 1.58, + "learning_rate": 0.000137845200673896, + "loss": 1.5172, + "step": 20048 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013783288164392944, + "loss": 1.589, + "step": 20049 + }, + { + "epoch": 1.58, + "learning_rate": 0.0001378205626965709, + "loss": 1.494, + "step": 20050 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013780824383190403, + "loss": 1.5343, + "step": 20051 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013779592505001244, + "loss": 1.497, + "step": 20052 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013778360635097975, + "loss": 1.5209, + "step": 20053 + }, + { + "epoch": 1.58, + "learning_rate": 0.0001377712877348897, + "loss": 1.5265, + "step": 20054 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013775896920182582, + "loss": 1.5503, + "step": 20055 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013774665075187177, + "loss": 1.5346, + "step": 20056 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013773433238511125, + "loss": 1.5093, + "step": 20057 + }, + { + "epoch": 1.58, + "learning_rate": 0.0001377220141016278, + "loss": 1.5039, + "step": 20058 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013770969590150511, + "loss": 1.5076, + "step": 20059 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013769737778482682, + "loss": 1.4595, + "step": 20060 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013768505975167653, + "loss": 1.4667, + "step": 20061 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013767274180213782, + "loss": 1.4997, + "step": 20062 + }, + { + "epoch": 1.58, + "learning_rate": 0.0001376604239362945, + "loss": 1.5088, + "step": 20063 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013764810615423003, + "loss": 1.5242, + "step": 20064 + }, + { + "epoch": 1.58, + "learning_rate": 0.0001376357884560281, + "loss": 1.477, + "step": 20065 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013762347084177238, + "loss": 1.547, + "step": 20066 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013761115331154645, + "loss": 1.5199, + "step": 20067 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013759883586543398, + "loss": 1.4988, + "step": 20068 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013758651850351853, + "loss": 1.521, + "step": 20069 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013757420122588378, + "loss": 1.4457, + "step": 20070 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013756188403261335, + "loss": 1.4913, + "step": 20071 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013754956692379084, + "loss": 1.4681, + "step": 20072 + }, + { + "epoch": 1.58, + "learning_rate": 0.0001375372498994999, + "loss": 1.5348, + "step": 20073 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013752493295982423, + "loss": 1.4427, + "step": 20074 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013751261610484732, + "loss": 1.491, + "step": 20075 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013750029933465288, + "loss": 1.5047, + "step": 20076 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013748798264932448, + "loss": 1.4605, + "step": 20077 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013747566604894573, + "loss": 1.4746, + "step": 20078 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013746334953360035, + "loss": 1.5238, + "step": 20079 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013745103310337193, + "loss": 1.5121, + "step": 20080 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013743871675834404, + "loss": 1.5404, + "step": 20081 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013742640049860033, + "loss": 1.507, + "step": 20082 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013741408432422445, + "loss": 1.5156, + "step": 20083 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013740176823529997, + "loss": 1.5321, + "step": 20084 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013738945223191052, + "loss": 1.463, + "step": 20085 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013737713631413977, + "loss": 1.5095, + "step": 20086 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013736482048207126, + "loss": 1.5016, + "step": 20087 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013735250473578868, + "loss": 1.541, + "step": 20088 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013734018907537562, + "loss": 1.4739, + "step": 20089 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013732787350091564, + "loss": 1.5181, + "step": 20090 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013731555801249244, + "loss": 1.5884, + "step": 20091 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013730324261018958, + "loss": 1.4833, + "step": 20092 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013729092729409067, + "loss": 1.5135, + "step": 20093 + }, + { + "epoch": 1.58, + "learning_rate": 0.0001372786120642794, + "loss": 1.4812, + "step": 20094 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013726629692083933, + "loss": 1.5356, + "step": 20095 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013725398186385405, + "loss": 1.6071, + "step": 20096 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013724166689340725, + "loss": 1.4319, + "step": 20097 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013722935200958245, + "loss": 1.5188, + "step": 20098 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013721703721246328, + "loss": 1.4454, + "step": 20099 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013720472250213343, + "loss": 1.4727, + "step": 20100 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013719240787867643, + "loss": 1.5238, + "step": 20101 + }, + { + "epoch": 1.58, + "learning_rate": 0.0001371800933421759, + "loss": 1.5203, + "step": 20102 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013716777889271549, + "loss": 1.4912, + "step": 20103 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013715546453037876, + "loss": 1.5386, + "step": 20104 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013714315025524938, + "loss": 1.5067, + "step": 20105 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013713083606741084, + "loss": 1.4938, + "step": 20106 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013711852196694684, + "loss": 1.5084, + "step": 20107 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013710620795394103, + "loss": 1.4439, + "step": 20108 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013709389402847684, + "loss": 1.5333, + "step": 20109 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013708158019063804, + "loss": 1.5317, + "step": 20110 + }, + { + "epoch": 1.58, + "learning_rate": 0.0001370692664405082, + "loss": 1.592, + "step": 20111 + }, + { + "epoch": 1.58, + "learning_rate": 0.0001370569527781709, + "loss": 1.5185, + "step": 20112 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013704463920370975, + "loss": 1.4867, + "step": 20113 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013703232571720834, + "loss": 1.55, + "step": 20114 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013702001231875033, + "loss": 1.5246, + "step": 20115 + }, + { + "epoch": 1.58, + "learning_rate": 0.0001370076990084192, + "loss": 1.4997, + "step": 20116 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013699538578629868, + "loss": 1.5017, + "step": 20117 + }, + { + "epoch": 1.58, + "learning_rate": 0.0001369830726524723, + "loss": 1.4847, + "step": 20118 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013697075960702364, + "loss": 1.5627, + "step": 20119 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013695844665003639, + "loss": 1.5376, + "step": 20120 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013694613378159402, + "loss": 1.5395, + "step": 20121 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013693382100178028, + "loss": 1.502, + "step": 20122 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013692150831067862, + "loss": 1.594, + "step": 20123 + }, + { + "epoch": 1.58, + "learning_rate": 0.0001369091957083727, + "loss": 1.4797, + "step": 20124 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013689688319494612, + "loss": 1.534, + "step": 20125 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013688457077048246, + "loss": 1.4709, + "step": 20126 + }, + { + "epoch": 1.58, + "learning_rate": 0.0001368722584350654, + "loss": 1.4951, + "step": 20127 + }, + { + "epoch": 1.58, + "learning_rate": 0.0001368599461887784, + "loss": 1.5206, + "step": 20128 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013684763403170515, + "loss": 1.4611, + "step": 20129 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013683532196392918, + "loss": 1.5094, + "step": 20130 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013682300998553413, + "loss": 1.4788, + "step": 20131 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013681069809660357, + "loss": 1.52, + "step": 20132 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013679838629722109, + "loss": 1.5786, + "step": 20133 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013678607458747028, + "loss": 1.4645, + "step": 20134 + }, + { + "epoch": 1.58, + "learning_rate": 0.0001367737629674347, + "loss": 1.4654, + "step": 20135 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013676145143719798, + "loss": 1.5074, + "step": 20136 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013674913999684374, + "loss": 1.4497, + "step": 20137 + }, + { + "epoch": 1.58, + "learning_rate": 0.0001367368286464555, + "loss": 1.5244, + "step": 20138 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013672451738611687, + "loss": 1.5213, + "step": 20139 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013671220621591147, + "loss": 1.5459, + "step": 20140 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013669989513592277, + "loss": 1.54, + "step": 20141 + }, + { + "epoch": 1.58, + "learning_rate": 0.0001366875841462345, + "loss": 1.4847, + "step": 20142 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013667527324693018, + "loss": 1.4372, + "step": 20143 + }, + { + "epoch": 1.58, + "learning_rate": 0.00013666296243809346, + "loss": 1.4852, + "step": 20144 + }, + { + "epoch": 1.59, + "learning_rate": 0.0001366506517198078, + "loss": 1.4399, + "step": 20145 + }, + { + "epoch": 1.59, + "learning_rate": 0.0001366383410921569, + "loss": 1.4999, + "step": 20146 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013662603055522422, + "loss": 1.5246, + "step": 20147 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013661372010909345, + "loss": 1.479, + "step": 20148 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013660140975384815, + "loss": 1.5485, + "step": 20149 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013658909948957186, + "loss": 1.5081, + "step": 20150 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013657678931634822, + "loss": 1.5027, + "step": 20151 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013656447923426072, + "loss": 1.5481, + "step": 20152 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013655216924339303, + "loss": 1.5341, + "step": 20153 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013653985934382868, + "loss": 1.4994, + "step": 20154 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013652754953565123, + "loss": 1.4655, + "step": 20155 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013651523981894427, + "loss": 1.5505, + "step": 20156 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013650293019379142, + "loss": 1.523, + "step": 20157 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013649062066027626, + "loss": 1.55, + "step": 20158 + }, + { + "epoch": 1.59, + "learning_rate": 0.0001364783112184823, + "loss": 1.5394, + "step": 20159 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013646600186849312, + "loss": 1.4749, + "step": 20160 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013645369261039238, + "loss": 1.5349, + "step": 20161 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013644138344426354, + "loss": 1.5237, + "step": 20162 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013642907437019024, + "loss": 1.5044, + "step": 20163 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013641676538825605, + "loss": 1.4957, + "step": 20164 + }, + { + "epoch": 1.59, + "learning_rate": 0.0001364044564985445, + "loss": 1.5243, + "step": 20165 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013639214770113923, + "loss": 1.5245, + "step": 20166 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013637983899612372, + "loss": 1.5074, + "step": 20167 + }, + { + "epoch": 1.59, + "learning_rate": 0.0001363675303835816, + "loss": 1.4888, + "step": 20168 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013635522186359646, + "loss": 1.5253, + "step": 20169 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013634291343625178, + "loss": 1.5057, + "step": 20170 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013633060510163125, + "loss": 1.465, + "step": 20171 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013631829685981824, + "loss": 1.5175, + "step": 20172 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013630598871089655, + "loss": 1.4737, + "step": 20173 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013629368065494962, + "loss": 1.516, + "step": 20174 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013628137269206106, + "loss": 1.487, + "step": 20175 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013626906482231435, + "loss": 1.4825, + "step": 20176 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013625675704579315, + "loss": 1.5055, + "step": 20177 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013624444936258102, + "loss": 1.4994, + "step": 20178 + }, + { + "epoch": 1.59, + "learning_rate": 0.0001362321417727614, + "loss": 1.5507, + "step": 20179 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013621983427641803, + "loss": 1.5156, + "step": 20180 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013620752687363433, + "loss": 1.4938, + "step": 20181 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013619521956449393, + "loss": 1.522, + "step": 20182 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013618291234908036, + "loss": 1.5327, + "step": 20183 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013617060522747718, + "loss": 1.4736, + "step": 20184 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013615829819976796, + "loss": 1.4883, + "step": 20185 + }, + { + "epoch": 1.59, + "learning_rate": 0.0001361459912660363, + "loss": 1.4989, + "step": 20186 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013613368442636566, + "loss": 1.4714, + "step": 20187 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013612137768083963, + "loss": 1.5382, + "step": 20188 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013610907102954182, + "loss": 1.5072, + "step": 20189 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013609676447255578, + "loss": 1.4742, + "step": 20190 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013608445800996502, + "loss": 1.5137, + "step": 20191 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013607215164185312, + "loss": 1.5171, + "step": 20192 + }, + { + "epoch": 1.59, + "learning_rate": 0.0001360598453683036, + "loss": 1.52, + "step": 20193 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013604753918940006, + "loss": 1.4927, + "step": 20194 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013603523310522602, + "loss": 1.5349, + "step": 20195 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013602292711586503, + "loss": 1.5386, + "step": 20196 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013601062122140065, + "loss": 1.534, + "step": 20197 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013599831542191647, + "loss": 1.5014, + "step": 20198 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013598600971749595, + "loss": 1.4794, + "step": 20199 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013597370410822277, + "loss": 1.4526, + "step": 20200 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013596139859418032, + "loss": 1.4792, + "step": 20201 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013594909317545225, + "loss": 1.4897, + "step": 20202 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013593678785212202, + "loss": 1.5052, + "step": 20203 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013592448262427336, + "loss": 1.5789, + "step": 20204 + }, + { + "epoch": 1.59, + "learning_rate": 0.0001359121774919896, + "loss": 1.5171, + "step": 20205 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013589987245535442, + "loss": 1.5611, + "step": 20206 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013588756751445135, + "loss": 1.5044, + "step": 20207 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013587526266936386, + "loss": 1.5364, + "step": 20208 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013586295792017555, + "loss": 1.5361, + "step": 20209 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013585065326697, + "loss": 1.5091, + "step": 20210 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013583834870983067, + "loss": 1.524, + "step": 20211 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013582604424884116, + "loss": 1.444, + "step": 20212 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013581373988408497, + "loss": 1.4891, + "step": 20213 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013580143561564564, + "loss": 1.5714, + "step": 20214 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013578913144360677, + "loss": 1.4947, + "step": 20215 + }, + { + "epoch": 1.59, + "learning_rate": 0.0001357768273680518, + "loss": 1.5416, + "step": 20216 + }, + { + "epoch": 1.59, + "learning_rate": 0.0001357645233890644, + "loss": 1.5265, + "step": 20217 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013575221950672798, + "loss": 1.5373, + "step": 20218 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013573991572112608, + "loss": 1.4891, + "step": 20219 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013572761203234232, + "loss": 1.4997, + "step": 20220 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013571530844046022, + "loss": 1.4879, + "step": 20221 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013570300494556328, + "loss": 1.5023, + "step": 20222 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013569070154773505, + "loss": 1.5475, + "step": 20223 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013567839824705908, + "loss": 1.505, + "step": 20224 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013566609504361886, + "loss": 1.4703, + "step": 20225 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013565379193749793, + "loss": 1.4899, + "step": 20226 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013564148892877988, + "loss": 1.5053, + "step": 20227 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013562918601754817, + "loss": 1.5104, + "step": 20228 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013561688320388638, + "loss": 1.4796, + "step": 20229 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013560458048787798, + "loss": 1.4553, + "step": 20230 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013559227786960653, + "loss": 1.474, + "step": 20231 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013557997534915562, + "loss": 1.477, + "step": 20232 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013556767292660865, + "loss": 1.5818, + "step": 20233 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013555537060204925, + "loss": 1.5021, + "step": 20234 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013554306837556084, + "loss": 1.5108, + "step": 20235 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013553076624722713, + "loss": 1.5081, + "step": 20236 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013551846421713148, + "loss": 1.4822, + "step": 20237 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013550616228535743, + "loss": 1.5389, + "step": 20238 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013549386045198864, + "loss": 1.525, + "step": 20239 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013548155871710845, + "loss": 1.5017, + "step": 20240 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013546925708080054, + "loss": 1.5565, + "step": 20241 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013545695554314827, + "loss": 1.498, + "step": 20242 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013544465410423527, + "loss": 1.5239, + "step": 20243 + }, + { + "epoch": 1.59, + "learning_rate": 0.0001354323527641451, + "loss": 1.4863, + "step": 20244 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013542005152296114, + "loss": 1.484, + "step": 20245 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013540775038076703, + "loss": 1.5263, + "step": 20246 + }, + { + "epoch": 1.59, + "learning_rate": 0.0001353954493376462, + "loss": 1.4647, + "step": 20247 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013538314839368223, + "loss": 1.5547, + "step": 20248 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013537084754895864, + "loss": 1.5202, + "step": 20249 + }, + { + "epoch": 1.59, + "learning_rate": 0.0001353585468035589, + "loss": 1.5005, + "step": 20250 + }, + { + "epoch": 1.59, + "learning_rate": 0.0001353462461575665, + "loss": 1.4579, + "step": 20251 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013533394561106505, + "loss": 1.5178, + "step": 20252 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013532164516413803, + "loss": 1.563, + "step": 20253 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013530934481686892, + "loss": 1.4895, + "step": 20254 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013529704456934123, + "loss": 1.5513, + "step": 20255 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013528474442163854, + "loss": 1.512, + "step": 20256 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013527244437384428, + "loss": 1.5263, + "step": 20257 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013526014442604204, + "loss": 1.52, + "step": 20258 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013524784457831526, + "loss": 1.5247, + "step": 20259 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013523554483074745, + "loss": 1.4563, + "step": 20260 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013522324518342217, + "loss": 1.4799, + "step": 20261 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013521094563642287, + "loss": 1.5086, + "step": 20262 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013519864618983314, + "loss": 1.4934, + "step": 20263 + }, + { + "epoch": 1.59, + "learning_rate": 0.0001351863468437364, + "loss": 1.5448, + "step": 20264 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013517404759821617, + "loss": 1.4388, + "step": 20265 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013516174845335598, + "loss": 1.5099, + "step": 20266 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013514944940923933, + "loss": 1.5241, + "step": 20267 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013513715046594978, + "loss": 1.4608, + "step": 20268 + }, + { + "epoch": 1.59, + "learning_rate": 0.0001351248516235707, + "loss": 1.4341, + "step": 20269 + }, + { + "epoch": 1.59, + "learning_rate": 0.00013511255288218576, + "loss": 1.5296, + "step": 20270 + }, + { + "epoch": 1.59, + "learning_rate": 0.0001351002542418783, + "loss": 1.5151, + "step": 20271 + }, + { + "epoch": 1.6, + "learning_rate": 0.0001350879557027319, + "loss": 1.5172, + "step": 20272 + }, + { + "epoch": 1.6, + "learning_rate": 0.0001350756572648301, + "loss": 1.5292, + "step": 20273 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013506335892825628, + "loss": 1.4729, + "step": 20274 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013505106069309407, + "loss": 1.531, + "step": 20275 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013503876255942688, + "loss": 1.4994, + "step": 20276 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013502646452733823, + "loss": 1.4935, + "step": 20277 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013501416659691165, + "loss": 1.5136, + "step": 20278 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013500186876823058, + "loss": 1.5178, + "step": 20279 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013498957104137854, + "loss": 1.522, + "step": 20280 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013497727341643906, + "loss": 1.4833, + "step": 20281 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013496497589349555, + "loss": 1.4914, + "step": 20282 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013495267847263157, + "loss": 1.5221, + "step": 20283 + }, + { + "epoch": 1.6, + "learning_rate": 0.0001349403811539306, + "loss": 1.487, + "step": 20284 + }, + { + "epoch": 1.6, + "learning_rate": 0.0001349280839374762, + "loss": 1.5665, + "step": 20285 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013491578682335172, + "loss": 1.5458, + "step": 20286 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013490348981164078, + "loss": 1.5223, + "step": 20287 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013489119290242677, + "loss": 1.5478, + "step": 20288 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013487889609579322, + "loss": 1.5165, + "step": 20289 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013486659939182367, + "loss": 1.5209, + "step": 20290 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013485430279060152, + "loss": 1.5295, + "step": 20291 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013484200629221028, + "loss": 1.4568, + "step": 20292 + }, + { + "epoch": 1.6, + "learning_rate": 0.0001348297098967335, + "loss": 1.4755, + "step": 20293 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013481741360425457, + "loss": 1.5107, + "step": 20294 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013480511741485707, + "loss": 1.5039, + "step": 20295 + }, + { + "epoch": 1.6, + "learning_rate": 0.0001347928213286244, + "loss": 1.5132, + "step": 20296 + }, + { + "epoch": 1.6, + "learning_rate": 0.0001347805253456401, + "loss": 1.5393, + "step": 20297 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013476822946598756, + "loss": 1.5013, + "step": 20298 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013475593368975043, + "loss": 1.508, + "step": 20299 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013474363801701207, + "loss": 1.5286, + "step": 20300 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013473134244785598, + "loss": 1.4986, + "step": 20301 + }, + { + "epoch": 1.6, + "learning_rate": 0.0001347190469823657, + "loss": 1.4826, + "step": 20302 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013470675162062458, + "loss": 1.5666, + "step": 20303 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013469445636271626, + "loss": 1.468, + "step": 20304 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013468216120872406, + "loss": 1.5207, + "step": 20305 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013466986615873157, + "loss": 1.5489, + "step": 20306 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013465757121282224, + "loss": 1.4843, + "step": 20307 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013464527637107947, + "loss": 1.5601, + "step": 20308 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013463298163358687, + "loss": 1.5315, + "step": 20309 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013462068700042783, + "loss": 1.4437, + "step": 20310 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013460839247168583, + "loss": 1.5685, + "step": 20311 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013459609804744436, + "loss": 1.5703, + "step": 20312 + }, + { + "epoch": 1.6, + "learning_rate": 0.0001345838037277868, + "loss": 1.5057, + "step": 20313 + }, + { + "epoch": 1.6, + "learning_rate": 0.0001345715095127968, + "loss": 1.5014, + "step": 20314 + }, + { + "epoch": 1.6, + "learning_rate": 0.0001345592154025577, + "loss": 1.4878, + "step": 20315 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013454692139715303, + "loss": 1.5056, + "step": 20316 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013453462749666624, + "loss": 1.5197, + "step": 20317 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013452233370118077, + "loss": 1.5381, + "step": 20318 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013451004001078013, + "loss": 1.5382, + "step": 20319 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013449774642554778, + "loss": 1.5549, + "step": 20320 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013448545294556715, + "loss": 1.5151, + "step": 20321 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013447315957092177, + "loss": 1.5375, + "step": 20322 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013446086630169502, + "loss": 1.4846, + "step": 20323 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013444857313797044, + "loss": 1.5481, + "step": 20324 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013443628007983146, + "loss": 1.4613, + "step": 20325 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013442398712736154, + "loss": 1.5137, + "step": 20326 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013441169428064418, + "loss": 1.5386, + "step": 20327 + }, + { + "epoch": 1.6, + "learning_rate": 0.0001343994015397628, + "loss": 1.5367, + "step": 20328 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013438710890480084, + "loss": 1.496, + "step": 20329 + }, + { + "epoch": 1.6, + "learning_rate": 0.0001343748163758418, + "loss": 1.5233, + "step": 20330 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013436252395296919, + "loss": 1.5818, + "step": 20331 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013435023163626636, + "loss": 1.5034, + "step": 20332 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013433793942581687, + "loss": 1.479, + "step": 20333 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013432564732170408, + "loss": 1.5003, + "step": 20334 + }, + { + "epoch": 1.6, + "learning_rate": 0.0001343133553240115, + "loss": 1.5257, + "step": 20335 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013430106343282263, + "loss": 1.5353, + "step": 20336 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013428877164822084, + "loss": 1.5116, + "step": 20337 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013427647997028963, + "loss": 1.5062, + "step": 20338 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013426418839911243, + "loss": 1.479, + "step": 20339 + }, + { + "epoch": 1.6, + "learning_rate": 0.0001342518969347727, + "loss": 1.4882, + "step": 20340 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013423960557735397, + "loss": 1.4976, + "step": 20341 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013422731432693956, + "loss": 1.5487, + "step": 20342 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013421502318361296, + "loss": 1.5227, + "step": 20343 + }, + { + "epoch": 1.6, + "learning_rate": 0.0001342027321474577, + "loss": 1.4565, + "step": 20344 + }, + { + "epoch": 1.6, + "learning_rate": 0.0001341904412185571, + "loss": 1.5364, + "step": 20345 + }, + { + "epoch": 1.6, + "learning_rate": 0.0001341781503969947, + "loss": 1.4695, + "step": 20346 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013416585968285393, + "loss": 1.4881, + "step": 20347 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013415356907621828, + "loss": 1.509, + "step": 20348 + }, + { + "epoch": 1.6, + "learning_rate": 0.0001341412785771711, + "loss": 1.4907, + "step": 20349 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013412898818579593, + "loss": 1.499, + "step": 20350 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013411669790217617, + "loss": 1.5189, + "step": 20351 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013410440772639522, + "loss": 1.5551, + "step": 20352 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013409211765853663, + "loss": 1.4816, + "step": 20353 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013407982769868374, + "loss": 1.5271, + "step": 20354 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013406753784692003, + "loss": 1.5162, + "step": 20355 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013405524810332898, + "loss": 1.5438, + "step": 20356 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013404295846799398, + "loss": 1.452, + "step": 20357 + }, + { + "epoch": 1.6, + "learning_rate": 0.0001340306689409985, + "loss": 1.4985, + "step": 20358 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013401837952242593, + "loss": 1.5011, + "step": 20359 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013400609021235974, + "loss": 1.4968, + "step": 20360 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013399380101088336, + "loss": 1.4815, + "step": 20361 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013398151191808028, + "loss": 1.5239, + "step": 20362 + }, + { + "epoch": 1.6, + "learning_rate": 0.0001339692229340339, + "loss": 1.5073, + "step": 20363 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013395693405882762, + "loss": 1.5087, + "step": 20364 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013394464529254492, + "loss": 1.4706, + "step": 20365 + }, + { + "epoch": 1.6, + "learning_rate": 0.0001339323566352692, + "loss": 1.5349, + "step": 20366 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013392006808708392, + "loss": 1.5449, + "step": 20367 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013390777964807253, + "loss": 1.4699, + "step": 20368 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013389549131831842, + "loss": 1.5282, + "step": 20369 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013388320309790506, + "loss": 1.4879, + "step": 20370 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013387091498691584, + "loss": 1.5278, + "step": 20371 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013385862698543418, + "loss": 1.4788, + "step": 20372 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013384633909354357, + "loss": 1.5726, + "step": 20373 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013383405131132739, + "loss": 1.4838, + "step": 20374 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013382176363886908, + "loss": 1.5621, + "step": 20375 + }, + { + "epoch": 1.6, + "learning_rate": 0.000133809476076252, + "loss": 1.4467, + "step": 20376 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013379718862355973, + "loss": 1.503, + "step": 20377 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013378490128087558, + "loss": 1.4803, + "step": 20378 + }, + { + "epoch": 1.6, + "learning_rate": 0.000133772614048283, + "loss": 1.5404, + "step": 20379 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013376032692586544, + "loss": 1.4766, + "step": 20380 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013374803991370629, + "loss": 1.4931, + "step": 20381 + }, + { + "epoch": 1.6, + "learning_rate": 0.000133735753011889, + "loss": 1.4971, + "step": 20382 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013372346622049692, + "loss": 1.505, + "step": 20383 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013371117953961354, + "loss": 1.5115, + "step": 20384 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013369889296932229, + "loss": 1.4854, + "step": 20385 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013368660650970652, + "loss": 1.4961, + "step": 20386 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013367432016084973, + "loss": 1.4919, + "step": 20387 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013366203392283527, + "loss": 1.4693, + "step": 20388 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013364974779574658, + "loss": 1.5126, + "step": 20389 + }, + { + "epoch": 1.6, + "learning_rate": 0.0001336374617796671, + "loss": 1.4486, + "step": 20390 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013362517587468023, + "loss": 1.4843, + "step": 20391 + }, + { + "epoch": 1.6, + "learning_rate": 0.0001336128900808693, + "loss": 1.5067, + "step": 20392 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013360060439831785, + "loss": 1.5117, + "step": 20393 + }, + { + "epoch": 1.6, + "learning_rate": 0.0001335883188271093, + "loss": 1.4951, + "step": 20394 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013357603336732694, + "loss": 1.4696, + "step": 20395 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013356374801905429, + "loss": 1.5101, + "step": 20396 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013355146278237474, + "loss": 1.5315, + "step": 20397 + }, + { + "epoch": 1.6, + "learning_rate": 0.00013353917765737163, + "loss": 1.4699, + "step": 20398 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013352689264412845, + "loss": 1.5239, + "step": 20399 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013351460774272856, + "loss": 1.5149, + "step": 20400 + }, + { + "epoch": 1.61, + "learning_rate": 0.0001335023229532554, + "loss": 1.4676, + "step": 20401 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013349003827579236, + "loss": 1.5279, + "step": 20402 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013347775371042286, + "loss": 1.4937, + "step": 20403 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013346546925723028, + "loss": 1.4925, + "step": 20404 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013345318491629805, + "loss": 1.5406, + "step": 20405 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013344090068770955, + "loss": 1.5307, + "step": 20406 + }, + { + "epoch": 1.61, + "learning_rate": 0.0001334286165715482, + "loss": 1.487, + "step": 20407 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013341633256789735, + "loss": 1.4442, + "step": 20408 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013340404867684052, + "loss": 1.5029, + "step": 20409 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013339176489846101, + "loss": 1.4927, + "step": 20410 + }, + { + "epoch": 1.61, + "learning_rate": 0.0001333794812328423, + "loss": 1.5593, + "step": 20411 + }, + { + "epoch": 1.61, + "learning_rate": 0.0001333671976800677, + "loss": 1.5502, + "step": 20412 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013335491424022064, + "loss": 1.5452, + "step": 20413 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013334263091338455, + "loss": 1.5532, + "step": 20414 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013333034769964276, + "loss": 1.5186, + "step": 20415 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013331806459907877, + "loss": 1.5204, + "step": 20416 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013330578161177588, + "loss": 1.4647, + "step": 20417 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013329349873781752, + "loss": 1.5052, + "step": 20418 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013328121597728712, + "loss": 1.5043, + "step": 20419 + }, + { + "epoch": 1.61, + "learning_rate": 0.000133268933330268, + "loss": 1.5222, + "step": 20420 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013325665079684358, + "loss": 1.4711, + "step": 20421 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013324436837709733, + "loss": 1.5061, + "step": 20422 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013323208607111248, + "loss": 1.508, + "step": 20423 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013321980387897254, + "loss": 1.497, + "step": 20424 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013320752180076087, + "loss": 1.5778, + "step": 20425 + }, + { + "epoch": 1.61, + "learning_rate": 0.0001331952398365609, + "loss": 1.5328, + "step": 20426 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013318295798645595, + "loss": 1.4575, + "step": 20427 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013317067625052945, + "loss": 1.4943, + "step": 20428 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013315839462886474, + "loss": 1.4828, + "step": 20429 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013314611312154525, + "loss": 1.4555, + "step": 20430 + }, + { + "epoch": 1.61, + "learning_rate": 0.0001331338317286544, + "loss": 1.4975, + "step": 20431 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013312155045027546, + "loss": 1.5701, + "step": 20432 + }, + { + "epoch": 1.61, + "learning_rate": 0.0001331092692864919, + "loss": 1.4961, + "step": 20433 + }, + { + "epoch": 1.61, + "learning_rate": 0.0001330969882373871, + "loss": 1.5192, + "step": 20434 + }, + { + "epoch": 1.61, + "learning_rate": 0.0001330847073030444, + "loss": 1.5318, + "step": 20435 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013307242648354724, + "loss": 1.4979, + "step": 20436 + }, + { + "epoch": 1.61, + "learning_rate": 0.0001330601457789789, + "loss": 1.4981, + "step": 20437 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013304786518942286, + "loss": 1.458, + "step": 20438 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013303558471496242, + "loss": 1.5021, + "step": 20439 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013302330435568103, + "loss": 1.4848, + "step": 20440 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013301102411166204, + "loss": 1.4912, + "step": 20441 + }, + { + "epoch": 1.61, + "learning_rate": 0.0001329987439829888, + "loss": 1.5101, + "step": 20442 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013298646396974473, + "loss": 1.5011, + "step": 20443 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013297418407201317, + "loss": 1.5129, + "step": 20444 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013296190428987753, + "loss": 1.4429, + "step": 20445 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013294962462342112, + "loss": 1.5352, + "step": 20446 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013293734507272738, + "loss": 1.5284, + "step": 20447 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013292506563787964, + "loss": 1.4904, + "step": 20448 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013291278631896128, + "loss": 1.4739, + "step": 20449 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013290050711605564, + "loss": 1.5073, + "step": 20450 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013288822802924618, + "loss": 1.4637, + "step": 20451 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013287594905861616, + "loss": 1.5609, + "step": 20452 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013286367020424905, + "loss": 1.4938, + "step": 20453 + }, + { + "epoch": 1.61, + "learning_rate": 0.0001328513914662281, + "loss": 1.547, + "step": 20454 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013283911284463673, + "loss": 1.5346, + "step": 20455 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013282683433955836, + "loss": 1.4809, + "step": 20456 + }, + { + "epoch": 1.61, + "learning_rate": 0.0001328145559510763, + "loss": 1.4952, + "step": 20457 + }, + { + "epoch": 1.61, + "learning_rate": 0.0001328022776792739, + "loss": 1.5049, + "step": 20458 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013278999952423456, + "loss": 1.5244, + "step": 20459 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013277772148604167, + "loss": 1.4631, + "step": 20460 + }, + { + "epoch": 1.61, + "learning_rate": 0.0001327654435647785, + "loss": 1.5093, + "step": 20461 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013275316576052843, + "loss": 1.4791, + "step": 20462 + }, + { + "epoch": 1.61, + "learning_rate": 0.0001327408880733749, + "loss": 1.5169, + "step": 20463 + }, + { + "epoch": 1.61, + "learning_rate": 0.0001327286105034012, + "loss": 1.4896, + "step": 20464 + }, + { + "epoch": 1.61, + "learning_rate": 0.0001327163330506907, + "loss": 1.5095, + "step": 20465 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013270405571532676, + "loss": 1.5483, + "step": 20466 + }, + { + "epoch": 1.61, + "learning_rate": 0.0001326917784973927, + "loss": 1.5154, + "step": 20467 + }, + { + "epoch": 1.61, + "learning_rate": 0.000132679501396972, + "loss": 1.5143, + "step": 20468 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013266722441414785, + "loss": 1.4992, + "step": 20469 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013265494754900376, + "loss": 1.533, + "step": 20470 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013264267080162286, + "loss": 1.5055, + "step": 20471 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013263039417208878, + "loss": 1.4789, + "step": 20472 + }, + { + "epoch": 1.61, + "learning_rate": 0.0001326181176604847, + "loss": 1.5, + "step": 20473 + }, + { + "epoch": 1.61, + "learning_rate": 0.000132605841266894, + "loss": 1.4974, + "step": 20474 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013259356499140001, + "loss": 1.4971, + "step": 20475 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013258128883408618, + "loss": 1.5117, + "step": 20476 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013256901279503575, + "loss": 1.5582, + "step": 20477 + }, + { + "epoch": 1.61, + "learning_rate": 0.0001325567368743321, + "loss": 1.5215, + "step": 20478 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013254446107205858, + "loss": 1.4764, + "step": 20479 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013253218538829853, + "loss": 1.5552, + "step": 20480 + }, + { + "epoch": 1.61, + "learning_rate": 0.0001325199098231353, + "loss": 1.5506, + "step": 20481 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013250763437665228, + "loss": 1.5052, + "step": 20482 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013249535904893273, + "loss": 1.5554, + "step": 20483 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013248308384006003, + "loss": 1.5495, + "step": 20484 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013247080875011756, + "loss": 1.5631, + "step": 20485 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013245853377918856, + "loss": 1.5014, + "step": 20486 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013244625892735646, + "loss": 1.4921, + "step": 20487 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013243398419470457, + "loss": 1.589, + "step": 20488 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013242170958131628, + "loss": 1.554, + "step": 20489 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013240943508727486, + "loss": 1.5016, + "step": 20490 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013239716071266364, + "loss": 1.4586, + "step": 20491 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013238488645756605, + "loss": 1.5262, + "step": 20492 + }, + { + "epoch": 1.61, + "learning_rate": 0.0001323726123220653, + "loss": 1.5285, + "step": 20493 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013236033830624482, + "loss": 1.5175, + "step": 20494 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013234806441018786, + "loss": 1.508, + "step": 20495 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013233579063397783, + "loss": 1.476, + "step": 20496 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013232351697769806, + "loss": 1.4827, + "step": 20497 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013231124344143184, + "loss": 1.5303, + "step": 20498 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013229897002526252, + "loss": 1.5045, + "step": 20499 + }, + { + "epoch": 1.61, + "learning_rate": 0.0001322866967292734, + "loss": 1.5453, + "step": 20500 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013227442355354783, + "loss": 1.542, + "step": 20501 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013226215049816912, + "loss": 1.5094, + "step": 20502 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013224987756322066, + "loss": 1.4968, + "step": 20503 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013223760474878574, + "loss": 1.5106, + "step": 20504 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013222533205494767, + "loss": 1.4636, + "step": 20505 + }, + { + "epoch": 1.61, + "learning_rate": 0.0001322130594817898, + "loss": 1.5307, + "step": 20506 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013220078702939545, + "loss": 1.454, + "step": 20507 + }, + { + "epoch": 1.61, + "learning_rate": 0.0001321885146978479, + "loss": 1.5118, + "step": 20508 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013217624248723053, + "loss": 1.4582, + "step": 20509 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013216397039762662, + "loss": 1.4519, + "step": 20510 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013215169842911955, + "loss": 1.5359, + "step": 20511 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013213942658179254, + "loss": 1.5546, + "step": 20512 + }, + { + "epoch": 1.61, + "learning_rate": 0.000132127154855729, + "loss": 1.5124, + "step": 20513 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013211488325101222, + "loss": 1.4974, + "step": 20514 + }, + { + "epoch": 1.61, + "learning_rate": 0.0001321026117677255, + "loss": 1.4694, + "step": 20515 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013209034040595214, + "loss": 1.5241, + "step": 20516 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013207806916577556, + "loss": 1.5283, + "step": 20517 + }, + { + "epoch": 1.61, + "learning_rate": 0.0001320657980472789, + "loss": 1.4653, + "step": 20518 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013205352705054563, + "loss": 1.5205, + "step": 20519 + }, + { + "epoch": 1.61, + "learning_rate": 0.000132041256175659, + "loss": 1.4989, + "step": 20520 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013202898542270236, + "loss": 1.4633, + "step": 20521 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013201671479175895, + "loss": 1.5146, + "step": 20522 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013200444428291218, + "loss": 1.4956, + "step": 20523 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013199217389624527, + "loss": 1.5107, + "step": 20524 + }, + { + "epoch": 1.61, + "learning_rate": 0.00013197990363184153, + "loss": 1.5309, + "step": 20525 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013196763348978434, + "loss": 1.471, + "step": 20526 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013195536347015697, + "loss": 1.5325, + "step": 20527 + }, + { + "epoch": 1.62, + "learning_rate": 0.0001319430935730427, + "loss": 1.4645, + "step": 20528 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013193082379852489, + "loss": 1.4787, + "step": 20529 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013191855414668678, + "loss": 1.4947, + "step": 20530 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013190628461761173, + "loss": 1.4786, + "step": 20531 + }, + { + "epoch": 1.62, + "learning_rate": 0.000131894015211383, + "loss": 1.5111, + "step": 20532 + }, + { + "epoch": 1.62, + "learning_rate": 0.0001318817459280839, + "loss": 1.5323, + "step": 20533 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013186947676779777, + "loss": 1.4699, + "step": 20534 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013185720773060792, + "loss": 1.4665, + "step": 20535 + }, + { + "epoch": 1.62, + "learning_rate": 0.0001318449388165976, + "loss": 1.4901, + "step": 20536 + }, + { + "epoch": 1.62, + "learning_rate": 0.0001318326700258501, + "loss": 1.4579, + "step": 20537 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013182040135844878, + "loss": 1.4864, + "step": 20538 + }, + { + "epoch": 1.62, + "learning_rate": 0.0001318081328144769, + "loss": 1.47, + "step": 20539 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013179586439401774, + "loss": 1.5123, + "step": 20540 + }, + { + "epoch": 1.62, + "learning_rate": 0.0001317835960971546, + "loss": 1.4549, + "step": 20541 + }, + { + "epoch": 1.62, + "learning_rate": 0.0001317713279239708, + "loss": 1.4728, + "step": 20542 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013175905987454966, + "loss": 1.5168, + "step": 20543 + }, + { + "epoch": 1.62, + "learning_rate": 0.0001317467919489744, + "loss": 1.5244, + "step": 20544 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013173452414732837, + "loss": 1.5006, + "step": 20545 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013172225646969484, + "loss": 1.5187, + "step": 20546 + }, + { + "epoch": 1.62, + "learning_rate": 0.0001317099889161571, + "loss": 1.5103, + "step": 20547 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013169772148679846, + "loss": 1.5107, + "step": 20548 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013168545418170208, + "loss": 1.5296, + "step": 20549 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013167318700095146, + "loss": 1.4712, + "step": 20550 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013166091994462977, + "loss": 1.5238, + "step": 20551 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013164865301282036, + "loss": 1.4975, + "step": 20552 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013163638620560642, + "loss": 1.5645, + "step": 20553 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013162411952307126, + "loss": 1.5504, + "step": 20554 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013161185296529826, + "loss": 1.4981, + "step": 20555 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013159958653237056, + "loss": 1.5108, + "step": 20556 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013158732022437155, + "loss": 1.4786, + "step": 20557 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013157505404138447, + "loss": 1.4833, + "step": 20558 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013156278798349258, + "loss": 1.4699, + "step": 20559 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013155052205077923, + "loss": 1.539, + "step": 20560 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013153825624332764, + "loss": 1.5071, + "step": 20561 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013152599056122106, + "loss": 1.5011, + "step": 20562 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013151372500454288, + "loss": 1.5714, + "step": 20563 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013150145957337625, + "loss": 1.4975, + "step": 20564 + }, + { + "epoch": 1.62, + "learning_rate": 0.0001314891942678045, + "loss": 1.5063, + "step": 20565 + }, + { + "epoch": 1.62, + "learning_rate": 0.0001314769290879109, + "loss": 1.5336, + "step": 20566 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013146466403377878, + "loss": 1.5494, + "step": 20567 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013145239910549133, + "loss": 1.4788, + "step": 20568 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013144013430313188, + "loss": 1.558, + "step": 20569 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013142786962678366, + "loss": 1.5142, + "step": 20570 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013141560507652994, + "loss": 1.4681, + "step": 20571 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013140334065245404, + "loss": 1.4632, + "step": 20572 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013139107635463915, + "loss": 1.5309, + "step": 20573 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013137881218316862, + "loss": 1.525, + "step": 20574 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013136654813812568, + "loss": 1.4622, + "step": 20575 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013135428421959356, + "loss": 1.5008, + "step": 20576 + }, + { + "epoch": 1.62, + "learning_rate": 0.0001313420204276556, + "loss": 1.5084, + "step": 20577 + }, + { + "epoch": 1.62, + "learning_rate": 0.000131329756762395, + "loss": 1.4963, + "step": 20578 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013131749322389507, + "loss": 1.5415, + "step": 20579 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013130522981223903, + "loss": 1.5435, + "step": 20580 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013129296652751013, + "loss": 1.5375, + "step": 20581 + }, + { + "epoch": 1.62, + "learning_rate": 0.0001312807033697917, + "loss": 1.508, + "step": 20582 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013126844033916696, + "loss": 1.488, + "step": 20583 + }, + { + "epoch": 1.62, + "learning_rate": 0.0001312561774357192, + "loss": 1.4972, + "step": 20584 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013124391465953162, + "loss": 1.4778, + "step": 20585 + }, + { + "epoch": 1.62, + "learning_rate": 0.0001312316520106875, + "loss": 1.4964, + "step": 20586 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013121938948927015, + "loss": 1.5318, + "step": 20587 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013120712709536276, + "loss": 1.494, + "step": 20588 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013119486482904863, + "loss": 1.5235, + "step": 20589 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013118260269041096, + "loss": 1.4954, + "step": 20590 + }, + { + "epoch": 1.62, + "learning_rate": 0.000131170340679533, + "loss": 1.5289, + "step": 20591 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013115807879649811, + "loss": 1.4978, + "step": 20592 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013114581704138943, + "loss": 1.5085, + "step": 20593 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013113355541429026, + "loss": 1.534, + "step": 20594 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013112129391528381, + "loss": 1.5233, + "step": 20595 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013110903254445335, + "loss": 1.4957, + "step": 20596 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013109677130188215, + "loss": 1.48, + "step": 20597 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013108451018765347, + "loss": 1.5104, + "step": 20598 + }, + { + "epoch": 1.62, + "learning_rate": 0.0001310722492018505, + "loss": 1.5172, + "step": 20599 + }, + { + "epoch": 1.62, + "learning_rate": 0.0001310599883445565, + "loss": 1.491, + "step": 20600 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013104772761585477, + "loss": 1.4985, + "step": 20601 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013103546701582846, + "loss": 1.4649, + "step": 20602 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013102320654456088, + "loss": 1.5383, + "step": 20603 + }, + { + "epoch": 1.62, + "learning_rate": 0.0001310109462021353, + "loss": 1.5311, + "step": 20604 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013099868598863486, + "loss": 1.4887, + "step": 20605 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013098642590414288, + "loss": 1.5056, + "step": 20606 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013097416594874258, + "loss": 1.5266, + "step": 20607 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013096190612251718, + "loss": 1.4953, + "step": 20608 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013094964642554997, + "loss": 1.465, + "step": 20609 + }, + { + "epoch": 1.62, + "learning_rate": 0.0001309373868579241, + "loss": 1.5383, + "step": 20610 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013092512741972288, + "loss": 1.5185, + "step": 20611 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013091286811102944, + "loss": 1.534, + "step": 20612 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013090060893192716, + "loss": 1.5046, + "step": 20613 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013088834988249923, + "loss": 1.5291, + "step": 20614 + }, + { + "epoch": 1.62, + "learning_rate": 0.0001308760909628288, + "loss": 1.5555, + "step": 20615 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013086383217299924, + "loss": 1.5326, + "step": 20616 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013085157351309362, + "loss": 1.5033, + "step": 20617 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013083931498319531, + "loss": 1.5278, + "step": 20618 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013082705658338742, + "loss": 1.4493, + "step": 20619 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013081479831375328, + "loss": 1.5232, + "step": 20620 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013080254017437605, + "loss": 1.513, + "step": 20621 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013079028216533899, + "loss": 1.4921, + "step": 20622 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013077802428672531, + "loss": 1.5088, + "step": 20623 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013076576653861825, + "loss": 1.5161, + "step": 20624 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013075350892110098, + "loss": 1.5149, + "step": 20625 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013074125143425682, + "loss": 1.507, + "step": 20626 + }, + { + "epoch": 1.62, + "learning_rate": 0.0001307289940781689, + "loss": 1.4611, + "step": 20627 + }, + { + "epoch": 1.62, + "learning_rate": 0.0001307167368529204, + "loss": 1.5054, + "step": 20628 + }, + { + "epoch": 1.62, + "learning_rate": 0.0001307044797585947, + "loss": 1.5079, + "step": 20629 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013069222279527495, + "loss": 1.5101, + "step": 20630 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013067996596304433, + "loss": 1.5098, + "step": 20631 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013066770926198608, + "loss": 1.4411, + "step": 20632 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013065545269218344, + "loss": 1.4711, + "step": 20633 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013064319625371955, + "loss": 1.5212, + "step": 20634 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013063093994667774, + "loss": 1.5342, + "step": 20635 + }, + { + "epoch": 1.62, + "learning_rate": 0.0001306186837711411, + "loss": 1.5081, + "step": 20636 + }, + { + "epoch": 1.62, + "learning_rate": 0.0001306064277271929, + "loss": 1.5608, + "step": 20637 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013059417181491642, + "loss": 1.5401, + "step": 20638 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013058191603439474, + "loss": 1.5205, + "step": 20639 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013056966038571118, + "loss": 1.5509, + "step": 20640 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013055740486894886, + "loss": 1.4663, + "step": 20641 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013054514948419103, + "loss": 1.5211, + "step": 20642 + }, + { + "epoch": 1.62, + "learning_rate": 0.0001305328942315209, + "loss": 1.5028, + "step": 20643 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013052063911102166, + "loss": 1.4876, + "step": 20644 + }, + { + "epoch": 1.62, + "learning_rate": 0.0001305083841227766, + "loss": 1.4818, + "step": 20645 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013049612926686882, + "loss": 1.5136, + "step": 20646 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013048387454338156, + "loss": 1.5341, + "step": 20647 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013047161995239804, + "loss": 1.4798, + "step": 20648 + }, + { + "epoch": 1.62, + "learning_rate": 0.0001304593654940014, + "loss": 1.4926, + "step": 20649 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013044711116827495, + "loss": 1.4552, + "step": 20650 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013043485697530175, + "loss": 1.5213, + "step": 20651 + }, + { + "epoch": 1.62, + "learning_rate": 0.00013042260291516516, + "loss": 1.5796, + "step": 20652 + }, + { + "epoch": 1.63, + "learning_rate": 0.00013041034898794823, + "loss": 1.4985, + "step": 20653 + }, + { + "epoch": 1.63, + "learning_rate": 0.0001303980951937342, + "loss": 1.5328, + "step": 20654 + }, + { + "epoch": 1.63, + "learning_rate": 0.00013038584153260636, + "loss": 1.4873, + "step": 20655 + }, + { + "epoch": 1.63, + "learning_rate": 0.00013037358800464777, + "loss": 1.5183, + "step": 20656 + }, + { + "epoch": 1.63, + "learning_rate": 0.0001303613346099417, + "loss": 1.5344, + "step": 20657 + }, + { + "epoch": 1.63, + "learning_rate": 0.00013034908134857136, + "loss": 1.4664, + "step": 20658 + }, + { + "epoch": 1.63, + "learning_rate": 0.00013033682822061985, + "loss": 1.5215, + "step": 20659 + }, + { + "epoch": 1.63, + "learning_rate": 0.00013032457522617046, + "loss": 1.5463, + "step": 20660 + }, + { + "epoch": 1.63, + "learning_rate": 0.00013031232236530635, + "loss": 1.4918, + "step": 20661 + }, + { + "epoch": 1.63, + "learning_rate": 0.00013030006963811073, + "loss": 1.4952, + "step": 20662 + }, + { + "epoch": 1.63, + "learning_rate": 0.00013028781704466674, + "loss": 1.4974, + "step": 20663 + }, + { + "epoch": 1.63, + "learning_rate": 0.0001302755645850576, + "loss": 1.5414, + "step": 20664 + }, + { + "epoch": 1.63, + "learning_rate": 0.00013026331225936649, + "loss": 1.4887, + "step": 20665 + }, + { + "epoch": 1.63, + "learning_rate": 0.0001302510600676766, + "loss": 1.4606, + "step": 20666 + }, + { + "epoch": 1.63, + "learning_rate": 0.00013023880801007112, + "loss": 1.5014, + "step": 20667 + }, + { + "epoch": 1.63, + "learning_rate": 0.00013022655608663323, + "loss": 1.4327, + "step": 20668 + }, + { + "epoch": 1.63, + "learning_rate": 0.00013021430429744607, + "loss": 1.5018, + "step": 20669 + }, + { + "epoch": 1.63, + "learning_rate": 0.00013020205264259295, + "loss": 1.5055, + "step": 20670 + }, + { + "epoch": 1.63, + "learning_rate": 0.00013018980112215688, + "loss": 1.4976, + "step": 20671 + }, + { + "epoch": 1.63, + "learning_rate": 0.0001301775497362212, + "loss": 1.5085, + "step": 20672 + }, + { + "epoch": 1.63, + "learning_rate": 0.00013016529848486897, + "loss": 1.5415, + "step": 20673 + }, + { + "epoch": 1.63, + "learning_rate": 0.00013015304736818342, + "loss": 1.4861, + "step": 20674 + }, + { + "epoch": 1.63, + "learning_rate": 0.0001301407963862477, + "loss": 1.488, + "step": 20675 + }, + { + "epoch": 1.63, + "learning_rate": 0.00013012854553914505, + "loss": 1.4764, + "step": 20676 + }, + { + "epoch": 1.63, + "learning_rate": 0.0001301162948269586, + "loss": 1.4652, + "step": 20677 + }, + { + "epoch": 1.63, + "learning_rate": 0.00013010404424977154, + "loss": 1.5194, + "step": 20678 + }, + { + "epoch": 1.63, + "learning_rate": 0.00013009179380766707, + "loss": 1.5331, + "step": 20679 + }, + { + "epoch": 1.63, + "learning_rate": 0.0001300795435007283, + "loss": 1.4951, + "step": 20680 + }, + { + "epoch": 1.63, + "learning_rate": 0.00013006729332903848, + "loss": 1.4968, + "step": 20681 + }, + { + "epoch": 1.63, + "learning_rate": 0.0001300550432926807, + "loss": 1.5319, + "step": 20682 + }, + { + "epoch": 1.63, + "learning_rate": 0.00013004279339173813, + "loss": 1.5031, + "step": 20683 + }, + { + "epoch": 1.63, + "learning_rate": 0.00013003054362629407, + "loss": 1.4896, + "step": 20684 + }, + { + "epoch": 1.63, + "learning_rate": 0.00013001829399643156, + "loss": 1.4971, + "step": 20685 + }, + { + "epoch": 1.63, + "learning_rate": 0.00013000604450223377, + "loss": 1.4836, + "step": 20686 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012999379514378395, + "loss": 1.5281, + "step": 20687 + }, + { + "epoch": 1.63, + "learning_rate": 0.0001299815459211652, + "loss": 1.4955, + "step": 20688 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012996929683446073, + "loss": 1.4967, + "step": 20689 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012995704788375365, + "loss": 1.4715, + "step": 20690 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012994479906912714, + "loss": 1.5087, + "step": 20691 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012993255039066436, + "loss": 1.5116, + "step": 20692 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012992030184844856, + "loss": 1.4714, + "step": 20693 + }, + { + "epoch": 1.63, + "learning_rate": 0.0001299080534425628, + "loss": 1.5424, + "step": 20694 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012989580517309025, + "loss": 1.4629, + "step": 20695 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012988355704011414, + "loss": 1.5302, + "step": 20696 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012987130904371753, + "loss": 1.5332, + "step": 20697 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012985906118398362, + "loss": 1.4795, + "step": 20698 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012984681346099562, + "loss": 1.5352, + "step": 20699 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012983456587483658, + "loss": 1.5348, + "step": 20700 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012982231842558975, + "loss": 1.5275, + "step": 20701 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012981007111333823, + "loss": 1.5284, + "step": 20702 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012979782393816516, + "loss": 1.5408, + "step": 20703 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012978557690015375, + "loss": 1.5251, + "step": 20704 + }, + { + "epoch": 1.63, + "learning_rate": 0.0001297733299993871, + "loss": 1.5436, + "step": 20705 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012976108323594835, + "loss": 1.504, + "step": 20706 + }, + { + "epoch": 1.63, + "learning_rate": 0.0001297488366099207, + "loss": 1.4694, + "step": 20707 + }, + { + "epoch": 1.63, + "learning_rate": 0.0001297365901213873, + "loss": 1.5268, + "step": 20708 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012972434377043124, + "loss": 1.5428, + "step": 20709 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012971209755713574, + "loss": 1.5422, + "step": 20710 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012969985148158386, + "loss": 1.4865, + "step": 20711 + }, + { + "epoch": 1.63, + "learning_rate": 0.0001296876055438588, + "loss": 1.5141, + "step": 20712 + }, + { + "epoch": 1.63, + "learning_rate": 0.0001296753597440437, + "loss": 1.5578, + "step": 20713 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012966311408222166, + "loss": 1.5105, + "step": 20714 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012965086855847588, + "loss": 1.5532, + "step": 20715 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012963862317288947, + "loss": 1.4532, + "step": 20716 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012962637792554558, + "loss": 1.5041, + "step": 20717 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012961413281652732, + "loss": 1.5092, + "step": 20718 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012960188784591785, + "loss": 1.4601, + "step": 20719 + }, + { + "epoch": 1.63, + "learning_rate": 0.0001295896430138003, + "loss": 1.4462, + "step": 20720 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012957739832025785, + "loss": 1.493, + "step": 20721 + }, + { + "epoch": 1.63, + "learning_rate": 0.0001295651537653735, + "loss": 1.4912, + "step": 20722 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012955290934923055, + "loss": 1.5047, + "step": 20723 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012954066507191205, + "loss": 1.5145, + "step": 20724 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012952842093350117, + "loss": 1.5067, + "step": 20725 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012951617693408098, + "loss": 1.4938, + "step": 20726 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012950393307373467, + "loss": 1.4898, + "step": 20727 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012949168935254534, + "loss": 1.4933, + "step": 20728 + }, + { + "epoch": 1.63, + "learning_rate": 0.0001294794457705961, + "loss": 1.5177, + "step": 20729 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012946720232797013, + "loss": 1.483, + "step": 20730 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012945495902475052, + "loss": 1.5652, + "step": 20731 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012944271586102038, + "loss": 1.5093, + "step": 20732 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012943047283686288, + "loss": 1.5065, + "step": 20733 + }, + { + "epoch": 1.63, + "learning_rate": 0.0001294182299523611, + "loss": 1.5169, + "step": 20734 + }, + { + "epoch": 1.63, + "learning_rate": 0.0001294059872075982, + "loss": 1.5285, + "step": 20735 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012939374460265726, + "loss": 1.5059, + "step": 20736 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012938150213762141, + "loss": 1.5115, + "step": 20737 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012936925981257377, + "loss": 1.5097, + "step": 20738 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012935701762759752, + "loss": 1.5158, + "step": 20739 + }, + { + "epoch": 1.63, + "learning_rate": 0.0001293447755827757, + "loss": 1.4871, + "step": 20740 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012933253367819144, + "loss": 1.4676, + "step": 20741 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012932029191392794, + "loss": 1.4744, + "step": 20742 + }, + { + "epoch": 1.63, + "learning_rate": 0.0001293080502900682, + "loss": 1.5181, + "step": 20743 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012929580880669537, + "loss": 1.507, + "step": 20744 + }, + { + "epoch": 1.63, + "learning_rate": 0.0001292835674638926, + "loss": 1.5308, + "step": 20745 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012927132626174294, + "loss": 1.4774, + "step": 20746 + }, + { + "epoch": 1.63, + "learning_rate": 0.0001292590852003296, + "loss": 1.4707, + "step": 20747 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012924684427973555, + "loss": 1.4994, + "step": 20748 + }, + { + "epoch": 1.63, + "learning_rate": 0.000129234603500044, + "loss": 1.5145, + "step": 20749 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012922236286133808, + "loss": 1.4997, + "step": 20750 + }, + { + "epoch": 1.63, + "learning_rate": 0.0001292101223637008, + "loss": 1.5394, + "step": 20751 + }, + { + "epoch": 1.63, + "learning_rate": 0.0001291978820072153, + "loss": 1.5031, + "step": 20752 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012918564179196468, + "loss": 1.5175, + "step": 20753 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012917340171803214, + "loss": 1.4827, + "step": 20754 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012916116178550066, + "loss": 1.4939, + "step": 20755 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012914892199445343, + "loss": 1.489, + "step": 20756 + }, + { + "epoch": 1.63, + "learning_rate": 0.0001291366823449735, + "loss": 1.5129, + "step": 20757 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012912444283714398, + "loss": 1.5101, + "step": 20758 + }, + { + "epoch": 1.63, + "learning_rate": 0.000129112203471048, + "loss": 1.5267, + "step": 20759 + }, + { + "epoch": 1.63, + "learning_rate": 0.0001290999642467686, + "loss": 1.5389, + "step": 20760 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012908772516438888, + "loss": 1.5306, + "step": 20761 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012907548622399204, + "loss": 1.5313, + "step": 20762 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012906324742566105, + "loss": 1.5174, + "step": 20763 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012905100876947907, + "loss": 1.5281, + "step": 20764 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012903877025552917, + "loss": 1.5001, + "step": 20765 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012902653188389448, + "loss": 1.5257, + "step": 20766 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012901429365465804, + "loss": 1.4957, + "step": 20767 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012900205556790298, + "loss": 1.52, + "step": 20768 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012898981762371231, + "loss": 1.4731, + "step": 20769 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012897757982216924, + "loss": 1.4455, + "step": 20770 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012896534216335682, + "loss": 1.483, + "step": 20771 + }, + { + "epoch": 1.63, + "learning_rate": 0.0001289531046473581, + "loss": 1.5231, + "step": 20772 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012894086727425615, + "loss": 1.5105, + "step": 20773 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012892863004413416, + "loss": 1.5266, + "step": 20774 + }, + { + "epoch": 1.63, + "learning_rate": 0.0001289163929570751, + "loss": 1.4643, + "step": 20775 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012890415601316213, + "loss": 1.5045, + "step": 20776 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012889191921247825, + "loss": 1.5021, + "step": 20777 + }, + { + "epoch": 1.63, + "learning_rate": 0.0001288796825551066, + "loss": 1.4866, + "step": 20778 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012886744604113028, + "loss": 1.5127, + "step": 20779 + }, + { + "epoch": 1.63, + "learning_rate": 0.00012885520967063235, + "loss": 1.5083, + "step": 20780 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012884297344369582, + "loss": 1.4825, + "step": 20781 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012883073736040388, + "loss": 1.5029, + "step": 20782 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012881850142083953, + "loss": 1.5648, + "step": 20783 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012880626562508586, + "loss": 1.5256, + "step": 20784 + }, + { + "epoch": 1.64, + "learning_rate": 0.0001287940299732259, + "loss": 1.4451, + "step": 20785 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012878179446534284, + "loss": 1.5135, + "step": 20786 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012876955910151968, + "loss": 1.5234, + "step": 20787 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012875732388183952, + "loss": 1.5666, + "step": 20788 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012874508880638536, + "loss": 1.5245, + "step": 20789 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012873285387524032, + "loss": 1.4807, + "step": 20790 + }, + { + "epoch": 1.64, + "learning_rate": 0.0001287206190884875, + "loss": 1.4325, + "step": 20791 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012870838444620992, + "loss": 1.5032, + "step": 20792 + }, + { + "epoch": 1.64, + "learning_rate": 0.0001286961499484907, + "loss": 1.4852, + "step": 20793 + }, + { + "epoch": 1.64, + "learning_rate": 0.0001286839155954128, + "loss": 1.4977, + "step": 20794 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012867168138705937, + "loss": 1.5244, + "step": 20795 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012865944732351345, + "loss": 1.4699, + "step": 20796 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012864721340485812, + "loss": 1.5104, + "step": 20797 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012863497963117642, + "loss": 1.4419, + "step": 20798 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012862274600255143, + "loss": 1.4757, + "step": 20799 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012861051251906617, + "loss": 1.4696, + "step": 20800 + }, + { + "epoch": 1.64, + "learning_rate": 0.0001285982791808037, + "loss": 1.554, + "step": 20801 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012858604598784716, + "loss": 1.4995, + "step": 20802 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012857381294027954, + "loss": 1.5174, + "step": 20803 + }, + { + "epoch": 1.64, + "learning_rate": 0.0001285615800381839, + "loss": 1.5112, + "step": 20804 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012854934728164332, + "loss": 1.509, + "step": 20805 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012853711467074083, + "loss": 1.4624, + "step": 20806 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012852488220555945, + "loss": 1.4669, + "step": 20807 + }, + { + "epoch": 1.64, + "learning_rate": 0.0001285126498861823, + "loss": 1.4979, + "step": 20808 + }, + { + "epoch": 1.64, + "learning_rate": 0.0001285004177126924, + "loss": 1.498, + "step": 20809 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012848818568517278, + "loss": 1.5029, + "step": 20810 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012847595380370655, + "loss": 1.4775, + "step": 20811 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012846372206837668, + "loss": 1.5562, + "step": 20812 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012845149047926627, + "loss": 1.5562, + "step": 20813 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012843925903645835, + "loss": 1.5158, + "step": 20814 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012842702774003593, + "loss": 1.5408, + "step": 20815 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012841479659008207, + "loss": 1.5016, + "step": 20816 + }, + { + "epoch": 1.64, + "learning_rate": 0.0001284025655866799, + "loss": 1.5309, + "step": 20817 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012839033472991234, + "loss": 1.4763, + "step": 20818 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012837810401986248, + "loss": 1.5805, + "step": 20819 + }, + { + "epoch": 1.64, + "learning_rate": 0.0001283658734566134, + "loss": 1.4691, + "step": 20820 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012835364304024808, + "loss": 1.5365, + "step": 20821 + }, + { + "epoch": 1.64, + "learning_rate": 0.0001283414127708496, + "loss": 1.4738, + "step": 20822 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012832918264850095, + "loss": 1.4607, + "step": 20823 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012831695267328519, + "loss": 1.5221, + "step": 20824 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012830472284528537, + "loss": 1.5522, + "step": 20825 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012829249316458448, + "loss": 1.4964, + "step": 20826 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012828026363126562, + "loss": 1.5472, + "step": 20827 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012826803424541178, + "loss": 1.5125, + "step": 20828 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012825580500710598, + "loss": 1.4823, + "step": 20829 + }, + { + "epoch": 1.64, + "learning_rate": 0.0001282435759164313, + "loss": 1.5149, + "step": 20830 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012823134697347068, + "loss": 1.5352, + "step": 20831 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012821911817830717, + "loss": 1.5088, + "step": 20832 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012820688953102386, + "loss": 1.5393, + "step": 20833 + }, + { + "epoch": 1.64, + "learning_rate": 0.0001281946610317038, + "loss": 1.4605, + "step": 20834 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012818243268042994, + "loss": 1.4584, + "step": 20835 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012817020447728527, + "loss": 1.4698, + "step": 20836 + }, + { + "epoch": 1.64, + "learning_rate": 0.0001281579764223529, + "loss": 1.4848, + "step": 20837 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012814574851571583, + "loss": 1.548, + "step": 20838 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012813352075745704, + "loss": 1.4754, + "step": 20839 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012812129314765963, + "loss": 1.4678, + "step": 20840 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012810906568640649, + "loss": 1.523, + "step": 20841 + }, + { + "epoch": 1.64, + "learning_rate": 0.0001280968383737808, + "loss": 1.5651, + "step": 20842 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012808461120986542, + "loss": 1.4595, + "step": 20843 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012807238419474345, + "loss": 1.498, + "step": 20844 + }, + { + "epoch": 1.64, + "learning_rate": 0.0001280601573284979, + "loss": 1.4956, + "step": 20845 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012804793061121176, + "loss": 1.4728, + "step": 20846 + }, + { + "epoch": 1.64, + "learning_rate": 0.0001280357040429681, + "loss": 1.5572, + "step": 20847 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012802347762384976, + "loss": 1.513, + "step": 20848 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012801125135394003, + "loss": 1.4717, + "step": 20849 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012799902523332168, + "loss": 1.485, + "step": 20850 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012798679926207787, + "loss": 1.5355, + "step": 20851 + }, + { + "epoch": 1.64, + "learning_rate": 0.0001279745734402915, + "loss": 1.5065, + "step": 20852 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012796234776804564, + "loss": 1.52, + "step": 20853 + }, + { + "epoch": 1.64, + "learning_rate": 0.0001279501222454233, + "loss": 1.4959, + "step": 20854 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012793789687250742, + "loss": 1.5114, + "step": 20855 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012792567164938106, + "loss": 1.4999, + "step": 20856 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012791344657612724, + "loss": 1.5285, + "step": 20857 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012790122165282888, + "loss": 1.4956, + "step": 20858 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012788899687956907, + "loss": 1.4686, + "step": 20859 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012787677225643075, + "loss": 1.4936, + "step": 20860 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012786454778349691, + "loss": 1.533, + "step": 20861 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012785232346085066, + "loss": 1.5327, + "step": 20862 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012784009928857478, + "loss": 1.4789, + "step": 20863 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012782787526675248, + "loss": 1.4483, + "step": 20864 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012781565139546666, + "loss": 1.5166, + "step": 20865 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012780342767480034, + "loss": 1.5077, + "step": 20866 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012779120410483648, + "loss": 1.5002, + "step": 20867 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012777898068565808, + "loss": 1.4923, + "step": 20868 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012776675741734818, + "loss": 1.4844, + "step": 20869 + }, + { + "epoch": 1.64, + "learning_rate": 0.0001277545342999897, + "loss": 1.471, + "step": 20870 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012774231133366566, + "loss": 1.4512, + "step": 20871 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012773008851845903, + "loss": 1.5544, + "step": 20872 + }, + { + "epoch": 1.64, + "learning_rate": 0.0001277178658544528, + "loss": 1.4919, + "step": 20873 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012770564334173, + "loss": 1.4717, + "step": 20874 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012769342098037357, + "loss": 1.4861, + "step": 20875 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012768119877046652, + "loss": 1.5204, + "step": 20876 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012766897671209176, + "loss": 1.4706, + "step": 20877 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012765675480533236, + "loss": 1.4976, + "step": 20878 + }, + { + "epoch": 1.64, + "learning_rate": 0.0001276445330502712, + "loss": 1.4685, + "step": 20879 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012763231144699135, + "loss": 1.5148, + "step": 20880 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012762008999557583, + "loss": 1.4752, + "step": 20881 + }, + { + "epoch": 1.64, + "learning_rate": 0.0001276078686961075, + "loss": 1.5431, + "step": 20882 + }, + { + "epoch": 1.64, + "learning_rate": 0.0001275956475486694, + "loss": 1.4746, + "step": 20883 + }, + { + "epoch": 1.64, + "learning_rate": 0.0001275834265533445, + "loss": 1.4926, + "step": 20884 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012757120571021572, + "loss": 1.5127, + "step": 20885 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012755898501936615, + "loss": 1.5083, + "step": 20886 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012754676448087861, + "loss": 1.526, + "step": 20887 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012753454409483622, + "loss": 1.5098, + "step": 20888 + }, + { + "epoch": 1.64, + "learning_rate": 0.0001275223238613218, + "loss": 1.5012, + "step": 20889 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012751010378041845, + "loss": 1.5306, + "step": 20890 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012749788385220908, + "loss": 1.4723, + "step": 20891 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012748566407677663, + "loss": 1.4697, + "step": 20892 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012747344445420412, + "loss": 1.5116, + "step": 20893 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012746122498457453, + "loss": 1.5331, + "step": 20894 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012744900566797067, + "loss": 1.4669, + "step": 20895 + }, + { + "epoch": 1.64, + "learning_rate": 0.0001274367865044757, + "loss": 1.5169, + "step": 20896 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012742456749417245, + "loss": 1.4559, + "step": 20897 + }, + { + "epoch": 1.64, + "learning_rate": 0.000127412348637144, + "loss": 1.5006, + "step": 20898 + }, + { + "epoch": 1.64, + "learning_rate": 0.0001274001299334732, + "loss": 1.5156, + "step": 20899 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012738791138324306, + "loss": 1.5239, + "step": 20900 + }, + { + "epoch": 1.64, + "learning_rate": 0.0001273756929865365, + "loss": 1.4817, + "step": 20901 + }, + { + "epoch": 1.64, + "learning_rate": 0.0001273634747434365, + "loss": 1.504, + "step": 20902 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012735125665402607, + "loss": 1.4993, + "step": 20903 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012733903871838806, + "loss": 1.4607, + "step": 20904 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012732682093660549, + "loss": 1.4735, + "step": 20905 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012731460330876127, + "loss": 1.5404, + "step": 20906 + }, + { + "epoch": 1.64, + "learning_rate": 0.00012730238583493836, + "loss": 1.4958, + "step": 20907 + }, + { + "epoch": 1.65, + "learning_rate": 0.0001272901685152198, + "loss": 1.4793, + "step": 20908 + }, + { + "epoch": 1.65, + "learning_rate": 0.0001272779513496884, + "loss": 1.4855, + "step": 20909 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012726573433842717, + "loss": 1.507, + "step": 20910 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012725351748151903, + "loss": 1.5089, + "step": 20911 + }, + { + "epoch": 1.65, + "learning_rate": 0.000127241300779047, + "loss": 1.4599, + "step": 20912 + }, + { + "epoch": 1.65, + "learning_rate": 0.000127229084231094, + "loss": 1.5008, + "step": 20913 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012721686783774292, + "loss": 1.5215, + "step": 20914 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012720465159907676, + "loss": 1.5376, + "step": 20915 + }, + { + "epoch": 1.65, + "learning_rate": 0.0001271924355151784, + "loss": 1.4698, + "step": 20916 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012718021958613084, + "loss": 1.4571, + "step": 20917 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012716800381201699, + "loss": 1.4598, + "step": 20918 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012715578819291978, + "loss": 1.4809, + "step": 20919 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012714357272892223, + "loss": 1.4651, + "step": 20920 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012713135742010713, + "loss": 1.4974, + "step": 20921 + }, + { + "epoch": 1.65, + "learning_rate": 0.0001271191422665575, + "loss": 1.5993, + "step": 20922 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012710692726835632, + "loss": 1.4723, + "step": 20923 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012709471242558642, + "loss": 1.4857, + "step": 20924 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012708249773833082, + "loss": 1.485, + "step": 20925 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012707028320667232, + "loss": 1.4863, + "step": 20926 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012705806883069404, + "loss": 1.5109, + "step": 20927 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012704585461047877, + "loss": 1.5089, + "step": 20928 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012703364054610954, + "loss": 1.4593, + "step": 20929 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012702142663766912, + "loss": 1.5038, + "step": 20930 + }, + { + "epoch": 1.65, + "learning_rate": 0.0001270092128852406, + "loss": 1.5246, + "step": 20931 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012699699928890685, + "loss": 1.4648, + "step": 20932 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012698478584875075, + "loss": 1.5092, + "step": 20933 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012697257256485527, + "loss": 1.5581, + "step": 20934 + }, + { + "epoch": 1.65, + "learning_rate": 0.0001269603594373033, + "loss": 1.5009, + "step": 20935 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012694814646617777, + "loss": 1.5396, + "step": 20936 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012693593365156164, + "loss": 1.4617, + "step": 20937 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012692372099353774, + "loss": 1.4657, + "step": 20938 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012691150849218906, + "loss": 1.5398, + "step": 20939 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012689929614759853, + "loss": 1.5286, + "step": 20940 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012688708395984898, + "loss": 1.4717, + "step": 20941 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012687487192902336, + "loss": 1.569, + "step": 20942 + }, + { + "epoch": 1.65, + "learning_rate": 0.0001268626600552046, + "loss": 1.4607, + "step": 20943 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012685044833847569, + "loss": 1.4758, + "step": 20944 + }, + { + "epoch": 1.65, + "learning_rate": 0.0001268382367789194, + "loss": 1.4871, + "step": 20945 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012682602537661874, + "loss": 1.5197, + "step": 20946 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012681381413165655, + "loss": 1.525, + "step": 20947 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012680160304411576, + "loss": 1.5285, + "step": 20948 + }, + { + "epoch": 1.65, + "learning_rate": 0.0001267893921140793, + "loss": 1.4999, + "step": 20949 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012677718134163006, + "loss": 1.5175, + "step": 20950 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012676497072685092, + "loss": 1.5282, + "step": 20951 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012675276026982485, + "loss": 1.5823, + "step": 20952 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012674054997063468, + "loss": 1.4857, + "step": 20953 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012672833982936338, + "loss": 1.5312, + "step": 20954 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012671612984609375, + "loss": 1.5071, + "step": 20955 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012670392002090878, + "loss": 1.5092, + "step": 20956 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012669171035389133, + "loss": 1.5242, + "step": 20957 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012667950084512426, + "loss": 1.5192, + "step": 20958 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012666729149469057, + "loss": 1.4879, + "step": 20959 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012665508230267304, + "loss": 1.4664, + "step": 20960 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012664287326915469, + "loss": 1.5279, + "step": 20961 + }, + { + "epoch": 1.65, + "learning_rate": 0.0001266306643942183, + "loss": 1.4933, + "step": 20962 + }, + { + "epoch": 1.65, + "learning_rate": 0.0001266184556779468, + "loss": 1.4764, + "step": 20963 + }, + { + "epoch": 1.65, + "learning_rate": 0.0001266062471204231, + "loss": 1.4892, + "step": 20964 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012659403872173006, + "loss": 1.5174, + "step": 20965 + }, + { + "epoch": 1.65, + "learning_rate": 0.0001265818304819506, + "loss": 1.4916, + "step": 20966 + }, + { + "epoch": 1.65, + "learning_rate": 0.0001265696224011676, + "loss": 1.4705, + "step": 20967 + }, + { + "epoch": 1.65, + "learning_rate": 0.0001265574144794639, + "loss": 1.5029, + "step": 20968 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012654520671692243, + "loss": 1.5284, + "step": 20969 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012653299911362606, + "loss": 1.4567, + "step": 20970 + }, + { + "epoch": 1.65, + "learning_rate": 0.0001265207916696577, + "loss": 1.4113, + "step": 20971 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012650858438510018, + "loss": 1.4897, + "step": 20972 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012649637726003636, + "loss": 1.4945, + "step": 20973 + }, + { + "epoch": 1.65, + "learning_rate": 0.0001264841702945492, + "loss": 1.4871, + "step": 20974 + }, + { + "epoch": 1.65, + "learning_rate": 0.0001264719634887216, + "loss": 1.4831, + "step": 20975 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012645975684263635, + "loss": 1.5264, + "step": 20976 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012644755035637635, + "loss": 1.4634, + "step": 20977 + }, + { + "epoch": 1.65, + "learning_rate": 0.0001264353440300245, + "loss": 1.5412, + "step": 20978 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012642313786366365, + "loss": 1.5076, + "step": 20979 + }, + { + "epoch": 1.65, + "learning_rate": 0.0001264109318573767, + "loss": 1.5195, + "step": 20980 + }, + { + "epoch": 1.65, + "learning_rate": 0.0001263987260112465, + "loss": 1.4804, + "step": 20981 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012638652032535591, + "loss": 1.4616, + "step": 20982 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012637431479978786, + "loss": 1.4947, + "step": 20983 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012636210943462513, + "loss": 1.5162, + "step": 20984 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012634990422995065, + "loss": 1.5263, + "step": 20985 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012633769918584726, + "loss": 1.5463, + "step": 20986 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012632549430239784, + "loss": 1.5203, + "step": 20987 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012631328957968526, + "loss": 1.5239, + "step": 20988 + }, + { + "epoch": 1.65, + "learning_rate": 0.0001263010850177923, + "loss": 1.4696, + "step": 20989 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012628888061680198, + "loss": 1.4645, + "step": 20990 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012627667637679703, + "loss": 1.5438, + "step": 20991 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012626447229786036, + "loss": 1.4907, + "step": 20992 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012625226838007487, + "loss": 1.4812, + "step": 20993 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012624006462352334, + "loss": 1.429, + "step": 20994 + }, + { + "epoch": 1.65, + "learning_rate": 0.0001262278610282887, + "loss": 1.5502, + "step": 20995 + }, + { + "epoch": 1.65, + "learning_rate": 0.0001262156575944537, + "loss": 1.5093, + "step": 20996 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012620345432210126, + "loss": 1.4856, + "step": 20997 + }, + { + "epoch": 1.65, + "learning_rate": 0.0001261912512113143, + "loss": 1.5389, + "step": 20998 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012617904826217556, + "loss": 1.5046, + "step": 20999 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012616684547476795, + "loss": 1.5003, + "step": 21000 + }, + { + "epoch": 1.65, + "learning_rate": 0.0001261546428491743, + "loss": 1.4645, + "step": 21001 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012614244038547745, + "loss": 1.508, + "step": 21002 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012613023808376032, + "loss": 1.5294, + "step": 21003 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012611803594410564, + "loss": 1.4645, + "step": 21004 + }, + { + "epoch": 1.65, + "learning_rate": 0.0001261058339665963, + "loss": 1.5298, + "step": 21005 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012609363215131518, + "loss": 1.546, + "step": 21006 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012608143049834514, + "loss": 1.4668, + "step": 21007 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012606922900776897, + "loss": 1.487, + "step": 21008 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012605702767966954, + "loss": 1.4842, + "step": 21009 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012604482651412967, + "loss": 1.5204, + "step": 21010 + }, + { + "epoch": 1.65, + "learning_rate": 0.0001260326255112322, + "loss": 1.5238, + "step": 21011 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012602042467106003, + "loss": 1.4815, + "step": 21012 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012600822399369587, + "loss": 1.5448, + "step": 21013 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012599602347922265, + "loss": 1.5228, + "step": 21014 + }, + { + "epoch": 1.65, + "learning_rate": 0.0001259838231277232, + "loss": 1.516, + "step": 21015 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012597162293928035, + "loss": 1.4558, + "step": 21016 + }, + { + "epoch": 1.65, + "learning_rate": 0.0001259594229139769, + "loss": 1.4939, + "step": 21017 + }, + { + "epoch": 1.65, + "learning_rate": 0.0001259472230518957, + "loss": 1.4971, + "step": 21018 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012593502335311957, + "loss": 1.512, + "step": 21019 + }, + { + "epoch": 1.65, + "learning_rate": 0.0001259228238177314, + "loss": 1.503, + "step": 21020 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012591062444581384, + "loss": 1.4863, + "step": 21021 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012589842523744998, + "loss": 1.4528, + "step": 21022 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012588622619272245, + "loss": 1.4875, + "step": 21023 + }, + { + "epoch": 1.65, + "learning_rate": 0.0001258740273117142, + "loss": 1.4603, + "step": 21024 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012586182859450793, + "loss": 1.4804, + "step": 21025 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012584963004118652, + "loss": 1.5493, + "step": 21026 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012583743165183286, + "loss": 1.4975, + "step": 21027 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012582523342652966, + "loss": 1.5556, + "step": 21028 + }, + { + "epoch": 1.65, + "learning_rate": 0.0001258130353653598, + "loss": 1.5211, + "step": 21029 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012580083746840606, + "loss": 1.5239, + "step": 21030 + }, + { + "epoch": 1.65, + "learning_rate": 0.0001257886397357513, + "loss": 1.4871, + "step": 21031 + }, + { + "epoch": 1.65, + "learning_rate": 0.0001257764421674783, + "loss": 1.4641, + "step": 21032 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012576424476366991, + "loss": 1.5491, + "step": 21033 + }, + { + "epoch": 1.65, + "learning_rate": 0.00012575204752440889, + "loss": 1.4725, + "step": 21034 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012573985044977813, + "loss": 1.5207, + "step": 21035 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012572765353986032, + "loss": 1.5062, + "step": 21036 + }, + { + "epoch": 1.66, + "learning_rate": 0.0001257154567947384, + "loss": 1.5421, + "step": 21037 + }, + { + "epoch": 1.66, + "learning_rate": 0.0001257032602144951, + "loss": 1.4578, + "step": 21038 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012569106379921332, + "loss": 1.5071, + "step": 21039 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012567886754897574, + "loss": 1.4432, + "step": 21040 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012566667146386528, + "loss": 1.5124, + "step": 21041 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012565447554396467, + "loss": 1.5155, + "step": 21042 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012564227978935672, + "loss": 1.5076, + "step": 21043 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012563008420012428, + "loss": 1.5524, + "step": 21044 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012561788877635008, + "loss": 1.4636, + "step": 21045 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012560569351811697, + "loss": 1.4983, + "step": 21046 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012559349842550778, + "loss": 1.5195, + "step": 21047 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012558130349860522, + "loss": 1.461, + "step": 21048 + }, + { + "epoch": 1.66, + "learning_rate": 0.0001255691087374922, + "loss": 1.5016, + "step": 21049 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012555691414225137, + "loss": 1.5344, + "step": 21050 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012554471971296563, + "loss": 1.459, + "step": 21051 + }, + { + "epoch": 1.66, + "learning_rate": 0.0001255325254497177, + "loss": 1.4809, + "step": 21052 + }, + { + "epoch": 1.66, + "learning_rate": 0.0001255203313525905, + "loss": 1.4765, + "step": 21053 + }, + { + "epoch": 1.66, + "learning_rate": 0.0001255081374216667, + "loss": 1.5284, + "step": 21054 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012549594365702914, + "loss": 1.4683, + "step": 21055 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012548375005876062, + "loss": 1.5303, + "step": 21056 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012547155662694388, + "loss": 1.5085, + "step": 21057 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012545936336166177, + "loss": 1.4855, + "step": 21058 + }, + { + "epoch": 1.66, + "learning_rate": 0.000125447170262997, + "loss": 1.5345, + "step": 21059 + }, + { + "epoch": 1.66, + "learning_rate": 0.0001254349773310324, + "loss": 1.5119, + "step": 21060 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012542278456585077, + "loss": 1.5322, + "step": 21061 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012541059196753487, + "loss": 1.52, + "step": 21062 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012539839953616745, + "loss": 1.4737, + "step": 21063 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012538620727183135, + "loss": 1.5536, + "step": 21064 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012537401517460933, + "loss": 1.497, + "step": 21065 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012536182324458415, + "loss": 1.4993, + "step": 21066 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012534963148183858, + "loss": 1.5199, + "step": 21067 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012533743988645536, + "loss": 1.5112, + "step": 21068 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012532524845851735, + "loss": 1.4488, + "step": 21069 + }, + { + "epoch": 1.66, + "learning_rate": 0.0001253130571981073, + "loss": 1.4815, + "step": 21070 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012530086610530798, + "loss": 1.4565, + "step": 21071 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012528867518020212, + "loss": 1.5093, + "step": 21072 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012527648442287254, + "loss": 1.4984, + "step": 21073 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012526429383340199, + "loss": 1.4905, + "step": 21074 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012525210341187323, + "loss": 1.5741, + "step": 21075 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012523991315836904, + "loss": 1.4425, + "step": 21076 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012522772307297216, + "loss": 1.5116, + "step": 21077 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012521553315576539, + "loss": 1.5003, + "step": 21078 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012520334340683145, + "loss": 1.5115, + "step": 21079 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012519115382625311, + "loss": 1.4693, + "step": 21080 + }, + { + "epoch": 1.66, + "learning_rate": 0.0001251789644141132, + "loss": 1.4645, + "step": 21081 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012516677517049438, + "loss": 1.4905, + "step": 21082 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012515458609547948, + "loss": 1.4778, + "step": 21083 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012514239718915113, + "loss": 1.5438, + "step": 21084 + }, + { + "epoch": 1.66, + "learning_rate": 0.0001251302084515923, + "loss": 1.5387, + "step": 21085 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012511801988288558, + "loss": 1.5163, + "step": 21086 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012510583148311384, + "loss": 1.5232, + "step": 21087 + }, + { + "epoch": 1.66, + "learning_rate": 0.0001250936432523597, + "loss": 1.5432, + "step": 21088 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012508145519070596, + "loss": 1.4641, + "step": 21089 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012506926729823547, + "loss": 1.4768, + "step": 21090 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012505707957503084, + "loss": 1.4961, + "step": 21091 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012504489202117485, + "loss": 1.511, + "step": 21092 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012503270463675036, + "loss": 1.5203, + "step": 21093 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012502051742183996, + "loss": 1.5386, + "step": 21094 + }, + { + "epoch": 1.66, + "learning_rate": 0.0001250083303765265, + "loss": 1.4964, + "step": 21095 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012499614350089264, + "loss": 1.429, + "step": 21096 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012498395679502117, + "loss": 1.4949, + "step": 21097 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012497177025899489, + "loss": 1.5083, + "step": 21098 + }, + { + "epoch": 1.66, + "learning_rate": 0.0001249595838928964, + "loss": 1.5346, + "step": 21099 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012494739769680854, + "loss": 1.4961, + "step": 21100 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012493521167081402, + "loss": 1.496, + "step": 21101 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012492302581499563, + "loss": 1.4744, + "step": 21102 + }, + { + "epoch": 1.66, + "learning_rate": 0.000124910840129436, + "loss": 1.489, + "step": 21103 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012489865461421794, + "loss": 1.4956, + "step": 21104 + }, + { + "epoch": 1.66, + "learning_rate": 0.0001248864692694242, + "loss": 1.5077, + "step": 21105 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012487428409513744, + "loss": 1.5525, + "step": 21106 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012486209909144045, + "loss": 1.5155, + "step": 21107 + }, + { + "epoch": 1.66, + "learning_rate": 0.0001248499142584159, + "loss": 1.4572, + "step": 21108 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012483772959614656, + "loss": 1.5525, + "step": 21109 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012482554510471518, + "loss": 1.5293, + "step": 21110 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012481336078420442, + "loss": 1.4867, + "step": 21111 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012480117663469706, + "loss": 1.4974, + "step": 21112 + }, + { + "epoch": 1.66, + "learning_rate": 0.0001247889926562758, + "loss": 1.5133, + "step": 21113 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012477680884902338, + "loss": 1.4684, + "step": 21114 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012476462521302244, + "loss": 1.483, + "step": 21115 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012475244174835586, + "loss": 1.4557, + "step": 21116 + }, + { + "epoch": 1.66, + "learning_rate": 0.0001247402584551062, + "loss": 1.4987, + "step": 21117 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012472807533335625, + "loss": 1.5232, + "step": 21118 + }, + { + "epoch": 1.66, + "learning_rate": 0.0001247158923831888, + "loss": 1.5314, + "step": 21119 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012470370960468641, + "loss": 1.5236, + "step": 21120 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012469152699793188, + "loss": 1.4819, + "step": 21121 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012467934456300797, + "loss": 1.5152, + "step": 21122 + }, + { + "epoch": 1.66, + "learning_rate": 0.0001246671622999973, + "loss": 1.5385, + "step": 21123 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012465498020898264, + "loss": 1.491, + "step": 21124 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012464279829004665, + "loss": 1.4984, + "step": 21125 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012463061654327206, + "loss": 1.4662, + "step": 21126 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012461843496874164, + "loss": 1.4901, + "step": 21127 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012460625356653797, + "loss": 1.4673, + "step": 21128 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012459407233674383, + "loss": 1.5409, + "step": 21129 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012458189127944198, + "loss": 1.5017, + "step": 21130 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012456971039471497, + "loss": 1.4836, + "step": 21131 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012455752968264564, + "loss": 1.4845, + "step": 21132 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012454534914331666, + "loss": 1.4616, + "step": 21133 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012453316877681072, + "loss": 1.5253, + "step": 21134 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012452098858321047, + "loss": 1.4878, + "step": 21135 + }, + { + "epoch": 1.66, + "learning_rate": 0.0001245088085625987, + "loss": 1.4801, + "step": 21136 + }, + { + "epoch": 1.66, + "learning_rate": 0.000124496628715058, + "loss": 1.5179, + "step": 21137 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012448444904067114, + "loss": 1.5277, + "step": 21138 + }, + { + "epoch": 1.66, + "learning_rate": 0.0001244722695395208, + "loss": 1.5076, + "step": 21139 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012446009021168964, + "loss": 1.4864, + "step": 21140 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012444791105726042, + "loss": 1.491, + "step": 21141 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012443573207631572, + "loss": 1.4988, + "step": 21142 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012442355326893834, + "loss": 1.486, + "step": 21143 + }, + { + "epoch": 1.66, + "learning_rate": 0.0001244113746352109, + "loss": 1.5021, + "step": 21144 + }, + { + "epoch": 1.66, + "learning_rate": 0.0001243991961752161, + "loss": 1.477, + "step": 21145 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012438701788903658, + "loss": 1.4851, + "step": 21146 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012437483977675512, + "loss": 1.5169, + "step": 21147 + }, + { + "epoch": 1.66, + "learning_rate": 0.0001243626618384544, + "loss": 1.5148, + "step": 21148 + }, + { + "epoch": 1.66, + "learning_rate": 0.000124350484074217, + "loss": 1.4509, + "step": 21149 + }, + { + "epoch": 1.66, + "learning_rate": 0.0001243383064841257, + "loss": 1.524, + "step": 21150 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012432612906826312, + "loss": 1.4861, + "step": 21151 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012431395182671193, + "loss": 1.5201, + "step": 21152 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012430177475955488, + "loss": 1.5597, + "step": 21153 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012428959786687458, + "loss": 1.4812, + "step": 21154 + }, + { + "epoch": 1.66, + "learning_rate": 0.0001242774211487537, + "loss": 1.488, + "step": 21155 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012426524460527498, + "loss": 1.4975, + "step": 21156 + }, + { + "epoch": 1.66, + "learning_rate": 0.000124253068236521, + "loss": 1.5283, + "step": 21157 + }, + { + "epoch": 1.66, + "learning_rate": 0.0001242408920425745, + "loss": 1.4898, + "step": 21158 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012422871602351816, + "loss": 1.483, + "step": 21159 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012421654017943457, + "loss": 1.5013, + "step": 21160 + }, + { + "epoch": 1.66, + "learning_rate": 0.00012420436451040647, + "loss": 1.4935, + "step": 21161 + }, + { + "epoch": 1.67, + "learning_rate": 0.0001241921890165164, + "loss": 1.5478, + "step": 21162 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012418001369784727, + "loss": 1.5513, + "step": 21163 + }, + { + "epoch": 1.67, + "learning_rate": 0.0001241678385544815, + "loss": 1.5083, + "step": 21164 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012415566358650192, + "loss": 1.524, + "step": 21165 + }, + { + "epoch": 1.67, + "learning_rate": 0.0001241434887939911, + "loss": 1.5242, + "step": 21166 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012413131417703168, + "loss": 1.5072, + "step": 21167 + }, + { + "epoch": 1.67, + "learning_rate": 0.0001241191397357064, + "loss": 1.5017, + "step": 21168 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012410696547009788, + "loss": 1.5253, + "step": 21169 + }, + { + "epoch": 1.67, + "learning_rate": 0.0001240947913802888, + "loss": 1.5816, + "step": 21170 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012408261746636175, + "loss": 1.5197, + "step": 21171 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012407044372839943, + "loss": 1.5041, + "step": 21172 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012405827016648453, + "loss": 1.5085, + "step": 21173 + }, + { + "epoch": 1.67, + "learning_rate": 0.0001240460967806996, + "loss": 1.4762, + "step": 21174 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012403392357112738, + "loss": 1.5228, + "step": 21175 + }, + { + "epoch": 1.67, + "learning_rate": 0.0001240217505378505, + "loss": 1.4792, + "step": 21176 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012400957768095156, + "loss": 1.5102, + "step": 21177 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012399740500051323, + "loss": 1.4882, + "step": 21178 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012398523249661822, + "loss": 1.5305, + "step": 21179 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012397306016934912, + "loss": 1.4876, + "step": 21180 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012396088801878857, + "loss": 1.4954, + "step": 21181 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012394871604501923, + "loss": 1.5377, + "step": 21182 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012393654424812373, + "loss": 1.5149, + "step": 21183 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012392437262818468, + "loss": 1.5258, + "step": 21184 + }, + { + "epoch": 1.67, + "learning_rate": 0.0001239122011852848, + "loss": 1.4927, + "step": 21185 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012390002991950663, + "loss": 1.5319, + "step": 21186 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012388785883093287, + "loss": 1.505, + "step": 21187 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012387568791964618, + "loss": 1.4866, + "step": 21188 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012386351718572913, + "loss": 1.5032, + "step": 21189 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012385134662926437, + "loss": 1.5263, + "step": 21190 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012383917625033452, + "loss": 1.4591, + "step": 21191 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012382700604902222, + "loss": 1.498, + "step": 21192 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012381483602541015, + "loss": 1.4554, + "step": 21193 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012380266617958082, + "loss": 1.4753, + "step": 21194 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012379049651161696, + "loss": 1.5304, + "step": 21195 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012377832702160116, + "loss": 1.5089, + "step": 21196 + }, + { + "epoch": 1.67, + "learning_rate": 0.0001237661577096161, + "loss": 1.4948, + "step": 21197 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012375398857574432, + "loss": 1.5611, + "step": 21198 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012374181962006848, + "loss": 1.5484, + "step": 21199 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012372965084267117, + "loss": 1.5428, + "step": 21200 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012371748224363505, + "loss": 1.4486, + "step": 21201 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012370531382304274, + "loss": 1.4573, + "step": 21202 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012369314558097682, + "loss": 1.4977, + "step": 21203 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012368097751751993, + "loss": 1.4808, + "step": 21204 + }, + { + "epoch": 1.67, + "learning_rate": 0.0001236688096327547, + "loss": 1.5489, + "step": 21205 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012365664192676368, + "loss": 1.5064, + "step": 21206 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012364447439962956, + "loss": 1.476, + "step": 21207 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012363230705143488, + "loss": 1.4458, + "step": 21208 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012362013988226228, + "loss": 1.5033, + "step": 21209 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012360797289219438, + "loss": 1.4532, + "step": 21210 + }, + { + "epoch": 1.67, + "learning_rate": 0.0001235958060813138, + "loss": 1.5649, + "step": 21211 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012358363944970312, + "loss": 1.5217, + "step": 21212 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012357147299744495, + "loss": 1.4957, + "step": 21213 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012355930672462188, + "loss": 1.4544, + "step": 21214 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012354714063131654, + "loss": 1.5302, + "step": 21215 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012353497471761151, + "loss": 1.4729, + "step": 21216 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012352280898358944, + "loss": 1.5031, + "step": 21217 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012351064342933283, + "loss": 1.4977, + "step": 21218 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012349847805492438, + "loss": 1.4941, + "step": 21219 + }, + { + "epoch": 1.67, + "learning_rate": 0.0001234863128604466, + "loss": 1.481, + "step": 21220 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012347414784598214, + "loss": 1.4848, + "step": 21221 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012346198301161357, + "loss": 1.4578, + "step": 21222 + }, + { + "epoch": 1.67, + "learning_rate": 0.0001234498183574235, + "loss": 1.487, + "step": 21223 + }, + { + "epoch": 1.67, + "learning_rate": 0.0001234376538834945, + "loss": 1.4395, + "step": 21224 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012342548958990912, + "loss": 1.4484, + "step": 21225 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012341332547675008, + "loss": 1.544, + "step": 21226 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012340116154409985, + "loss": 1.5079, + "step": 21227 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012338899779204107, + "loss": 1.5057, + "step": 21228 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012337683422065633, + "loss": 1.5528, + "step": 21229 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012336467083002816, + "loss": 1.4466, + "step": 21230 + }, + { + "epoch": 1.67, + "learning_rate": 0.0001233525076202392, + "loss": 1.536, + "step": 21231 + }, + { + "epoch": 1.67, + "learning_rate": 0.000123340344591372, + "loss": 1.54, + "step": 21232 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012332818174350915, + "loss": 1.4931, + "step": 21233 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012331601907673322, + "loss": 1.4745, + "step": 21234 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012330385659112681, + "loss": 1.5217, + "step": 21235 + }, + { + "epoch": 1.67, + "learning_rate": 0.0001232916942867725, + "loss": 1.5158, + "step": 21236 + }, + { + "epoch": 1.67, + "learning_rate": 0.0001232795321637528, + "loss": 1.5001, + "step": 21237 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012326737022215034, + "loss": 1.4981, + "step": 21238 + }, + { + "epoch": 1.67, + "learning_rate": 0.0001232552084620477, + "loss": 1.469, + "step": 21239 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012324304688352743, + "loss": 1.4726, + "step": 21240 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012323088548667205, + "loss": 1.5154, + "step": 21241 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012321872427156424, + "loss": 1.4398, + "step": 21242 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012320656323828652, + "loss": 1.542, + "step": 21243 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012319440238692144, + "loss": 1.4823, + "step": 21244 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012318224171755157, + "loss": 1.5124, + "step": 21245 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012317008123025953, + "loss": 1.5221, + "step": 21246 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012315792092512776, + "loss": 1.4478, + "step": 21247 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012314576080223896, + "loss": 1.51, + "step": 21248 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012313360086167556, + "loss": 1.5527, + "step": 21249 + }, + { + "epoch": 1.67, + "learning_rate": 0.0001231214411035202, + "loss": 1.492, + "step": 21250 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012310928152785546, + "loss": 1.5022, + "step": 21251 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012309712213476383, + "loss": 1.4677, + "step": 21252 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012308496292432792, + "loss": 1.531, + "step": 21253 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012307280389663023, + "loss": 1.5035, + "step": 21254 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012306064505175334, + "loss": 1.4816, + "step": 21255 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012304848638977978, + "loss": 1.5128, + "step": 21256 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012303632791079214, + "loss": 1.5558, + "step": 21257 + }, + { + "epoch": 1.67, + "learning_rate": 0.000123024169614873, + "loss": 1.4896, + "step": 21258 + }, + { + "epoch": 1.67, + "learning_rate": 0.0001230120115021048, + "loss": 1.5013, + "step": 21259 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012299985357257023, + "loss": 1.4947, + "step": 21260 + }, + { + "epoch": 1.67, + "learning_rate": 0.0001229876958263517, + "loss": 1.4987, + "step": 21261 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012297553826353178, + "loss": 1.5189, + "step": 21262 + }, + { + "epoch": 1.67, + "learning_rate": 0.0001229633808841931, + "loss": 1.5124, + "step": 21263 + }, + { + "epoch": 1.67, + "learning_rate": 0.0001229512236884181, + "loss": 1.5027, + "step": 21264 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012293906667628943, + "loss": 1.501, + "step": 21265 + }, + { + "epoch": 1.67, + "learning_rate": 0.0001229269098478895, + "loss": 1.4797, + "step": 21266 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012291475320330093, + "loss": 1.4768, + "step": 21267 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012290259674260624, + "loss": 1.4859, + "step": 21268 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012289044046588795, + "loss": 1.4962, + "step": 21269 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012287828437322862, + "loss": 1.4716, + "step": 21270 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012286612846471078, + "loss": 1.4764, + "step": 21271 + }, + { + "epoch": 1.67, + "learning_rate": 0.0001228539727404169, + "loss": 1.5017, + "step": 21272 + }, + { + "epoch": 1.67, + "learning_rate": 0.0001228418172004296, + "loss": 1.5362, + "step": 21273 + }, + { + "epoch": 1.67, + "learning_rate": 0.0001228296618448314, + "loss": 1.4851, + "step": 21274 + }, + { + "epoch": 1.67, + "learning_rate": 0.0001228175066737048, + "loss": 1.5003, + "step": 21275 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012280535168713232, + "loss": 1.5637, + "step": 21276 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012279319688519652, + "loss": 1.5072, + "step": 21277 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012278104226797986, + "loss": 1.4891, + "step": 21278 + }, + { + "epoch": 1.67, + "learning_rate": 0.0001227688878355649, + "loss": 1.5303, + "step": 21279 + }, + { + "epoch": 1.67, + "learning_rate": 0.0001227567335880342, + "loss": 1.5231, + "step": 21280 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012274457952547022, + "loss": 1.4983, + "step": 21281 + }, + { + "epoch": 1.67, + "learning_rate": 0.0001227324256479555, + "loss": 1.4658, + "step": 21282 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012272027195557258, + "loss": 1.4953, + "step": 21283 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012270811844840394, + "loss": 1.4629, + "step": 21284 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012269596512653216, + "loss": 1.4505, + "step": 21285 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012268381199003966, + "loss": 1.5504, + "step": 21286 + }, + { + "epoch": 1.67, + "learning_rate": 0.000122671659039009, + "loss": 1.484, + "step": 21287 + }, + { + "epoch": 1.67, + "learning_rate": 0.00012265950627352268, + "loss": 1.5077, + "step": 21288 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012264735369366329, + "loss": 1.4747, + "step": 21289 + }, + { + "epoch": 1.68, + "learning_rate": 0.0001226352012995132, + "loss": 1.5046, + "step": 21290 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012262304909115503, + "loss": 1.5168, + "step": 21291 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012261089706867127, + "loss": 1.5027, + "step": 21292 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012259874523214438, + "loss": 1.5706, + "step": 21293 + }, + { + "epoch": 1.68, + "learning_rate": 0.0001225865935816569, + "loss": 1.5313, + "step": 21294 + }, + { + "epoch": 1.68, + "learning_rate": 0.0001225744421172913, + "loss": 1.4795, + "step": 21295 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012256229083913012, + "loss": 1.5459, + "step": 21296 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012255013974725587, + "loss": 1.4756, + "step": 21297 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012253798884175098, + "loss": 1.5189, + "step": 21298 + }, + { + "epoch": 1.68, + "learning_rate": 0.000122525838122698, + "loss": 1.5421, + "step": 21299 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012251368759017944, + "loss": 1.5024, + "step": 21300 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012250153724427775, + "loss": 1.533, + "step": 21301 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012248938708507549, + "loss": 1.5192, + "step": 21302 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012247723711265504, + "loss": 1.4132, + "step": 21303 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012246508732709894, + "loss": 1.4636, + "step": 21304 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012245293772848977, + "loss": 1.4879, + "step": 21305 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012244078831690993, + "loss": 1.5046, + "step": 21306 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012242863909244195, + "loss": 1.5333, + "step": 21307 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012241649005516827, + "loss": 1.5256, + "step": 21308 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012240434120517143, + "loss": 1.5138, + "step": 21309 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012239219254253387, + "loss": 1.545, + "step": 21310 + }, + { + "epoch": 1.68, + "learning_rate": 0.0001223800440673381, + "loss": 1.5385, + "step": 21311 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012236789577966655, + "loss": 1.5394, + "step": 21312 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012235574767960176, + "loss": 1.5179, + "step": 21313 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012234359976722622, + "loss": 1.4832, + "step": 21314 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012233145204262232, + "loss": 1.5222, + "step": 21315 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012231930450587263, + "loss": 1.5096, + "step": 21316 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012230715715705958, + "loss": 1.5033, + "step": 21317 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012229500999626564, + "loss": 1.5265, + "step": 21318 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012228286302357327, + "loss": 1.5077, + "step": 21319 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012227071623906497, + "loss": 1.4834, + "step": 21320 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012225856964282326, + "loss": 1.5262, + "step": 21321 + }, + { + "epoch": 1.68, + "learning_rate": 0.0001222464232349305, + "loss": 1.4501, + "step": 21322 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012223427701546925, + "loss": 1.4505, + "step": 21323 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012222213098452193, + "loss": 1.4941, + "step": 21324 + }, + { + "epoch": 1.68, + "learning_rate": 0.000122209985142171, + "loss": 1.4711, + "step": 21325 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012219783948849892, + "loss": 1.5277, + "step": 21326 + }, + { + "epoch": 1.68, + "learning_rate": 0.0001221856940235882, + "loss": 1.4374, + "step": 21327 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012217354874752124, + "loss": 1.5413, + "step": 21328 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012216140366038056, + "loss": 1.4866, + "step": 21329 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012214925876224855, + "loss": 1.5087, + "step": 21330 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012213711405320774, + "loss": 1.5399, + "step": 21331 + }, + { + "epoch": 1.68, + "learning_rate": 0.0001221249695333405, + "loss": 1.4789, + "step": 21332 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012211282520272938, + "loss": 1.5415, + "step": 21333 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012210068106145678, + "loss": 1.4927, + "step": 21334 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012208853710960512, + "loss": 1.5164, + "step": 21335 + }, + { + "epoch": 1.68, + "learning_rate": 0.0001220763933472569, + "loss": 1.506, + "step": 21336 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012206424977449456, + "loss": 1.4867, + "step": 21337 + }, + { + "epoch": 1.68, + "learning_rate": 0.0001220521063914006, + "loss": 1.4949, + "step": 21338 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012203996319805738, + "loss": 1.497, + "step": 21339 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012202782019454736, + "loss": 1.4618, + "step": 21340 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012201567738095305, + "loss": 1.5089, + "step": 21341 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012200353475735682, + "loss": 1.5078, + "step": 21342 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012199139232384117, + "loss": 1.4883, + "step": 21343 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012197925008048845, + "loss": 1.4582, + "step": 21344 + }, + { + "epoch": 1.68, + "learning_rate": 0.0001219671080273812, + "loss": 1.4372, + "step": 21345 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012195496616460183, + "loss": 1.4758, + "step": 21346 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012194282449223273, + "loss": 1.4814, + "step": 21347 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012193068301035641, + "loss": 1.5142, + "step": 21348 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012191854171905521, + "loss": 1.4612, + "step": 21349 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012190640061841164, + "loss": 1.5153, + "step": 21350 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012189425970850804, + "loss": 1.5071, + "step": 21351 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012188211898942702, + "loss": 1.5361, + "step": 21352 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012186997846125082, + "loss": 1.5182, + "step": 21353 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012185783812406196, + "loss": 1.51, + "step": 21354 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012184569797794288, + "loss": 1.5089, + "step": 21355 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012183355802297594, + "loss": 1.5039, + "step": 21356 + }, + { + "epoch": 1.68, + "learning_rate": 0.0001218214182592436, + "loss": 1.4943, + "step": 21357 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012180927868682832, + "loss": 1.5506, + "step": 21358 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012179713930581244, + "loss": 1.4934, + "step": 21359 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012178500011627845, + "loss": 1.4646, + "step": 21360 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012177286111830871, + "loss": 1.5339, + "step": 21361 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012176072231198565, + "loss": 1.4714, + "step": 21362 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012174858369739177, + "loss": 1.4789, + "step": 21363 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012173644527460937, + "loss": 1.5097, + "step": 21364 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012172430704372094, + "loss": 1.4862, + "step": 21365 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012171216900480875, + "loss": 1.4829, + "step": 21366 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012170003115795542, + "loss": 1.4968, + "step": 21367 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012168789350324325, + "loss": 1.4659, + "step": 21368 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012167575604075465, + "loss": 1.5311, + "step": 21369 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012166361877057204, + "loss": 1.5308, + "step": 21370 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012165148169277782, + "loss": 1.5202, + "step": 21371 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012163934480745443, + "loss": 1.5175, + "step": 21372 + }, + { + "epoch": 1.68, + "learning_rate": 0.0001216272081146842, + "loss": 1.4841, + "step": 21373 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012161507161454957, + "loss": 1.5086, + "step": 21374 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012160293530713296, + "loss": 1.5395, + "step": 21375 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012159079919251672, + "loss": 1.5394, + "step": 21376 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012157866327078332, + "loss": 1.4747, + "step": 21377 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012156652754201507, + "loss": 1.4848, + "step": 21378 + }, + { + "epoch": 1.68, + "learning_rate": 0.0001215543920062944, + "loss": 1.5322, + "step": 21379 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012154225666370377, + "loss": 1.511, + "step": 21380 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012153012151432547, + "loss": 1.4616, + "step": 21381 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012151798655824189, + "loss": 1.4839, + "step": 21382 + }, + { + "epoch": 1.68, + "learning_rate": 0.0001215058517955355, + "loss": 1.5016, + "step": 21383 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012149371722628868, + "loss": 1.4918, + "step": 21384 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012148158285058377, + "loss": 1.4628, + "step": 21385 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012146944866850316, + "loss": 1.5204, + "step": 21386 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012145731468012928, + "loss": 1.5076, + "step": 21387 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012144518088554449, + "loss": 1.5035, + "step": 21388 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012143304728483115, + "loss": 1.4865, + "step": 21389 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012142091387807162, + "loss": 1.5287, + "step": 21390 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012140878066534834, + "loss": 1.5179, + "step": 21391 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012139664764674368, + "loss": 1.5151, + "step": 21392 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012138451482233998, + "loss": 1.4709, + "step": 21393 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012137238219221965, + "loss": 1.4805, + "step": 21394 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012136024975646502, + "loss": 1.5596, + "step": 21395 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012134811751515848, + "loss": 1.516, + "step": 21396 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012133598546838246, + "loss": 1.4998, + "step": 21397 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012132385361621918, + "loss": 1.5257, + "step": 21398 + }, + { + "epoch": 1.68, + "learning_rate": 0.0001213117219587512, + "loss": 1.4848, + "step": 21399 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012129959049606076, + "loss": 1.434, + "step": 21400 + }, + { + "epoch": 1.68, + "learning_rate": 0.0001212874592282303, + "loss": 1.4971, + "step": 21401 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012127532815534213, + "loss": 1.4906, + "step": 21402 + }, + { + "epoch": 1.68, + "learning_rate": 0.0001212631972774786, + "loss": 1.54, + "step": 21403 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012125106659472215, + "loss": 1.5003, + "step": 21404 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012123893610715506, + "loss": 1.5156, + "step": 21405 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012122680581485975, + "loss": 1.4549, + "step": 21406 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012121467571791853, + "loss": 1.4978, + "step": 21407 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012120254581641376, + "loss": 1.5288, + "step": 21408 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012119041611042786, + "loss": 1.4661, + "step": 21409 + }, + { + "epoch": 1.68, + "learning_rate": 0.0001211782866000431, + "loss": 1.4735, + "step": 21410 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012116615728534185, + "loss": 1.5271, + "step": 21411 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012115402816640653, + "loss": 1.5412, + "step": 21412 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012114189924331941, + "loss": 1.4692, + "step": 21413 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012112977051616283, + "loss": 1.4908, + "step": 21414 + }, + { + "epoch": 1.68, + "learning_rate": 0.00012111764198501924, + "loss": 1.4882, + "step": 21415 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012110551364997092, + "loss": 1.5197, + "step": 21416 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012109338551110018, + "loss": 1.4353, + "step": 21417 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012108125756848945, + "loss": 1.4465, + "step": 21418 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012106912982222098, + "loss": 1.4529, + "step": 21419 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012105700227237714, + "loss": 1.4944, + "step": 21420 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012104487491904036, + "loss": 1.5283, + "step": 21421 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012103274776229283, + "loss": 1.4882, + "step": 21422 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012102062080221697, + "loss": 1.5121, + "step": 21423 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012100849403889514, + "loss": 1.4706, + "step": 21424 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012099636747240959, + "loss": 1.5332, + "step": 21425 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012098424110284273, + "loss": 1.4404, + "step": 21426 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012097211493027684, + "loss": 1.4935, + "step": 21427 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012095998895479427, + "loss": 1.4642, + "step": 21428 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012094786317647732, + "loss": 1.5152, + "step": 21429 + }, + { + "epoch": 1.69, + "learning_rate": 0.0001209357375954084, + "loss": 1.5185, + "step": 21430 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012092361221166975, + "loss": 1.5258, + "step": 21431 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012091148702534374, + "loss": 1.4761, + "step": 21432 + }, + { + "epoch": 1.69, + "learning_rate": 0.0001208993620365127, + "loss": 1.5359, + "step": 21433 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012088723724525892, + "loss": 1.4912, + "step": 21434 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012087511265166474, + "loss": 1.4994, + "step": 21435 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012086298825581247, + "loss": 1.479, + "step": 21436 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012085086405778438, + "loss": 1.5248, + "step": 21437 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012083874005766292, + "loss": 1.4972, + "step": 21438 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012082661625553029, + "loss": 1.4632, + "step": 21439 + }, + { + "epoch": 1.69, + "learning_rate": 0.0001208144926514688, + "loss": 1.4907, + "step": 21440 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012080236924556087, + "loss": 1.4942, + "step": 21441 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012079024603788867, + "loss": 1.5233, + "step": 21442 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012077812302853464, + "loss": 1.5156, + "step": 21443 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012076600021758099, + "loss": 1.4618, + "step": 21444 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012075387760511003, + "loss": 1.6035, + "step": 21445 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012074175519120413, + "loss": 1.5227, + "step": 21446 + }, + { + "epoch": 1.69, + "learning_rate": 0.0001207296329759456, + "loss": 1.5141, + "step": 21447 + }, + { + "epoch": 1.69, + "learning_rate": 0.0001207175109594167, + "loss": 1.5028, + "step": 21448 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012070538914169972, + "loss": 1.4444, + "step": 21449 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012069326752287701, + "loss": 1.5117, + "step": 21450 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012068114610303082, + "loss": 1.4904, + "step": 21451 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012066902488224345, + "loss": 1.5067, + "step": 21452 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012065690386059727, + "loss": 1.4943, + "step": 21453 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012064478303817447, + "loss": 1.4842, + "step": 21454 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012063266241505745, + "loss": 1.5138, + "step": 21455 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012062054199132838, + "loss": 1.5191, + "step": 21456 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012060842176706964, + "loss": 1.5853, + "step": 21457 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012059630174236353, + "loss": 1.5062, + "step": 21458 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012058418191729226, + "loss": 1.5212, + "step": 21459 + }, + { + "epoch": 1.69, + "learning_rate": 0.0001205720622919382, + "loss": 1.4473, + "step": 21460 + }, + { + "epoch": 1.69, + "learning_rate": 0.0001205599428663835, + "loss": 1.4756, + "step": 21461 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012054782364071063, + "loss": 1.5317, + "step": 21462 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012053570461500176, + "loss": 1.4749, + "step": 21463 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012052358578933925, + "loss": 1.4983, + "step": 21464 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012051146716380525, + "loss": 1.4793, + "step": 21465 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012049934873848216, + "loss": 1.4981, + "step": 21466 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012048723051345221, + "loss": 1.5273, + "step": 21467 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012047511248879766, + "loss": 1.4867, + "step": 21468 + }, + { + "epoch": 1.69, + "learning_rate": 0.0001204629946646008, + "loss": 1.5411, + "step": 21469 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012045087704094395, + "loss": 1.4866, + "step": 21470 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012043875961790929, + "loss": 1.4881, + "step": 21471 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012042664239557918, + "loss": 1.4875, + "step": 21472 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012041452537403582, + "loss": 1.4711, + "step": 21473 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012040240855336149, + "loss": 1.5042, + "step": 21474 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012039029193363852, + "loss": 1.486, + "step": 21475 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012037817551494904, + "loss": 1.4848, + "step": 21476 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012036605929737547, + "loss": 1.532, + "step": 21477 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012035394328099999, + "loss": 1.5167, + "step": 21478 + }, + { + "epoch": 1.69, + "learning_rate": 0.0001203418274659049, + "loss": 1.4347, + "step": 21479 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012032971185217239, + "loss": 1.4821, + "step": 21480 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012031759643988479, + "loss": 1.4759, + "step": 21481 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012030548122912435, + "loss": 1.4815, + "step": 21482 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012029336621997326, + "loss": 1.496, + "step": 21483 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012028125141251388, + "loss": 1.5163, + "step": 21484 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012026913680682835, + "loss": 1.5377, + "step": 21485 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012025702240299898, + "loss": 1.4521, + "step": 21486 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012024490820110805, + "loss": 1.502, + "step": 21487 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012023279420123774, + "loss": 1.4525, + "step": 21488 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012022068040347037, + "loss": 1.4957, + "step": 21489 + }, + { + "epoch": 1.69, + "learning_rate": 0.0001202085668078881, + "loss": 1.4864, + "step": 21490 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012019645341457322, + "loss": 1.5423, + "step": 21491 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012018434022360795, + "loss": 1.5031, + "step": 21492 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012017222723507462, + "loss": 1.5593, + "step": 21493 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012016011444905538, + "loss": 1.5042, + "step": 21494 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012014800186563249, + "loss": 1.4622, + "step": 21495 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012013588948488822, + "loss": 1.4643, + "step": 21496 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012012377730690474, + "loss": 1.461, + "step": 21497 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012011166533176436, + "loss": 1.5146, + "step": 21498 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012009955355954928, + "loss": 1.4803, + "step": 21499 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012008744199034171, + "loss": 1.5241, + "step": 21500 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012007533062422394, + "loss": 1.4451, + "step": 21501 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012006321946127811, + "loss": 1.5289, + "step": 21502 + }, + { + "epoch": 1.69, + "learning_rate": 0.0001200511085015865, + "loss": 1.4795, + "step": 21503 + }, + { + "epoch": 1.69, + "learning_rate": 0.0001200389977452314, + "loss": 1.5238, + "step": 21504 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012002688719229491, + "loss": 1.5007, + "step": 21505 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012001477684285933, + "loss": 1.5033, + "step": 21506 + }, + { + "epoch": 1.69, + "learning_rate": 0.00012000266669700688, + "loss": 1.4943, + "step": 21507 + }, + { + "epoch": 1.69, + "learning_rate": 0.00011999055675481973, + "loss": 1.5524, + "step": 21508 + }, + { + "epoch": 1.69, + "learning_rate": 0.00011997844701638017, + "loss": 1.5184, + "step": 21509 + }, + { + "epoch": 1.69, + "learning_rate": 0.00011996633748177036, + "loss": 1.4731, + "step": 21510 + }, + { + "epoch": 1.69, + "learning_rate": 0.00011995422815107259, + "loss": 1.5365, + "step": 21511 + }, + { + "epoch": 1.69, + "learning_rate": 0.00011994211902436901, + "loss": 1.5178, + "step": 21512 + }, + { + "epoch": 1.69, + "learning_rate": 0.00011993001010174188, + "loss": 1.4859, + "step": 21513 + }, + { + "epoch": 1.69, + "learning_rate": 0.00011991790138327336, + "loss": 1.5308, + "step": 21514 + }, + { + "epoch": 1.69, + "learning_rate": 0.00011990579286904567, + "loss": 1.4976, + "step": 21515 + }, + { + "epoch": 1.69, + "learning_rate": 0.00011989368455914109, + "loss": 1.4693, + "step": 21516 + }, + { + "epoch": 1.69, + "learning_rate": 0.00011988157645364174, + "loss": 1.4888, + "step": 21517 + }, + { + "epoch": 1.69, + "learning_rate": 0.0001198694685526299, + "loss": 1.5032, + "step": 21518 + }, + { + "epoch": 1.69, + "learning_rate": 0.0001198573608561877, + "loss": 1.5124, + "step": 21519 + }, + { + "epoch": 1.69, + "learning_rate": 0.00011984525336439739, + "loss": 1.467, + "step": 21520 + }, + { + "epoch": 1.69, + "learning_rate": 0.00011983314607734121, + "loss": 1.4977, + "step": 21521 + }, + { + "epoch": 1.69, + "learning_rate": 0.00011982103899510127, + "loss": 1.5004, + "step": 21522 + }, + { + "epoch": 1.69, + "learning_rate": 0.00011980893211775985, + "loss": 1.4684, + "step": 21523 + }, + { + "epoch": 1.69, + "learning_rate": 0.00011979682544539906, + "loss": 1.4886, + "step": 21524 + }, + { + "epoch": 1.69, + "learning_rate": 0.00011978471897810123, + "loss": 1.4103, + "step": 21525 + }, + { + "epoch": 1.69, + "learning_rate": 0.00011977261271594844, + "loss": 1.4514, + "step": 21526 + }, + { + "epoch": 1.69, + "learning_rate": 0.00011976050665902296, + "loss": 1.4737, + "step": 21527 + }, + { + "epoch": 1.69, + "learning_rate": 0.00011974840080740698, + "loss": 1.4997, + "step": 21528 + }, + { + "epoch": 1.69, + "learning_rate": 0.00011973629516118261, + "loss": 1.4975, + "step": 21529 + }, + { + "epoch": 1.69, + "learning_rate": 0.00011972418972043213, + "loss": 1.4788, + "step": 21530 + }, + { + "epoch": 1.69, + "learning_rate": 0.00011971208448523768, + "loss": 1.5255, + "step": 21531 + }, + { + "epoch": 1.69, + "learning_rate": 0.00011969997945568144, + "loss": 1.519, + "step": 21532 + }, + { + "epoch": 1.69, + "learning_rate": 0.00011968787463184566, + "loss": 1.5204, + "step": 21533 + }, + { + "epoch": 1.69, + "learning_rate": 0.00011967577001381246, + "loss": 1.4941, + "step": 21534 + }, + { + "epoch": 1.69, + "learning_rate": 0.00011966366560166403, + "loss": 1.4406, + "step": 21535 + }, + { + "epoch": 1.69, + "learning_rate": 0.00011965156139548263, + "loss": 1.5003, + "step": 21536 + }, + { + "epoch": 1.69, + "learning_rate": 0.00011963945739535033, + "loss": 1.4469, + "step": 21537 + }, + { + "epoch": 1.69, + "learning_rate": 0.00011962735360134938, + "loss": 1.5315, + "step": 21538 + }, + { + "epoch": 1.69, + "learning_rate": 0.00011961525001356185, + "loss": 1.4969, + "step": 21539 + }, + { + "epoch": 1.69, + "learning_rate": 0.0001196031466320701, + "loss": 1.6015, + "step": 21540 + }, + { + "epoch": 1.69, + "learning_rate": 0.0001195910434569562, + "loss": 1.4983, + "step": 21541 + }, + { + "epoch": 1.69, + "learning_rate": 0.00011957894048830235, + "loss": 1.5032, + "step": 21542 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011956683772619066, + "loss": 1.5289, + "step": 21543 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011955473517070337, + "loss": 1.5344, + "step": 21544 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011954263282192266, + "loss": 1.5459, + "step": 21545 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011953053067993061, + "loss": 1.4862, + "step": 21546 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011951842874480949, + "loss": 1.4886, + "step": 21547 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011950632701664139, + "loss": 1.5196, + "step": 21548 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011949422549550847, + "loss": 1.4527, + "step": 21549 + }, + { + "epoch": 1.7, + "learning_rate": 0.000119482124181493, + "loss": 1.5406, + "step": 21550 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011947002307467702, + "loss": 1.4829, + "step": 21551 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011945792217514272, + "loss": 1.4831, + "step": 21552 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011944582148297232, + "loss": 1.5323, + "step": 21553 + }, + { + "epoch": 1.7, + "learning_rate": 0.0001194337209982479, + "loss": 1.4736, + "step": 21554 + }, + { + "epoch": 1.7, + "learning_rate": 0.0001194216207210516, + "loss": 1.5183, + "step": 21555 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011940952065146566, + "loss": 1.4709, + "step": 21556 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011939742078957224, + "loss": 1.5245, + "step": 21557 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011938532113545339, + "loss": 1.4484, + "step": 21558 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011937322168919137, + "loss": 1.4169, + "step": 21559 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011936112245086822, + "loss": 1.5267, + "step": 21560 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011934902342056614, + "loss": 1.4161, + "step": 21561 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011933692459836735, + "loss": 1.5142, + "step": 21562 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011932482598435384, + "loss": 1.5096, + "step": 21563 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011931272757860785, + "loss": 1.5489, + "step": 21564 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011930062938121154, + "loss": 1.4874, + "step": 21565 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011928853139224698, + "loss": 1.4895, + "step": 21566 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011927643361179639, + "loss": 1.5226, + "step": 21567 + }, + { + "epoch": 1.7, + "learning_rate": 0.0001192643360399418, + "loss": 1.5422, + "step": 21568 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011925223867676542, + "loss": 1.5371, + "step": 21569 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011924014152234943, + "loss": 1.5061, + "step": 21570 + }, + { + "epoch": 1.7, + "learning_rate": 0.0001192280445767758, + "loss": 1.5074, + "step": 21571 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011921594784012682, + "loss": 1.4699, + "step": 21572 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011920385131248457, + "loss": 1.4558, + "step": 21573 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011919175499393119, + "loss": 1.5069, + "step": 21574 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011917965888454877, + "loss": 1.4485, + "step": 21575 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011916756298441948, + "loss": 1.5545, + "step": 21576 + }, + { + "epoch": 1.7, + "learning_rate": 0.0001191554672936254, + "loss": 1.5062, + "step": 21577 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011914337181224867, + "loss": 1.5244, + "step": 21578 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011913127654037146, + "loss": 1.5448, + "step": 21579 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011911918147807581, + "loss": 1.5402, + "step": 21580 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011910708662544388, + "loss": 1.5194, + "step": 21581 + }, + { + "epoch": 1.7, + "learning_rate": 0.0001190949919825578, + "loss": 1.4934, + "step": 21582 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011908289754949964, + "loss": 1.4823, + "step": 21583 + }, + { + "epoch": 1.7, + "learning_rate": 0.0001190708033263516, + "loss": 1.5152, + "step": 21584 + }, + { + "epoch": 1.7, + "learning_rate": 0.0001190587093131957, + "loss": 1.5233, + "step": 21585 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011904661551011404, + "loss": 1.5369, + "step": 21586 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011903452191718881, + "loss": 1.5572, + "step": 21587 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011902242853450214, + "loss": 1.4551, + "step": 21588 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011901033536213604, + "loss": 1.484, + "step": 21589 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011899824240017266, + "loss": 1.5057, + "step": 21590 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011898614964869413, + "loss": 1.4681, + "step": 21591 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011897405710778252, + "loss": 1.5077, + "step": 21592 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011896196477751992, + "loss": 1.4724, + "step": 21593 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011894987265798849, + "loss": 1.4572, + "step": 21594 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011893778074927026, + "loss": 1.4778, + "step": 21595 + }, + { + "epoch": 1.7, + "learning_rate": 0.0001189256890514474, + "loss": 1.5069, + "step": 21596 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011891359756460192, + "loss": 1.4426, + "step": 21597 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011890150628881596, + "loss": 1.4473, + "step": 21598 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011888941522417162, + "loss": 1.5082, + "step": 21599 + }, + { + "epoch": 1.7, + "learning_rate": 0.000118877324370751, + "loss": 1.4897, + "step": 21600 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011886523372863617, + "loss": 1.4622, + "step": 21601 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011885314329790911, + "loss": 1.5669, + "step": 21602 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011884105307865213, + "loss": 1.5222, + "step": 21603 + }, + { + "epoch": 1.7, + "learning_rate": 0.0001188289630709472, + "loss": 1.4794, + "step": 21604 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011881687327487638, + "loss": 1.5106, + "step": 21605 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011880478369052183, + "loss": 1.4657, + "step": 21606 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011879269431796553, + "loss": 1.5357, + "step": 21607 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011878060515728966, + "loss": 1.4815, + "step": 21608 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011876851620857622, + "loss": 1.537, + "step": 21609 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011875642747190733, + "loss": 1.471, + "step": 21610 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011874433894736508, + "loss": 1.4808, + "step": 21611 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011873225063503147, + "loss": 1.4701, + "step": 21612 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011872016253498867, + "loss": 1.459, + "step": 21613 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011870807464731868, + "loss": 1.5109, + "step": 21614 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011869598697210359, + "loss": 1.469, + "step": 21615 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011868389950942551, + "loss": 1.5093, + "step": 21616 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011867181225936643, + "loss": 1.4654, + "step": 21617 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011865972522200841, + "loss": 1.5158, + "step": 21618 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011864763839743362, + "loss": 1.5314, + "step": 21619 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011863555178572409, + "loss": 1.4894, + "step": 21620 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011862346538696182, + "loss": 1.5045, + "step": 21621 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011861137920122891, + "loss": 1.4674, + "step": 21622 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011859929322860745, + "loss": 1.4562, + "step": 21623 + }, + { + "epoch": 1.7, + "learning_rate": 0.0001185872074691794, + "loss": 1.5016, + "step": 21624 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011857512192302693, + "loss": 1.5228, + "step": 21625 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011856303659023201, + "loss": 1.4864, + "step": 21626 + }, + { + "epoch": 1.7, + "learning_rate": 0.0001185509514708767, + "loss": 1.4566, + "step": 21627 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011853886656504313, + "loss": 1.4574, + "step": 21628 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011852678187281326, + "loss": 1.4946, + "step": 21629 + }, + { + "epoch": 1.7, + "learning_rate": 0.0001185146973942692, + "loss": 1.5484, + "step": 21630 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011850261312949295, + "loss": 1.5019, + "step": 21631 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011849052907856656, + "loss": 1.5157, + "step": 21632 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011847844524157213, + "loss": 1.5345, + "step": 21633 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011846636161859154, + "loss": 1.5075, + "step": 21634 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011845427820970708, + "loss": 1.5105, + "step": 21635 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011844219501500062, + "loss": 1.4903, + "step": 21636 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011843011203455427, + "loss": 1.47, + "step": 21637 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011841802926845003, + "loss": 1.4797, + "step": 21638 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011840594671676992, + "loss": 1.487, + "step": 21639 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011839386437959603, + "loss": 1.513, + "step": 21640 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011838178225701031, + "loss": 1.5482, + "step": 21641 + }, + { + "epoch": 1.7, + "learning_rate": 0.0001183697003490949, + "loss": 1.5106, + "step": 21642 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011835761865593172, + "loss": 1.5402, + "step": 21643 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011834553717760286, + "loss": 1.5133, + "step": 21644 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011833345591419037, + "loss": 1.4774, + "step": 21645 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011832137486577619, + "loss": 1.5177, + "step": 21646 + }, + { + "epoch": 1.7, + "learning_rate": 0.0001183092940324424, + "loss": 1.4412, + "step": 21647 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011829721341427105, + "loss": 1.5121, + "step": 21648 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011828513301134406, + "loss": 1.5466, + "step": 21649 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011827305282374356, + "loss": 1.5031, + "step": 21650 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011826097285155151, + "loss": 1.5064, + "step": 21651 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011824889309484997, + "loss": 1.5155, + "step": 21652 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011823681355372089, + "loss": 1.4834, + "step": 21653 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011822473422824636, + "loss": 1.5416, + "step": 21654 + }, + { + "epoch": 1.7, + "learning_rate": 0.0001182126551185083, + "loss": 1.5001, + "step": 21655 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011820057622458878, + "loss": 1.4959, + "step": 21656 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011818849754656982, + "loss": 1.5275, + "step": 21657 + }, + { + "epoch": 1.7, + "learning_rate": 0.0001181764190845334, + "loss": 1.4808, + "step": 21658 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011816434083856155, + "loss": 1.4909, + "step": 21659 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011815226280873624, + "loss": 1.5266, + "step": 21660 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011814018499513948, + "loss": 1.5244, + "step": 21661 + }, + { + "epoch": 1.7, + "learning_rate": 0.0001181281073978533, + "loss": 1.4977, + "step": 21662 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011811603001695967, + "loss": 1.5004, + "step": 21663 + }, + { + "epoch": 1.7, + "learning_rate": 0.0001181039528525406, + "loss": 1.4648, + "step": 21664 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011809187590467803, + "loss": 1.5262, + "step": 21665 + }, + { + "epoch": 1.7, + "learning_rate": 0.0001180797991734541, + "loss": 1.5244, + "step": 21666 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011806772265895069, + "loss": 1.4891, + "step": 21667 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011805564636124982, + "loss": 1.4786, + "step": 21668 + }, + { + "epoch": 1.7, + "learning_rate": 0.00011804357028043351, + "loss": 1.5007, + "step": 21669 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011803149441658369, + "loss": 1.4543, + "step": 21670 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011801941876978241, + "loss": 1.4938, + "step": 21671 + }, + { + "epoch": 1.71, + "learning_rate": 0.0001180073433401116, + "loss": 1.56, + "step": 21672 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011799526812765328, + "loss": 1.528, + "step": 21673 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011798319313248945, + "loss": 1.4719, + "step": 21674 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011797111835470206, + "loss": 1.507, + "step": 21675 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011795904379437308, + "loss": 1.5946, + "step": 21676 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011794696945158453, + "loss": 1.5284, + "step": 21677 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011793489532641835, + "loss": 1.5054, + "step": 21678 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011792282141895659, + "loss": 1.4852, + "step": 21679 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011791074772928112, + "loss": 1.5357, + "step": 21680 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011789867425747394, + "loss": 1.5356, + "step": 21681 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011788660100361706, + "loss": 1.4826, + "step": 21682 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011787452796779248, + "loss": 1.5301, + "step": 21683 + }, + { + "epoch": 1.71, + "learning_rate": 0.0001178624551500821, + "loss": 1.5182, + "step": 21684 + }, + { + "epoch": 1.71, + "learning_rate": 0.0001178503825505679, + "loss": 1.4864, + "step": 21685 + }, + { + "epoch": 1.71, + "learning_rate": 0.0001178383101693319, + "loss": 1.4372, + "step": 21686 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011782623800645602, + "loss": 1.5054, + "step": 21687 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011781416606202223, + "loss": 1.5361, + "step": 21688 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011780209433611247, + "loss": 1.4908, + "step": 21689 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011779002282880872, + "loss": 1.5077, + "step": 21690 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011777795154019296, + "loss": 1.4826, + "step": 21691 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011776588047034711, + "loss": 1.4563, + "step": 21692 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011775380961935316, + "loss": 1.5122, + "step": 21693 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011774173898729304, + "loss": 1.5389, + "step": 21694 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011772966857424871, + "loss": 1.4913, + "step": 21695 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011771759838030207, + "loss": 1.5403, + "step": 21696 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011770552840553516, + "loss": 1.5086, + "step": 21697 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011769345865002993, + "loss": 1.4935, + "step": 21698 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011768138911386826, + "loss": 1.473, + "step": 21699 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011766931979713214, + "loss": 1.4336, + "step": 21700 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011765725069990347, + "loss": 1.4842, + "step": 21701 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011764518182226421, + "loss": 1.531, + "step": 21702 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011763311316429636, + "loss": 1.5034, + "step": 21703 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011762104472608177, + "loss": 1.5245, + "step": 21704 + }, + { + "epoch": 1.71, + "learning_rate": 0.0001176089765077024, + "loss": 1.5292, + "step": 21705 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011759690850924027, + "loss": 1.5075, + "step": 21706 + }, + { + "epoch": 1.71, + "learning_rate": 0.0001175848407307772, + "loss": 1.4793, + "step": 21707 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011757277317239521, + "loss": 1.5059, + "step": 21708 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011756070583417617, + "loss": 1.544, + "step": 21709 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011754863871620203, + "loss": 1.4878, + "step": 21710 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011753657181855475, + "loss": 1.4575, + "step": 21711 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011752450514131617, + "loss": 1.5104, + "step": 21712 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011751243868456832, + "loss": 1.4892, + "step": 21713 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011750037244839306, + "loss": 1.5046, + "step": 21714 + }, + { + "epoch": 1.71, + "learning_rate": 0.0001174883064328724, + "loss": 1.4801, + "step": 21715 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011747624063808815, + "loss": 1.4941, + "step": 21716 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011746417506412228, + "loss": 1.5244, + "step": 21717 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011745210971105673, + "loss": 1.5306, + "step": 21718 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011744004457897338, + "loss": 1.444, + "step": 21719 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011742797966795418, + "loss": 1.4778, + "step": 21720 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011741591497808099, + "loss": 1.5031, + "step": 21721 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011740385050943576, + "loss": 1.4679, + "step": 21722 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011739178626210042, + "loss": 1.495, + "step": 21723 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011737972223615684, + "loss": 1.4789, + "step": 21724 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011736765843168697, + "loss": 1.5634, + "step": 21725 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011735559484877266, + "loss": 1.4928, + "step": 21726 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011734353148749584, + "loss": 1.5092, + "step": 21727 + }, + { + "epoch": 1.71, + "learning_rate": 0.0001173314683479384, + "loss": 1.5391, + "step": 21728 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011731940543018231, + "loss": 1.5576, + "step": 21729 + }, + { + "epoch": 1.71, + "learning_rate": 0.0001173073427343094, + "loss": 1.4675, + "step": 21730 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011729528026040158, + "loss": 1.4554, + "step": 21731 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011728321800854081, + "loss": 1.5468, + "step": 21732 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011727115597880888, + "loss": 1.4949, + "step": 21733 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011725909417128776, + "loss": 1.4844, + "step": 21734 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011724703258605935, + "loss": 1.4894, + "step": 21735 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011723497122320549, + "loss": 1.5277, + "step": 21736 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011722291008280812, + "loss": 1.4879, + "step": 21737 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011721084916494906, + "loss": 1.4581, + "step": 21738 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011719878846971024, + "loss": 1.4552, + "step": 21739 + }, + { + "epoch": 1.71, + "learning_rate": 0.0001171867279971736, + "loss": 1.5276, + "step": 21740 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011717466774742092, + "loss": 1.4879, + "step": 21741 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011716260772053415, + "loss": 1.5284, + "step": 21742 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011715054791659514, + "loss": 1.4829, + "step": 21743 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011713848833568573, + "loss": 1.5225, + "step": 21744 + }, + { + "epoch": 1.71, + "learning_rate": 0.0001171264289778879, + "loss": 1.4853, + "step": 21745 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011711436984328347, + "loss": 1.4977, + "step": 21746 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011710231093195437, + "loss": 1.4956, + "step": 21747 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011709025224398237, + "loss": 1.4475, + "step": 21748 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011707819377944944, + "loss": 1.557, + "step": 21749 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011706613553843736, + "loss": 1.4646, + "step": 21750 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011705407752102806, + "loss": 1.4843, + "step": 21751 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011704201972730343, + "loss": 1.4955, + "step": 21752 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011702996215734525, + "loss": 1.4307, + "step": 21753 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011701790481123548, + "loss": 1.4937, + "step": 21754 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011700584768905588, + "loss": 1.4803, + "step": 21755 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011699379079088839, + "loss": 1.5109, + "step": 21756 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011698173411681487, + "loss": 1.5359, + "step": 21757 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011696967766691713, + "loss": 1.4953, + "step": 21758 + }, + { + "epoch": 1.71, + "learning_rate": 0.000116957621441277, + "loss": 1.4488, + "step": 21759 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011694556543997643, + "loss": 1.5283, + "step": 21760 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011693350966309725, + "loss": 1.4602, + "step": 21761 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011692145411072126, + "loss": 1.5352, + "step": 21762 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011690939878293037, + "loss": 1.5044, + "step": 21763 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011689734367980642, + "loss": 1.5356, + "step": 21764 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011688528880143119, + "loss": 1.494, + "step": 21765 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011687323414788663, + "loss": 1.5042, + "step": 21766 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011686117971925447, + "loss": 1.4992, + "step": 21767 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011684912551561664, + "loss": 1.4584, + "step": 21768 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011683707153705497, + "loss": 1.4876, + "step": 21769 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011682501778365127, + "loss": 1.4736, + "step": 21770 + }, + { + "epoch": 1.71, + "learning_rate": 0.0001168129642554874, + "loss": 1.4856, + "step": 21771 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011680091095264516, + "loss": 1.4931, + "step": 21772 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011678885787520643, + "loss": 1.5092, + "step": 21773 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011677680502325305, + "loss": 1.4945, + "step": 21774 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011676475239686673, + "loss": 1.4686, + "step": 21775 + }, + { + "epoch": 1.71, + "learning_rate": 0.0001167526999961295, + "loss": 1.502, + "step": 21776 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011674064782112306, + "loss": 1.4837, + "step": 21777 + }, + { + "epoch": 1.71, + "learning_rate": 0.0001167285958719293, + "loss": 1.4697, + "step": 21778 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011671654414862998, + "loss": 1.4899, + "step": 21779 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011670449265130696, + "loss": 1.5091, + "step": 21780 + }, + { + "epoch": 1.71, + "learning_rate": 0.0001166924413800421, + "loss": 1.4932, + "step": 21781 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011668039033491711, + "loss": 1.5346, + "step": 21782 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011666833951601395, + "loss": 1.5021, + "step": 21783 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011665628892341433, + "loss": 1.489, + "step": 21784 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011664423855720012, + "loss": 1.4885, + "step": 21785 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011663218841745314, + "loss": 1.4825, + "step": 21786 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011662013850425516, + "loss": 1.4402, + "step": 21787 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011660808881768803, + "loss": 1.5133, + "step": 21788 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011659603935783357, + "loss": 1.4744, + "step": 21789 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011658399012477353, + "loss": 1.5261, + "step": 21790 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011657194111858974, + "loss": 1.501, + "step": 21791 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011655989233936404, + "loss": 1.5039, + "step": 21792 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011654784378717825, + "loss": 1.499, + "step": 21793 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011653579546211413, + "loss": 1.4708, + "step": 21794 + }, + { + "epoch": 1.71, + "learning_rate": 0.0001165237473642535, + "loss": 1.4568, + "step": 21795 + }, + { + "epoch": 1.71, + "learning_rate": 0.00011651169949367813, + "loss": 1.5327, + "step": 21796 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011649965185046984, + "loss": 1.4441, + "step": 21797 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011648760443471045, + "loss": 1.4718, + "step": 21798 + }, + { + "epoch": 1.72, + "learning_rate": 0.0001164755572464817, + "loss": 1.5542, + "step": 21799 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011646351028586544, + "loss": 1.5415, + "step": 21800 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011645146355294344, + "loss": 1.4788, + "step": 21801 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011643941704779747, + "loss": 1.5376, + "step": 21802 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011642737077050936, + "loss": 1.4918, + "step": 21803 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011641532472116087, + "loss": 1.5142, + "step": 21804 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011640327889983377, + "loss": 1.474, + "step": 21805 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011639123330660983, + "loss": 1.4919, + "step": 21806 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011637918794157096, + "loss": 1.5138, + "step": 21807 + }, + { + "epoch": 1.72, + "learning_rate": 0.0001163671428047988, + "loss": 1.4818, + "step": 21808 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011635509789637518, + "loss": 1.4592, + "step": 21809 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011634305321638191, + "loss": 1.5153, + "step": 21810 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011633100876490072, + "loss": 1.5415, + "step": 21811 + }, + { + "epoch": 1.72, + "learning_rate": 0.0001163189645420134, + "loss": 1.5633, + "step": 21812 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011630692054780172, + "loss": 1.4835, + "step": 21813 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011629487678234742, + "loss": 1.5361, + "step": 21814 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011628283324573238, + "loss": 1.5168, + "step": 21815 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011627078993803824, + "loss": 1.5538, + "step": 21816 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011625874685934683, + "loss": 1.5534, + "step": 21817 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011624670400973996, + "loss": 1.5094, + "step": 21818 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011623466138929928, + "loss": 1.5114, + "step": 21819 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011622261899810666, + "loss": 1.462, + "step": 21820 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011621057683624378, + "loss": 1.4697, + "step": 21821 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011619853490379242, + "loss": 1.5199, + "step": 21822 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011618649320083437, + "loss": 1.5217, + "step": 21823 + }, + { + "epoch": 1.72, + "learning_rate": 0.0001161744517274514, + "loss": 1.5031, + "step": 21824 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011616241048372522, + "loss": 1.4758, + "step": 21825 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011615036946973759, + "loss": 1.4821, + "step": 21826 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011613832868557032, + "loss": 1.5424, + "step": 21827 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011612628813130506, + "loss": 1.432, + "step": 21828 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011611424780702362, + "loss": 1.5258, + "step": 21829 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011610220771280778, + "loss": 1.5107, + "step": 21830 + }, + { + "epoch": 1.72, + "learning_rate": 0.0001160901678487392, + "loss": 1.5418, + "step": 21831 + }, + { + "epoch": 1.72, + "learning_rate": 0.0001160781282148997, + "loss": 1.5465, + "step": 21832 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011606608881137095, + "loss": 1.5296, + "step": 21833 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011605404963823474, + "loss": 1.4953, + "step": 21834 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011604201069557283, + "loss": 1.5021, + "step": 21835 + }, + { + "epoch": 1.72, + "learning_rate": 0.0001160299719834669, + "loss": 1.5264, + "step": 21836 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011601793350199873, + "loss": 1.5237, + "step": 21837 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011600589525124995, + "loss": 1.4743, + "step": 21838 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011599385723130249, + "loss": 1.4846, + "step": 21839 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011598181944223793, + "loss": 1.5016, + "step": 21840 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011596978188413807, + "loss": 1.4983, + "step": 21841 + }, + { + "epoch": 1.72, + "learning_rate": 0.0001159577445570846, + "loss": 1.5422, + "step": 21842 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011594570746115924, + "loss": 1.4817, + "step": 21843 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011593367059644377, + "loss": 1.4687, + "step": 21844 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011592163396301983, + "loss": 1.5071, + "step": 21845 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011590959756096922, + "loss": 1.4531, + "step": 21846 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011589756139037365, + "loss": 1.5099, + "step": 21847 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011588552545131478, + "loss": 1.5048, + "step": 21848 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011587348974387441, + "loss": 1.4703, + "step": 21849 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011586145426813417, + "loss": 1.4876, + "step": 21850 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011584941902417583, + "loss": 1.5792, + "step": 21851 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011583738401208111, + "loss": 1.5129, + "step": 21852 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011582534923193166, + "loss": 1.4772, + "step": 21853 + }, + { + "epoch": 1.72, + "learning_rate": 0.0001158133146838092, + "loss": 1.5065, + "step": 21854 + }, + { + "epoch": 1.72, + "learning_rate": 0.0001158012803677955, + "loss": 1.5115, + "step": 21855 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011578924628397227, + "loss": 1.5596, + "step": 21856 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011577721243242117, + "loss": 1.5103, + "step": 21857 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011576517881322387, + "loss": 1.4645, + "step": 21858 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011575314542646217, + "loss": 1.497, + "step": 21859 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011574111227221767, + "loss": 1.5305, + "step": 21860 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011572907935057216, + "loss": 1.5523, + "step": 21861 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011571704666160724, + "loss": 1.4699, + "step": 21862 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011570501420540468, + "loss": 1.4998, + "step": 21863 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011569298198204616, + "loss": 1.5148, + "step": 21864 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011568094999161332, + "loss": 1.4403, + "step": 21865 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011566891823418795, + "loss": 1.537, + "step": 21866 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011565688670985163, + "loss": 1.5663, + "step": 21867 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011564485541868609, + "loss": 1.52, + "step": 21868 + }, + { + "epoch": 1.72, + "learning_rate": 0.000115632824360773, + "loss": 1.4904, + "step": 21869 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011562079353619413, + "loss": 1.5177, + "step": 21870 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011560876294503105, + "loss": 1.5503, + "step": 21871 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011559673258736552, + "loss": 1.5356, + "step": 21872 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011558470246327922, + "loss": 1.4913, + "step": 21873 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011557267257285374, + "loss": 1.5184, + "step": 21874 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011556064291617085, + "loss": 1.4641, + "step": 21875 + }, + { + "epoch": 1.72, + "learning_rate": 0.0001155486134933122, + "loss": 1.5139, + "step": 21876 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011553658430435943, + "loss": 1.4969, + "step": 21877 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011552455534939425, + "loss": 1.5087, + "step": 21878 + }, + { + "epoch": 1.72, + "learning_rate": 0.0001155125266284983, + "loss": 1.5017, + "step": 21879 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011550049814175326, + "loss": 1.4887, + "step": 21880 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011548846988924081, + "loss": 1.4585, + "step": 21881 + }, + { + "epoch": 1.72, + "learning_rate": 0.0001154764418710426, + "loss": 1.4869, + "step": 21882 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011546441408724029, + "loss": 1.4536, + "step": 21883 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011545238653791557, + "loss": 1.5074, + "step": 21884 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011544035922315002, + "loss": 1.4954, + "step": 21885 + }, + { + "epoch": 1.72, + "learning_rate": 0.0001154283321430254, + "loss": 1.5201, + "step": 21886 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011541630529762333, + "loss": 1.4452, + "step": 21887 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011540427868702549, + "loss": 1.4284, + "step": 21888 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011539225231131347, + "loss": 1.6, + "step": 21889 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011538022617056898, + "loss": 1.4925, + "step": 21890 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011536820026487365, + "loss": 1.5019, + "step": 21891 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011535617459430909, + "loss": 1.4889, + "step": 21892 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011534414915895704, + "loss": 1.4703, + "step": 21893 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011533212395889905, + "loss": 1.4774, + "step": 21894 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011532009899421685, + "loss": 1.4353, + "step": 21895 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011530807426499201, + "loss": 1.466, + "step": 21896 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011529604977130619, + "loss": 1.4694, + "step": 21897 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011528402551324109, + "loss": 1.4774, + "step": 21898 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011527200149087825, + "loss": 1.5012, + "step": 21899 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011525997770429937, + "loss": 1.5184, + "step": 21900 + }, + { + "epoch": 1.72, + "learning_rate": 0.000115247954153586, + "loss": 1.5062, + "step": 21901 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011523593083881994, + "loss": 1.5275, + "step": 21902 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011522390776008271, + "loss": 1.4936, + "step": 21903 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011521188491745593, + "loss": 1.4416, + "step": 21904 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011519986231102129, + "loss": 1.5371, + "step": 21905 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011518783994086033, + "loss": 1.4748, + "step": 21906 + }, + { + "epoch": 1.72, + "learning_rate": 0.0001151758178070548, + "loss": 1.522, + "step": 21907 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011516379590968619, + "loss": 1.4949, + "step": 21908 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011515177424883618, + "loss": 1.5433, + "step": 21909 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011513975282458643, + "loss": 1.5048, + "step": 21910 + }, + { + "epoch": 1.72, + "learning_rate": 0.0001151277316370185, + "loss": 1.5097, + "step": 21911 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011511571068621402, + "loss": 1.4218, + "step": 21912 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011510368997225464, + "loss": 1.4586, + "step": 21913 + }, + { + "epoch": 1.72, + "learning_rate": 0.0001150916694952219, + "loss": 1.4927, + "step": 21914 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011507964925519752, + "loss": 1.468, + "step": 21915 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011506762925226295, + "loss": 1.4981, + "step": 21916 + }, + { + "epoch": 1.72, + "learning_rate": 0.0001150556094865, + "loss": 1.532, + "step": 21917 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011504358995799012, + "loss": 1.4571, + "step": 21918 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011503157066681504, + "loss": 1.4705, + "step": 21919 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011501955161305623, + "loss": 1.488, + "step": 21920 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011500753279679539, + "loss": 1.4521, + "step": 21921 + }, + { + "epoch": 1.72, + "learning_rate": 0.0001149955142181141, + "loss": 1.5566, + "step": 21922 + }, + { + "epoch": 1.72, + "learning_rate": 0.00011498349587709395, + "loss": 1.4782, + "step": 21923 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011497147777381656, + "loss": 1.4882, + "step": 21924 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011495945990836345, + "loss": 1.5078, + "step": 21925 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011494744228081631, + "loss": 1.4632, + "step": 21926 + }, + { + "epoch": 1.73, + "learning_rate": 0.0001149354248912567, + "loss": 1.5036, + "step": 21927 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011492340773976616, + "loss": 1.496, + "step": 21928 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011491139082642636, + "loss": 1.4721, + "step": 21929 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011489937415131884, + "loss": 1.4573, + "step": 21930 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011488735771452521, + "loss": 1.452, + "step": 21931 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011487534151612698, + "loss": 1.501, + "step": 21932 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011486332555620586, + "loss": 1.4838, + "step": 21933 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011485130983484338, + "loss": 1.51, + "step": 21934 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011483929435212109, + "loss": 1.5409, + "step": 21935 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011482727910812061, + "loss": 1.5138, + "step": 21936 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011481526410292347, + "loss": 1.4601, + "step": 21937 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011480324933661126, + "loss": 1.4668, + "step": 21938 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011479123480926561, + "loss": 1.5292, + "step": 21939 + }, + { + "epoch": 1.73, + "learning_rate": 0.000114779220520968, + "loss": 1.5164, + "step": 21940 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011476720647180006, + "loss": 1.4796, + "step": 21941 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011475519266184337, + "loss": 1.5116, + "step": 21942 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011474317909117944, + "loss": 1.4171, + "step": 21943 + }, + { + "epoch": 1.73, + "learning_rate": 0.0001147311657598899, + "loss": 1.4449, + "step": 21944 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011471915266805624, + "loss": 1.5341, + "step": 21945 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011470713981576008, + "loss": 1.4861, + "step": 21946 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011469512720308299, + "loss": 1.4571, + "step": 21947 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011468311483010644, + "loss": 1.5567, + "step": 21948 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011467110269691208, + "loss": 1.5348, + "step": 21949 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011465909080358144, + "loss": 1.5227, + "step": 21950 + }, + { + "epoch": 1.73, + "learning_rate": 0.0001146470791501961, + "loss": 1.5149, + "step": 21951 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011463506773683756, + "loss": 1.5066, + "step": 21952 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011462305656358741, + "loss": 1.5197, + "step": 21953 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011461104563052715, + "loss": 1.5093, + "step": 21954 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011459903493773839, + "loss": 1.49, + "step": 21955 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011458702448530265, + "loss": 1.4679, + "step": 21956 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011457501427330145, + "loss": 1.5195, + "step": 21957 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011456300430181636, + "loss": 1.4719, + "step": 21958 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011455099457092893, + "loss": 1.473, + "step": 21959 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011453898508072067, + "loss": 1.4846, + "step": 21960 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011452697583127316, + "loss": 1.5012, + "step": 21961 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011451496682266787, + "loss": 1.4668, + "step": 21962 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011450295805498637, + "loss": 1.4933, + "step": 21963 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011449094952831017, + "loss": 1.5032, + "step": 21964 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011447894124272089, + "loss": 1.4718, + "step": 21965 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011446693319829996, + "loss": 1.4638, + "step": 21966 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011445492539512896, + "loss": 1.4554, + "step": 21967 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011444291783328943, + "loss": 1.4749, + "step": 21968 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011443091051286282, + "loss": 1.4621, + "step": 21969 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011441890343393071, + "loss": 1.524, + "step": 21970 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011440689659657464, + "loss": 1.5302, + "step": 21971 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011439489000087607, + "loss": 1.49, + "step": 21972 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011438288364691657, + "loss": 1.4521, + "step": 21973 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011437087753477761, + "loss": 1.4869, + "step": 21974 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011435887166454074, + "loss": 1.4977, + "step": 21975 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011434686603628748, + "loss": 1.4957, + "step": 21976 + }, + { + "epoch": 1.73, + "learning_rate": 0.0001143348606500993, + "loss": 1.4507, + "step": 21977 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011432285550605777, + "loss": 1.4978, + "step": 21978 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011431085060424426, + "loss": 1.4572, + "step": 21979 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011429884594474047, + "loss": 1.4642, + "step": 21980 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011428684152762778, + "loss": 1.5046, + "step": 21981 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011427483735298775, + "loss": 1.4848, + "step": 21982 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011426283342090188, + "loss": 1.5113, + "step": 21983 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011425082973145161, + "loss": 1.4739, + "step": 21984 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011423882628471852, + "loss": 1.5461, + "step": 21985 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011422682308078403, + "loss": 1.5106, + "step": 21986 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011421482011972967, + "loss": 1.4884, + "step": 21987 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011420281740163697, + "loss": 1.5756, + "step": 21988 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011419081492658736, + "loss": 1.465, + "step": 21989 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011417881269466236, + "loss": 1.5383, + "step": 21990 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011416681070594343, + "loss": 1.5478, + "step": 21991 + }, + { + "epoch": 1.73, + "learning_rate": 0.0001141548089605121, + "loss": 1.5555, + "step": 21992 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011414280745844985, + "loss": 1.4659, + "step": 21993 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011413080619983814, + "loss": 1.5253, + "step": 21994 + }, + { + "epoch": 1.73, + "learning_rate": 0.0001141188051847584, + "loss": 1.4709, + "step": 21995 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011410680441329222, + "loss": 1.4962, + "step": 21996 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011409480388552105, + "loss": 1.4983, + "step": 21997 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011408280360152633, + "loss": 1.5203, + "step": 21998 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011407080356138956, + "loss": 1.4904, + "step": 21999 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011405880376519222, + "loss": 1.5718, + "step": 22000 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011404680421301575, + "loss": 1.5214, + "step": 22001 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011403480490494166, + "loss": 1.5165, + "step": 22002 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011402280584105137, + "loss": 1.4844, + "step": 22003 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011401080702142637, + "loss": 1.4727, + "step": 22004 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011399880844614818, + "loss": 1.5617, + "step": 22005 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011398681011529816, + "loss": 1.4765, + "step": 22006 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011397481202895786, + "loss": 1.4933, + "step": 22007 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011396281418720869, + "loss": 1.52, + "step": 22008 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011395081659013211, + "loss": 1.4937, + "step": 22009 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011393881923780964, + "loss": 1.5215, + "step": 22010 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011392682213032258, + "loss": 1.4979, + "step": 22011 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011391482526775258, + "loss": 1.4988, + "step": 22012 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011390282865018097, + "loss": 1.4822, + "step": 22013 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011389083227768928, + "loss": 1.4733, + "step": 22014 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011387883615035888, + "loss": 1.521, + "step": 22015 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011386684026827125, + "loss": 1.437, + "step": 22016 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011385484463150784, + "loss": 1.5031, + "step": 22017 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011384284924015007, + "loss": 1.5062, + "step": 22018 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011383085409427944, + "loss": 1.5117, + "step": 22019 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011381885919397733, + "loss": 1.5086, + "step": 22020 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011380686453932518, + "loss": 1.5233, + "step": 22021 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011379487013040448, + "loss": 1.5505, + "step": 22022 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011378287596729661, + "loss": 1.4835, + "step": 22023 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011377088205008303, + "loss": 1.4274, + "step": 22024 + }, + { + "epoch": 1.73, + "learning_rate": 0.0001137588883788452, + "loss": 1.4837, + "step": 22025 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011374689495366443, + "loss": 1.4864, + "step": 22026 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011373490177462229, + "loss": 1.4719, + "step": 22027 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011372290884180014, + "loss": 1.4943, + "step": 22028 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011371091615527947, + "loss": 1.4556, + "step": 22029 + }, + { + "epoch": 1.73, + "learning_rate": 0.0001136989237151416, + "loss": 1.5462, + "step": 22030 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011368693152146806, + "loss": 1.4792, + "step": 22031 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011367493957434017, + "loss": 1.4675, + "step": 22032 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011366294787383939, + "loss": 1.5415, + "step": 22033 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011365095642004719, + "loss": 1.5002, + "step": 22034 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011363896521304489, + "loss": 1.4228, + "step": 22035 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011362697425291398, + "loss": 1.5013, + "step": 22036 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011361498353973583, + "loss": 1.4515, + "step": 22037 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011360299307359184, + "loss": 1.4855, + "step": 22038 + }, + { + "epoch": 1.73, + "learning_rate": 0.0001135910028545635, + "loss": 1.5149, + "step": 22039 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011357901288273212, + "loss": 1.5121, + "step": 22040 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011356702315817913, + "loss": 1.4721, + "step": 22041 + }, + { + "epoch": 1.73, + "learning_rate": 0.0001135550336809859, + "loss": 1.4097, + "step": 22042 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011354304445123397, + "loss": 1.5125, + "step": 22043 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011353105546900463, + "loss": 1.486, + "step": 22044 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011351906673437926, + "loss": 1.4732, + "step": 22045 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011350707824743935, + "loss": 1.5026, + "step": 22046 + }, + { + "epoch": 1.73, + "learning_rate": 0.0001134950900082662, + "loss": 1.4605, + "step": 22047 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011348310201694129, + "loss": 1.4983, + "step": 22048 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011347111427354592, + "loss": 1.531, + "step": 22049 + }, + { + "epoch": 1.73, + "learning_rate": 0.00011345912677816154, + "loss": 1.4764, + "step": 22050 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011344713953086954, + "loss": 1.5228, + "step": 22051 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011343515253175127, + "loss": 1.4626, + "step": 22052 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011342316578088812, + "loss": 1.5128, + "step": 22053 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011341117927836155, + "loss": 1.512, + "step": 22054 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011339919302425283, + "loss": 1.5125, + "step": 22055 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011338720701864342, + "loss": 1.5102, + "step": 22056 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011337522126161464, + "loss": 1.4214, + "step": 22057 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011336323575324788, + "loss": 1.4589, + "step": 22058 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011335125049362455, + "loss": 1.503, + "step": 22059 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011333926548282602, + "loss": 1.4847, + "step": 22060 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011332728072093365, + "loss": 1.4716, + "step": 22061 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011331529620802879, + "loss": 1.5293, + "step": 22062 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011330331194419284, + "loss": 1.5373, + "step": 22063 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011329132792950714, + "loss": 1.5418, + "step": 22064 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011327934416405309, + "loss": 1.4043, + "step": 22065 + }, + { + "epoch": 1.74, + "learning_rate": 0.000113267360647912, + "loss": 1.4734, + "step": 22066 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011325537738116526, + "loss": 1.4359, + "step": 22067 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011324339436389427, + "loss": 1.538, + "step": 22068 + }, + { + "epoch": 1.74, + "learning_rate": 0.0001132314115961803, + "loss": 1.4314, + "step": 22069 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011321942907810477, + "loss": 1.4777, + "step": 22070 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011320744680974905, + "loss": 1.4658, + "step": 22071 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011319546479119441, + "loss": 1.4965, + "step": 22072 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011318348302252232, + "loss": 1.5015, + "step": 22073 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011317150150381393, + "loss": 1.497, + "step": 22074 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011315952023515083, + "loss": 1.4711, + "step": 22075 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011314753921661424, + "loss": 1.5293, + "step": 22076 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011313555844828553, + "loss": 1.5261, + "step": 22077 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011312357793024604, + "loss": 1.4559, + "step": 22078 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011311159766257706, + "loss": 1.4679, + "step": 22079 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011309961764536004, + "loss": 1.5415, + "step": 22080 + }, + { + "epoch": 1.74, + "learning_rate": 0.0001130876378786762, + "loss": 1.4063, + "step": 22081 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011307565836260694, + "loss": 1.4841, + "step": 22082 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011306367909723363, + "loss": 1.5321, + "step": 22083 + }, + { + "epoch": 1.74, + "learning_rate": 0.0001130517000826375, + "loss": 1.5106, + "step": 22084 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011303972131889997, + "loss": 1.5351, + "step": 22085 + }, + { + "epoch": 1.74, + "learning_rate": 0.0001130277428061023, + "loss": 1.5237, + "step": 22086 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011301576454432588, + "loss": 1.5138, + "step": 22087 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011300378653365203, + "loss": 1.4375, + "step": 22088 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011299180877416198, + "loss": 1.4774, + "step": 22089 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011297983126593716, + "loss": 1.4497, + "step": 22090 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011296785400905886, + "loss": 1.4189, + "step": 22091 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011295587700360843, + "loss": 1.5062, + "step": 22092 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011294390024966711, + "loss": 1.4501, + "step": 22093 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011293192374731625, + "loss": 1.5694, + "step": 22094 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011291994749663724, + "loss": 1.5273, + "step": 22095 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011290797149771127, + "loss": 1.5321, + "step": 22096 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011289599575061972, + "loss": 1.515, + "step": 22097 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011288402025544389, + "loss": 1.5293, + "step": 22098 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011287204501226505, + "loss": 1.5375, + "step": 22099 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011286007002116457, + "loss": 1.5174, + "step": 22100 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011284809528222368, + "loss": 1.5306, + "step": 22101 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011283612079552377, + "loss": 1.4794, + "step": 22102 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011282414656114606, + "loss": 1.4456, + "step": 22103 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011281217257917188, + "loss": 1.4921, + "step": 22104 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011280019884968248, + "loss": 1.4898, + "step": 22105 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011278822537275926, + "loss": 1.5146, + "step": 22106 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011277625214848345, + "loss": 1.499, + "step": 22107 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011276427917693632, + "loss": 1.452, + "step": 22108 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011275230645819924, + "loss": 1.4796, + "step": 22109 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011274033399235341, + "loss": 1.5113, + "step": 22110 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011272836177948015, + "loss": 1.5105, + "step": 22111 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011271638981966076, + "loss": 1.5193, + "step": 22112 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011270441811297649, + "loss": 1.4914, + "step": 22113 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011269244665950867, + "loss": 1.4938, + "step": 22114 + }, + { + "epoch": 1.74, + "learning_rate": 0.0001126804754593385, + "loss": 1.4603, + "step": 22115 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011266850451254733, + "loss": 1.4681, + "step": 22116 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011265653381921644, + "loss": 1.5172, + "step": 22117 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011264456337942704, + "loss": 1.5043, + "step": 22118 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011263259319326046, + "loss": 1.5021, + "step": 22119 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011262062326079795, + "loss": 1.4801, + "step": 22120 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011260865358212072, + "loss": 1.5219, + "step": 22121 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011259668415731015, + "loss": 1.4715, + "step": 22122 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011258471498644745, + "loss": 1.4628, + "step": 22123 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011257274606961392, + "loss": 1.5561, + "step": 22124 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011256077740689074, + "loss": 1.4529, + "step": 22125 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011254880899835928, + "loss": 1.4963, + "step": 22126 + }, + { + "epoch": 1.74, + "learning_rate": 0.0001125368408441007, + "loss": 1.531, + "step": 22127 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011252487294419628, + "loss": 1.4919, + "step": 22128 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011251290529872734, + "loss": 1.4949, + "step": 22129 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011250093790777506, + "loss": 1.5161, + "step": 22130 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011248897077142073, + "loss": 1.5005, + "step": 22131 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011247700388974557, + "loss": 1.4761, + "step": 22132 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011246503726283083, + "loss": 1.4723, + "step": 22133 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011245307089075781, + "loss": 1.5189, + "step": 22134 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011244110477360771, + "loss": 1.4977, + "step": 22135 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011242913891146172, + "loss": 1.5253, + "step": 22136 + }, + { + "epoch": 1.74, + "learning_rate": 0.0001124171733044012, + "loss": 1.5039, + "step": 22137 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011240520795250735, + "loss": 1.5078, + "step": 22138 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011239324285586138, + "loss": 1.4823, + "step": 22139 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011238127801454451, + "loss": 1.5498, + "step": 22140 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011236931342863805, + "loss": 1.4971, + "step": 22141 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011235734909822314, + "loss": 1.4966, + "step": 22142 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011234538502338112, + "loss": 1.5257, + "step": 22143 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011233342120419309, + "loss": 1.516, + "step": 22144 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011232145764074035, + "loss": 1.459, + "step": 22145 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011230949433310417, + "loss": 1.5085, + "step": 22146 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011229753128136567, + "loss": 1.4783, + "step": 22147 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011228556848560616, + "loss": 1.471, + "step": 22148 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011227360594590681, + "loss": 1.5175, + "step": 22149 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011226164366234887, + "loss": 1.4708, + "step": 22150 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011224968163501354, + "loss": 1.4838, + "step": 22151 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011223771986398197, + "loss": 1.5274, + "step": 22152 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011222575834933553, + "loss": 1.4748, + "step": 22153 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011221379709115532, + "loss": 1.4734, + "step": 22154 + }, + { + "epoch": 1.74, + "learning_rate": 0.0001122018360895226, + "loss": 1.5461, + "step": 22155 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011218987534451851, + "loss": 1.5037, + "step": 22156 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011217791485622431, + "loss": 1.4722, + "step": 22157 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011216595462472125, + "loss": 1.4863, + "step": 22158 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011215399465009044, + "loss": 1.5193, + "step": 22159 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011214203493241313, + "loss": 1.4726, + "step": 22160 + }, + { + "epoch": 1.74, + "learning_rate": 0.0001121300754717705, + "loss": 1.5501, + "step": 22161 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011211811626824376, + "loss": 1.501, + "step": 22162 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011210615732191411, + "loss": 1.4904, + "step": 22163 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011209419863286272, + "loss": 1.5401, + "step": 22164 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011208224020117082, + "loss": 1.4915, + "step": 22165 + }, + { + "epoch": 1.74, + "learning_rate": 0.0001120702820269196, + "loss": 1.5085, + "step": 22166 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011205832411019021, + "loss": 1.4283, + "step": 22167 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011204636645106383, + "loss": 1.5081, + "step": 22168 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011203440904962171, + "loss": 1.4884, + "step": 22169 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011202245190594502, + "loss": 1.5082, + "step": 22170 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011201049502011491, + "loss": 1.5, + "step": 22171 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011199853839221262, + "loss": 1.4355, + "step": 22172 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011198658202231921, + "loss": 1.4994, + "step": 22173 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011197462591051596, + "loss": 1.4153, + "step": 22174 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011196267005688404, + "loss": 1.4387, + "step": 22175 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011195071446150456, + "loss": 1.4575, + "step": 22176 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011193875912445873, + "loss": 1.5414, + "step": 22177 + }, + { + "epoch": 1.74, + "learning_rate": 0.00011192680404582776, + "loss": 1.4559, + "step": 22178 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011191484922569275, + "loss": 1.4674, + "step": 22179 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011190289466413493, + "loss": 1.5104, + "step": 22180 + }, + { + "epoch": 1.75, + "learning_rate": 0.0001118909403612354, + "loss": 1.4944, + "step": 22181 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011187898631707536, + "loss": 1.5167, + "step": 22182 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011186703253173598, + "loss": 1.5368, + "step": 22183 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011185507900529835, + "loss": 1.493, + "step": 22184 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011184312573784371, + "loss": 1.5532, + "step": 22185 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011183117272945321, + "loss": 1.5172, + "step": 22186 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011181921998020801, + "loss": 1.4727, + "step": 22187 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011180726749018917, + "loss": 1.4873, + "step": 22188 + }, + { + "epoch": 1.75, + "learning_rate": 0.000111795315259478, + "loss": 1.5176, + "step": 22189 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011178336328815548, + "loss": 1.4858, + "step": 22190 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011177141157630284, + "loss": 1.5321, + "step": 22191 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011175946012400125, + "loss": 1.4761, + "step": 22192 + }, + { + "epoch": 1.75, + "learning_rate": 0.0001117475089313318, + "loss": 1.4917, + "step": 22193 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011173555799837564, + "loss": 1.499, + "step": 22194 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011172360732521398, + "loss": 1.5193, + "step": 22195 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011171165691192785, + "loss": 1.5205, + "step": 22196 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011169970675859848, + "loss": 1.4806, + "step": 22197 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011168775686530694, + "loss": 1.5406, + "step": 22198 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011167580723213436, + "loss": 1.4453, + "step": 22199 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011166385785916191, + "loss": 1.5255, + "step": 22200 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011165190874647077, + "loss": 1.5439, + "step": 22201 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011163995989414195, + "loss": 1.4272, + "step": 22202 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011162801130225664, + "loss": 1.489, + "step": 22203 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011161606297089599, + "loss": 1.481, + "step": 22204 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011160411490014106, + "loss": 1.541, + "step": 22205 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011159216709007302, + "loss": 1.4939, + "step": 22206 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011158021954077298, + "loss": 1.4661, + "step": 22207 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011156827225232202, + "loss": 1.4798, + "step": 22208 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011155632522480133, + "loss": 1.5505, + "step": 22209 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011154437845829191, + "loss": 1.5458, + "step": 22210 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011153243195287496, + "loss": 1.5215, + "step": 22211 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011152048570863162, + "loss": 1.5153, + "step": 22212 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011150853972564289, + "loss": 1.4705, + "step": 22213 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011149659400398998, + "loss": 1.4618, + "step": 22214 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011148464854375384, + "loss": 1.4674, + "step": 22215 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011147270334501578, + "loss": 1.492, + "step": 22216 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011146075840785676, + "loss": 1.5024, + "step": 22217 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011144881373235797, + "loss": 1.5261, + "step": 22218 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011143686931860042, + "loss": 1.428, + "step": 22219 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011142492516666525, + "loss": 1.4806, + "step": 22220 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011141298127663361, + "loss": 1.4767, + "step": 22221 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011140103764858646, + "loss": 1.4633, + "step": 22222 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011138909428260498, + "loss": 1.4788, + "step": 22223 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011137715117877028, + "loss": 1.5492, + "step": 22224 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011136520833716337, + "loss": 1.5026, + "step": 22225 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011135326575786542, + "loss": 1.5523, + "step": 22226 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011134132344095741, + "loss": 1.5013, + "step": 22227 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011132938138652051, + "loss": 1.5252, + "step": 22228 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011131743959463578, + "loss": 1.4747, + "step": 22229 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011130549806538426, + "loss": 1.501, + "step": 22230 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011129355679884704, + "loss": 1.4947, + "step": 22231 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011128161579510522, + "loss": 1.4905, + "step": 22232 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011126967505423989, + "loss": 1.5202, + "step": 22233 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011125773457633209, + "loss": 1.5299, + "step": 22234 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011124579436146288, + "loss": 1.5049, + "step": 22235 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011123385440971336, + "loss": 1.4932, + "step": 22236 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011122191472116455, + "loss": 1.4861, + "step": 22237 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011120997529589756, + "loss": 1.6041, + "step": 22238 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011119803613399344, + "loss": 1.4824, + "step": 22239 + }, + { + "epoch": 1.75, + "learning_rate": 0.0001111860972355332, + "loss": 1.5449, + "step": 22240 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011117415860059799, + "loss": 1.5004, + "step": 22241 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011116222022926879, + "loss": 1.4683, + "step": 22242 + }, + { + "epoch": 1.75, + "learning_rate": 0.0001111502821216267, + "loss": 1.5271, + "step": 22243 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011113834427775273, + "loss": 1.491, + "step": 22244 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011112640669772796, + "loss": 1.5192, + "step": 22245 + }, + { + "epoch": 1.75, + "learning_rate": 0.0001111144693816334, + "loss": 1.4832, + "step": 22246 + }, + { + "epoch": 1.75, + "learning_rate": 0.0001111025323295502, + "loss": 1.4747, + "step": 22247 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011109059554155931, + "loss": 1.4918, + "step": 22248 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011107865901774181, + "loss": 1.4671, + "step": 22249 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011106672275817876, + "loss": 1.5032, + "step": 22250 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011105478676295113, + "loss": 1.4992, + "step": 22251 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011104285103214002, + "loss": 1.4906, + "step": 22252 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011103091556582651, + "loss": 1.4976, + "step": 22253 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011101898036409152, + "loss": 1.5076, + "step": 22254 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011100704542701617, + "loss": 1.4712, + "step": 22255 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011099511075468144, + "loss": 1.5207, + "step": 22256 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011098317634716837, + "loss": 1.4867, + "step": 22257 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011097124220455806, + "loss": 1.4517, + "step": 22258 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011095930832693144, + "loss": 1.5027, + "step": 22259 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011094737471436954, + "loss": 1.5226, + "step": 22260 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011093544136695348, + "loss": 1.4952, + "step": 22261 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011092350828476414, + "loss": 1.5291, + "step": 22262 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011091157546788265, + "loss": 1.5101, + "step": 22263 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011089964291638999, + "loss": 1.5111, + "step": 22264 + }, + { + "epoch": 1.75, + "learning_rate": 0.0001108877106303672, + "loss": 1.4397, + "step": 22265 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011087577860989527, + "loss": 1.4682, + "step": 22266 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011086384685505521, + "loss": 1.4917, + "step": 22267 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011085191536592802, + "loss": 1.4723, + "step": 22268 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011083998414259472, + "loss": 1.4565, + "step": 22269 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011082805318513633, + "loss": 1.5246, + "step": 22270 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011081612249363382, + "loss": 1.4989, + "step": 22271 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011080419206816826, + "loss": 1.458, + "step": 22272 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011079226190882055, + "loss": 1.4989, + "step": 22273 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011078033201567177, + "loss": 1.4782, + "step": 22274 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011076840238880291, + "loss": 1.5185, + "step": 22275 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011075647302829493, + "loss": 1.4855, + "step": 22276 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011074454393422883, + "loss": 1.4611, + "step": 22277 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011073261510668558, + "loss": 1.5054, + "step": 22278 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011072068654574628, + "loss": 1.5035, + "step": 22279 + }, + { + "epoch": 1.75, + "learning_rate": 0.0001107087582514918, + "loss": 1.5051, + "step": 22280 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011069683022400316, + "loss": 1.495, + "step": 22281 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011068490246336139, + "loss": 1.4847, + "step": 22282 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011067297496964742, + "loss": 1.532, + "step": 22283 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011066104774294227, + "loss": 1.5232, + "step": 22284 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011064912078332687, + "loss": 1.4724, + "step": 22285 + }, + { + "epoch": 1.75, + "learning_rate": 0.0001106371940908822, + "loss": 1.5398, + "step": 22286 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011062526766568931, + "loss": 1.4782, + "step": 22287 + }, + { + "epoch": 1.75, + "learning_rate": 0.0001106133415078291, + "loss": 1.504, + "step": 22288 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011060141561738254, + "loss": 1.5223, + "step": 22289 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011058948999443069, + "loss": 1.5212, + "step": 22290 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011057756463905443, + "loss": 1.4785, + "step": 22291 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011056563955133474, + "loss": 1.4861, + "step": 22292 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011055371473135259, + "loss": 1.4508, + "step": 22293 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011054179017918892, + "loss": 1.479, + "step": 22294 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011052986589492473, + "loss": 1.5162, + "step": 22295 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011051794187864104, + "loss": 1.538, + "step": 22296 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011050601813041866, + "loss": 1.4756, + "step": 22297 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011049409465033864, + "loss": 1.5446, + "step": 22298 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011048217143848196, + "loss": 1.4862, + "step": 22299 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011047024849492949, + "loss": 1.5338, + "step": 22300 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011045832581976223, + "loss": 1.4681, + "step": 22301 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011044640341306111, + "loss": 1.5111, + "step": 22302 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011043448127490707, + "loss": 1.4947, + "step": 22303 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011042255940538112, + "loss": 1.5316, + "step": 22304 + }, + { + "epoch": 1.75, + "learning_rate": 0.00011041063780456408, + "loss": 1.4901, + "step": 22305 + }, + { + "epoch": 1.76, + "learning_rate": 0.000110398716472537, + "loss": 1.5236, + "step": 22306 + }, + { + "epoch": 1.76, + "learning_rate": 0.00011038679540938079, + "loss": 1.4831, + "step": 22307 + }, + { + "epoch": 1.76, + "learning_rate": 0.00011037487461517637, + "loss": 1.5462, + "step": 22308 + }, + { + "epoch": 1.76, + "learning_rate": 0.00011036295409000464, + "loss": 1.5154, + "step": 22309 + }, + { + "epoch": 1.76, + "learning_rate": 0.00011035103383394662, + "loss": 1.5286, + "step": 22310 + }, + { + "epoch": 1.76, + "learning_rate": 0.00011033911384708321, + "loss": 1.4627, + "step": 22311 + }, + { + "epoch": 1.76, + "learning_rate": 0.0001103271941294953, + "loss": 1.4518, + "step": 22312 + }, + { + "epoch": 1.76, + "learning_rate": 0.0001103152746812639, + "loss": 1.5009, + "step": 22313 + }, + { + "epoch": 1.76, + "learning_rate": 0.00011030335550246985, + "loss": 1.4868, + "step": 22314 + }, + { + "epoch": 1.76, + "learning_rate": 0.00011029143659319408, + "loss": 1.4571, + "step": 22315 + }, + { + "epoch": 1.76, + "learning_rate": 0.0001102795179535176, + "loss": 1.5134, + "step": 22316 + }, + { + "epoch": 1.76, + "learning_rate": 0.00011026759958352125, + "loss": 1.5193, + "step": 22317 + }, + { + "epoch": 1.76, + "learning_rate": 0.00011025568148328596, + "loss": 1.5022, + "step": 22318 + }, + { + "epoch": 1.76, + "learning_rate": 0.00011024376365289268, + "loss": 1.4813, + "step": 22319 + }, + { + "epoch": 1.76, + "learning_rate": 0.0001102318460924223, + "loss": 1.5038, + "step": 22320 + }, + { + "epoch": 1.76, + "learning_rate": 0.00011021992880195575, + "loss": 1.4511, + "step": 22321 + }, + { + "epoch": 1.76, + "learning_rate": 0.00011020801178157391, + "loss": 1.473, + "step": 22322 + }, + { + "epoch": 1.76, + "learning_rate": 0.0001101960950313577, + "loss": 1.5346, + "step": 22323 + }, + { + "epoch": 1.76, + "learning_rate": 0.00011018417855138809, + "loss": 1.4534, + "step": 22324 + }, + { + "epoch": 1.76, + "learning_rate": 0.00011017226234174585, + "loss": 1.4577, + "step": 22325 + }, + { + "epoch": 1.76, + "learning_rate": 0.00011016034640251202, + "loss": 1.4306, + "step": 22326 + }, + { + "epoch": 1.76, + "learning_rate": 0.00011014843073376745, + "loss": 1.53, + "step": 22327 + }, + { + "epoch": 1.76, + "learning_rate": 0.00011013651533559308, + "loss": 1.4874, + "step": 22328 + }, + { + "epoch": 1.76, + "learning_rate": 0.00011012460020806972, + "loss": 1.482, + "step": 22329 + }, + { + "epoch": 1.76, + "learning_rate": 0.00011011268535127837, + "loss": 1.4827, + "step": 22330 + }, + { + "epoch": 1.76, + "learning_rate": 0.00011010077076529984, + "loss": 1.4756, + "step": 22331 + }, + { + "epoch": 1.76, + "learning_rate": 0.00011008885645021504, + "loss": 1.5332, + "step": 22332 + }, + { + "epoch": 1.76, + "learning_rate": 0.00011007694240610492, + "loss": 1.5333, + "step": 22333 + }, + { + "epoch": 1.76, + "learning_rate": 0.00011006502863305033, + "loss": 1.5014, + "step": 22334 + }, + { + "epoch": 1.76, + "learning_rate": 0.00011005311513113211, + "loss": 1.4914, + "step": 22335 + }, + { + "epoch": 1.76, + "learning_rate": 0.00011004120190043124, + "loss": 1.4641, + "step": 22336 + }, + { + "epoch": 1.76, + "learning_rate": 0.00011002928894102855, + "loss": 1.483, + "step": 22337 + }, + { + "epoch": 1.76, + "learning_rate": 0.00011001737625300494, + "loss": 1.4994, + "step": 22338 + }, + { + "epoch": 1.76, + "learning_rate": 0.00011000546383644125, + "loss": 1.4944, + "step": 22339 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010999355169141841, + "loss": 1.5314, + "step": 22340 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010998163981801721, + "loss": 1.5216, + "step": 22341 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010996972821631867, + "loss": 1.4536, + "step": 22342 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010995781688640358, + "loss": 1.4331, + "step": 22343 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010994590582835276, + "loss": 1.4396, + "step": 22344 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010993399504224723, + "loss": 1.5322, + "step": 22345 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010992208452816769, + "loss": 1.4916, + "step": 22346 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010991017428619509, + "loss": 1.5532, + "step": 22347 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010989826431641032, + "loss": 1.5208, + "step": 22348 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010988635461889417, + "loss": 1.4384, + "step": 22349 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010987444519372756, + "loss": 1.5096, + "step": 22350 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010986253604099131, + "loss": 1.5011, + "step": 22351 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010985062716076627, + "loss": 1.5186, + "step": 22352 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010983871855313336, + "loss": 1.4804, + "step": 22353 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010982681021817336, + "loss": 1.5077, + "step": 22354 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010981490215596718, + "loss": 1.4601, + "step": 22355 + }, + { + "epoch": 1.76, + "learning_rate": 0.0001098029943665956, + "loss": 1.4919, + "step": 22356 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010979108685013947, + "loss": 1.4943, + "step": 22357 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010977917960667972, + "loss": 1.5274, + "step": 22358 + }, + { + "epoch": 1.76, + "learning_rate": 0.0001097672726362971, + "loss": 1.5344, + "step": 22359 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010975536593907256, + "loss": 1.5375, + "step": 22360 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010974345951508687, + "loss": 1.4987, + "step": 22361 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010973155336442089, + "loss": 1.5552, + "step": 22362 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010971964748715539, + "loss": 1.5421, + "step": 22363 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010970774188337128, + "loss": 1.4894, + "step": 22364 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010969583655314938, + "loss": 1.5147, + "step": 22365 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010968393149657047, + "loss": 1.4657, + "step": 22366 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010967202671371546, + "loss": 1.5131, + "step": 22367 + }, + { + "epoch": 1.76, + "learning_rate": 0.0001096601222046651, + "loss": 1.5263, + "step": 22368 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010964821796950027, + "loss": 1.5198, + "step": 22369 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010963631400830177, + "loss": 1.504, + "step": 22370 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010962441032115042, + "loss": 1.504, + "step": 22371 + }, + { + "epoch": 1.76, + "learning_rate": 0.000109612506908127, + "loss": 1.4983, + "step": 22372 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010960060376931239, + "loss": 1.4627, + "step": 22373 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010958870090478744, + "loss": 1.4973, + "step": 22374 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010957679831463285, + "loss": 1.4917, + "step": 22375 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010956489599892952, + "loss": 1.4273, + "step": 22376 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010955299395775825, + "loss": 1.4616, + "step": 22377 + }, + { + "epoch": 1.76, + "learning_rate": 0.0001095410921911998, + "loss": 1.4451, + "step": 22378 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010952919069933504, + "loss": 1.5194, + "step": 22379 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010951728948224471, + "loss": 1.531, + "step": 22380 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010950538854000966, + "loss": 1.428, + "step": 22381 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010949348787271067, + "loss": 1.4964, + "step": 22382 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010948158748042854, + "loss": 1.4974, + "step": 22383 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010946968736324409, + "loss": 1.544, + "step": 22384 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010945778752123806, + "loss": 1.4822, + "step": 22385 + }, + { + "epoch": 1.76, + "learning_rate": 0.0001094458879544913, + "loss": 1.5334, + "step": 22386 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010943398866308462, + "loss": 1.4283, + "step": 22387 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010942208964709866, + "loss": 1.5194, + "step": 22388 + }, + { + "epoch": 1.76, + "learning_rate": 0.0001094101909066144, + "loss": 1.494, + "step": 22389 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010939829244171253, + "loss": 1.5064, + "step": 22390 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010938639425247387, + "loss": 1.5267, + "step": 22391 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010937449633897914, + "loss": 1.5105, + "step": 22392 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010936259870130918, + "loss": 1.5159, + "step": 22393 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010935070133954478, + "loss": 1.5247, + "step": 22394 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010933880425376664, + "loss": 1.4715, + "step": 22395 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010932690744405565, + "loss": 1.5097, + "step": 22396 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010931501091049243, + "loss": 1.4488, + "step": 22397 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010930311465315787, + "loss": 1.5317, + "step": 22398 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010929121867213272, + "loss": 1.4989, + "step": 22399 + }, + { + "epoch": 1.76, + "learning_rate": 0.0001092793229674977, + "loss": 1.5307, + "step": 22400 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010926742753933359, + "loss": 1.5297, + "step": 22401 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010925553238772123, + "loss": 1.4549, + "step": 22402 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010924363751274127, + "loss": 1.5012, + "step": 22403 + }, + { + "epoch": 1.76, + "learning_rate": 0.0001092317429144745, + "loss": 1.469, + "step": 22404 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010921984859300173, + "loss": 1.4796, + "step": 22405 + }, + { + "epoch": 1.76, + "learning_rate": 0.0001092079545484037, + "loss": 1.5004, + "step": 22406 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010919606078076112, + "loss": 1.5037, + "step": 22407 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010918416729015481, + "loss": 1.4786, + "step": 22408 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010917227407666545, + "loss": 1.4631, + "step": 22409 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010916038114037382, + "loss": 1.5497, + "step": 22410 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010914848848136067, + "loss": 1.5403, + "step": 22411 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010913659609970675, + "loss": 1.5205, + "step": 22412 + }, + { + "epoch": 1.76, + "learning_rate": 0.0001091247039954928, + "loss": 1.5166, + "step": 22413 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010911281216879952, + "loss": 1.5074, + "step": 22414 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010910092061970769, + "loss": 1.4752, + "step": 22415 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010908902934829806, + "loss": 1.4567, + "step": 22416 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010907713835465132, + "loss": 1.4509, + "step": 22417 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010906524763884823, + "loss": 1.479, + "step": 22418 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010905335720096947, + "loss": 1.4656, + "step": 22419 + }, + { + "epoch": 1.76, + "learning_rate": 0.0001090414670410959, + "loss": 1.4906, + "step": 22420 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010902957715930813, + "loss": 1.5144, + "step": 22421 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010901768755568692, + "loss": 1.504, + "step": 22422 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010900579823031303, + "loss": 1.5101, + "step": 22423 + }, + { + "epoch": 1.76, + "learning_rate": 0.0001089939091832671, + "loss": 1.498, + "step": 22424 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010898202041462994, + "loss": 1.5007, + "step": 22425 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010897013192448221, + "loss": 1.4982, + "step": 22426 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010895824371290463, + "loss": 1.4582, + "step": 22427 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010894635577997797, + "loss": 1.4976, + "step": 22428 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010893446812578285, + "loss": 1.481, + "step": 22429 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010892258075040004, + "loss": 1.4704, + "step": 22430 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010891069365391027, + "loss": 1.4746, + "step": 22431 + }, + { + "epoch": 1.76, + "learning_rate": 0.00010889880683639416, + "loss": 1.4661, + "step": 22432 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010888692029793252, + "loss": 1.4654, + "step": 22433 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010887503403860598, + "loss": 1.4912, + "step": 22434 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010886314805849521, + "loss": 1.4258, + "step": 22435 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010885126235768101, + "loss": 1.515, + "step": 22436 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010883937693624408, + "loss": 1.4786, + "step": 22437 + }, + { + "epoch": 1.77, + "learning_rate": 0.000108827491794265, + "loss": 1.473, + "step": 22438 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010881560693182455, + "loss": 1.4791, + "step": 22439 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010880372234900343, + "loss": 1.5673, + "step": 22440 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010879183804588227, + "loss": 1.4753, + "step": 22441 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010877995402254182, + "loss": 1.4289, + "step": 22442 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010876807027906269, + "loss": 1.5229, + "step": 22443 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010875618681552563, + "loss": 1.4608, + "step": 22444 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010874430363201133, + "loss": 1.4905, + "step": 22445 + }, + { + "epoch": 1.77, + "learning_rate": 0.0001087324207286004, + "loss": 1.5226, + "step": 22446 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010872053810537356, + "loss": 1.5354, + "step": 22447 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010870865576241154, + "loss": 1.4736, + "step": 22448 + }, + { + "epoch": 1.77, + "learning_rate": 0.0001086967736997949, + "loss": 1.4953, + "step": 22449 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010868489191760441, + "loss": 1.4688, + "step": 22450 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010867301041592063, + "loss": 1.4704, + "step": 22451 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010866112919482438, + "loss": 1.5704, + "step": 22452 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010864924825439622, + "loss": 1.4646, + "step": 22453 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010863736759471688, + "loss": 1.4738, + "step": 22454 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010862548721586695, + "loss": 1.5035, + "step": 22455 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010861360711792714, + "loss": 1.4775, + "step": 22456 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010860172730097814, + "loss": 1.5012, + "step": 22457 + }, + { + "epoch": 1.77, + "learning_rate": 0.0001085898477651005, + "loss": 1.448, + "step": 22458 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010857796851037497, + "loss": 1.578, + "step": 22459 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010856608953688221, + "loss": 1.5021, + "step": 22460 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010855421084470279, + "loss": 1.5365, + "step": 22461 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010854233243391744, + "loss": 1.4428, + "step": 22462 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010853045430460674, + "loss": 1.4533, + "step": 22463 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010851857645685136, + "loss": 1.5313, + "step": 22464 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010850669889073202, + "loss": 1.493, + "step": 22465 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010849482160632924, + "loss": 1.4714, + "step": 22466 + }, + { + "epoch": 1.77, + "learning_rate": 0.0001084829446037237, + "loss": 1.4713, + "step": 22467 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010847106788299608, + "loss": 1.4399, + "step": 22468 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010845919144422703, + "loss": 1.4523, + "step": 22469 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010844731528749709, + "loss": 1.5294, + "step": 22470 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010843543941288698, + "loss": 1.5254, + "step": 22471 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010842356382047731, + "loss": 1.5011, + "step": 22472 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010841168851034869, + "loss": 1.4864, + "step": 22473 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010839981348258177, + "loss": 1.4627, + "step": 22474 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010838793873725712, + "loss": 1.4814, + "step": 22475 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010837606427445541, + "loss": 1.5466, + "step": 22476 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010836419009425728, + "loss": 1.5257, + "step": 22477 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010835231619674328, + "loss": 1.5206, + "step": 22478 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010834044258199413, + "loss": 1.4478, + "step": 22479 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010832856925009034, + "loss": 1.4991, + "step": 22480 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010831669620111257, + "loss": 1.4905, + "step": 22481 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010830482343514139, + "loss": 1.4902, + "step": 22482 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010829295095225752, + "loss": 1.5115, + "step": 22483 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010828107875254148, + "loss": 1.4628, + "step": 22484 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010826920683607387, + "loss": 1.4631, + "step": 22485 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010825733520293536, + "loss": 1.5167, + "step": 22486 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010824546385320647, + "loss": 1.5267, + "step": 22487 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010823359278696785, + "loss": 1.4825, + "step": 22488 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010822172200430012, + "loss": 1.4904, + "step": 22489 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010820985150528378, + "loss": 1.5027, + "step": 22490 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010819798128999954, + "loss": 1.5103, + "step": 22491 + }, + { + "epoch": 1.77, + "learning_rate": 0.0001081861113585279, + "loss": 1.4874, + "step": 22492 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010817424171094951, + "loss": 1.4735, + "step": 22493 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010816237234734496, + "loss": 1.5577, + "step": 22494 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010815050326779477, + "loss": 1.54, + "step": 22495 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010813863447237961, + "loss": 1.5361, + "step": 22496 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010812676596118, + "loss": 1.5017, + "step": 22497 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010811489773427649, + "loss": 1.4795, + "step": 22498 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010810302979174973, + "loss": 1.5457, + "step": 22499 + }, + { + "epoch": 1.77, + "learning_rate": 0.0001080911621336803, + "loss": 1.4952, + "step": 22500 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010807929476014879, + "loss": 1.4751, + "step": 22501 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010806742767123569, + "loss": 1.4867, + "step": 22502 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010805556086702164, + "loss": 1.4954, + "step": 22503 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010804369434758717, + "loss": 1.4967, + "step": 22504 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010803182811301285, + "loss": 1.5063, + "step": 22505 + }, + { + "epoch": 1.77, + "learning_rate": 0.0001080199621633793, + "loss": 1.4559, + "step": 22506 + }, + { + "epoch": 1.77, + "learning_rate": 0.000108008096498767, + "loss": 1.5029, + "step": 22507 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010799623111925659, + "loss": 1.4774, + "step": 22508 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010798436602492855, + "loss": 1.4985, + "step": 22509 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010797250121586348, + "loss": 1.4558, + "step": 22510 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010796063669214196, + "loss": 1.5066, + "step": 22511 + }, + { + "epoch": 1.77, + "learning_rate": 0.0001079487724538445, + "loss": 1.4567, + "step": 22512 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010793690850105167, + "loss": 1.474, + "step": 22513 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010792504483384399, + "loss": 1.4869, + "step": 22514 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010791318145230209, + "loss": 1.5176, + "step": 22515 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010790131835650642, + "loss": 1.4988, + "step": 22516 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010788945554653758, + "loss": 1.525, + "step": 22517 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010787759302247613, + "loss": 1.4302, + "step": 22518 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010786573078440255, + "loss": 1.4917, + "step": 22519 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010785386883239744, + "loss": 1.4803, + "step": 22520 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010784200716654126, + "loss": 1.4866, + "step": 22521 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010783014578691458, + "loss": 1.5103, + "step": 22522 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010781828469359799, + "loss": 1.4509, + "step": 22523 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010780642388667193, + "loss": 1.5375, + "step": 22524 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010779456336621699, + "loss": 1.4623, + "step": 22525 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010778270313231366, + "loss": 1.4987, + "step": 22526 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010777084318504246, + "loss": 1.429, + "step": 22527 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010775898352448399, + "loss": 1.5332, + "step": 22528 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010774712415071858, + "loss": 1.5299, + "step": 22529 + }, + { + "epoch": 1.77, + "learning_rate": 0.000107735265063827, + "loss": 1.491, + "step": 22530 + }, + { + "epoch": 1.77, + "learning_rate": 0.0001077234062638896, + "loss": 1.5448, + "step": 22531 + }, + { + "epoch": 1.77, + "learning_rate": 0.000107711547750987, + "loss": 1.4953, + "step": 22532 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010769968952519958, + "loss": 1.4868, + "step": 22533 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010768783158660797, + "loss": 1.5291, + "step": 22534 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010767597393529263, + "loss": 1.49, + "step": 22535 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010766411657133405, + "loss": 1.5584, + "step": 22536 + }, + { + "epoch": 1.77, + "learning_rate": 0.0001076522594948128, + "loss": 1.4957, + "step": 22537 + }, + { + "epoch": 1.77, + "learning_rate": 0.0001076404027058093, + "loss": 1.5531, + "step": 22538 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010762854620440407, + "loss": 1.5091, + "step": 22539 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010761668999067768, + "loss": 1.5344, + "step": 22540 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010760483406471054, + "loss": 1.4824, + "step": 22541 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010759297842658318, + "loss": 1.5409, + "step": 22542 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010758112307637613, + "loss": 1.4496, + "step": 22543 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010756926801416982, + "loss": 1.5418, + "step": 22544 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010755741324004471, + "loss": 1.4553, + "step": 22545 + }, + { + "epoch": 1.77, + "learning_rate": 0.0001075455587540814, + "loss": 1.497, + "step": 22546 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010753370455636034, + "loss": 1.4693, + "step": 22547 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010752185064696194, + "loss": 1.4922, + "step": 22548 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010750999702596678, + "loss": 1.4742, + "step": 22549 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010749814369345528, + "loss": 1.4543, + "step": 22550 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010748629064950791, + "loss": 1.5142, + "step": 22551 + }, + { + "epoch": 1.77, + "learning_rate": 0.0001074744378942052, + "loss": 1.5065, + "step": 22552 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010746258542762757, + "loss": 1.4988, + "step": 22553 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010745073324985548, + "loss": 1.4793, + "step": 22554 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010743888136096949, + "loss": 1.4903, + "step": 22555 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010742702976104995, + "loss": 1.4896, + "step": 22556 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010741517845017745, + "loss": 1.5044, + "step": 22557 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010740332742843234, + "loss": 1.4454, + "step": 22558 + }, + { + "epoch": 1.77, + "learning_rate": 0.00010739147669589512, + "loss": 1.4959, + "step": 22559 + }, + { + "epoch": 1.78, + "learning_rate": 0.0001073796262526463, + "loss": 1.482, + "step": 22560 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010736777609876626, + "loss": 1.4417, + "step": 22561 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010735592623433549, + "loss": 1.4732, + "step": 22562 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010734407665943445, + "loss": 1.5112, + "step": 22563 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010733222737414364, + "loss": 1.5287, + "step": 22564 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010732037837854343, + "loss": 1.4786, + "step": 22565 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010730852967271431, + "loss": 1.4928, + "step": 22566 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010729668125673669, + "loss": 1.4728, + "step": 22567 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010728483313069103, + "loss": 1.4968, + "step": 22568 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010727298529465785, + "loss": 1.5454, + "step": 22569 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010726113774871744, + "loss": 1.5241, + "step": 22570 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010724929049295036, + "loss": 1.5023, + "step": 22571 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010723744352743699, + "loss": 1.4663, + "step": 22572 + }, + { + "epoch": 1.78, + "learning_rate": 0.0001072255968522578, + "loss": 1.4948, + "step": 22573 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010721375046749321, + "loss": 1.4967, + "step": 22574 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010720190437322361, + "loss": 1.4847, + "step": 22575 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010719005856952947, + "loss": 1.4802, + "step": 22576 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010717821305649116, + "loss": 1.4902, + "step": 22577 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010716636783418922, + "loss": 1.5366, + "step": 22578 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010715452290270399, + "loss": 1.5164, + "step": 22579 + }, + { + "epoch": 1.78, + "learning_rate": 0.0001071426782621159, + "loss": 1.4549, + "step": 22580 + }, + { + "epoch": 1.78, + "learning_rate": 0.0001071308339125054, + "loss": 1.5186, + "step": 22581 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010711898985395285, + "loss": 1.5346, + "step": 22582 + }, + { + "epoch": 1.78, + "learning_rate": 0.0001071071460865387, + "loss": 1.4753, + "step": 22583 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010709530261034338, + "loss": 1.4763, + "step": 22584 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010708345942544725, + "loss": 1.4687, + "step": 22585 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010707161653193077, + "loss": 1.5035, + "step": 22586 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010705977392987431, + "loss": 1.5378, + "step": 22587 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010704793161935828, + "loss": 1.5034, + "step": 22588 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010703608960046311, + "loss": 1.4832, + "step": 22589 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010702424787326918, + "loss": 1.4567, + "step": 22590 + }, + { + "epoch": 1.78, + "learning_rate": 0.0001070124064378569, + "loss": 1.4593, + "step": 22591 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010700056529430658, + "loss": 1.4776, + "step": 22592 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010698872444269878, + "loss": 1.4831, + "step": 22593 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010697688388311377, + "loss": 1.5085, + "step": 22594 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010696504361563201, + "loss": 1.4711, + "step": 22595 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010695320364033382, + "loss": 1.4342, + "step": 22596 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010694136395729962, + "loss": 1.4482, + "step": 22597 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010692952456660984, + "loss": 1.4474, + "step": 22598 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010691768546834477, + "loss": 1.521, + "step": 22599 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010690584666258484, + "loss": 1.4989, + "step": 22600 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010689400814941049, + "loss": 1.4859, + "step": 22601 + }, + { + "epoch": 1.78, + "learning_rate": 0.000106882169928902, + "loss": 1.5119, + "step": 22602 + }, + { + "epoch": 1.78, + "learning_rate": 0.0001068703320011398, + "loss": 1.548, + "step": 22603 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010685849436620421, + "loss": 1.4926, + "step": 22604 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010684665702417565, + "loss": 1.5866, + "step": 22605 + }, + { + "epoch": 1.78, + "learning_rate": 0.0001068348199751345, + "loss": 1.5834, + "step": 22606 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010682298321916105, + "loss": 1.4642, + "step": 22607 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010681114675633571, + "loss": 1.5222, + "step": 22608 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010679931058673887, + "loss": 1.4938, + "step": 22609 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010678747471045091, + "loss": 1.5062, + "step": 22610 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010677563912755213, + "loss": 1.4864, + "step": 22611 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010676380383812289, + "loss": 1.4801, + "step": 22612 + }, + { + "epoch": 1.78, + "learning_rate": 0.0001067519688422436, + "loss": 1.5258, + "step": 22613 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010674013413999453, + "loss": 1.5016, + "step": 22614 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010672829973145614, + "loss": 1.4776, + "step": 22615 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010671646561670865, + "loss": 1.4929, + "step": 22616 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010670463179583248, + "loss": 1.5025, + "step": 22617 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010669279826890802, + "loss": 1.5004, + "step": 22618 + }, + { + "epoch": 1.78, + "learning_rate": 0.0001066809650360155, + "loss": 1.4967, + "step": 22619 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010666913209723538, + "loss": 1.4433, + "step": 22620 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010665729945264789, + "loss": 1.5558, + "step": 22621 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010664546710233341, + "loss": 1.4951, + "step": 22622 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010663363504637235, + "loss": 1.5076, + "step": 22623 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010662180328484489, + "loss": 1.4819, + "step": 22624 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010660997181783147, + "loss": 1.4556, + "step": 22625 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010659814064541243, + "loss": 1.4857, + "step": 22626 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010658630976766807, + "loss": 1.5088, + "step": 22627 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010657447918467867, + "loss": 1.4529, + "step": 22628 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010656264889652461, + "loss": 1.4939, + "step": 22629 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010655081890328623, + "loss": 1.5387, + "step": 22630 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010653898920504378, + "loss": 1.5149, + "step": 22631 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010652715980187763, + "loss": 1.4823, + "step": 22632 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010651533069386803, + "loss": 1.5193, + "step": 22633 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010650350188109535, + "loss": 1.4964, + "step": 22634 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010649167336363995, + "loss": 1.4818, + "step": 22635 + }, + { + "epoch": 1.78, + "learning_rate": 0.000106479845141582, + "loss": 1.5112, + "step": 22636 + }, + { + "epoch": 1.78, + "learning_rate": 0.0001064680172150019, + "loss": 1.5171, + "step": 22637 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010645618958397998, + "loss": 1.4833, + "step": 22638 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010644436224859643, + "loss": 1.4768, + "step": 22639 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010643253520893168, + "loss": 1.5342, + "step": 22640 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010642070846506594, + "loss": 1.539, + "step": 22641 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010640888201707959, + "loss": 1.4766, + "step": 22642 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010639705586505285, + "loss": 1.5173, + "step": 22643 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010638523000906605, + "loss": 1.5257, + "step": 22644 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010637340444919945, + "loss": 1.4916, + "step": 22645 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010636157918553338, + "loss": 1.5133, + "step": 22646 + }, + { + "epoch": 1.78, + "learning_rate": 0.0001063497542181481, + "loss": 1.5254, + "step": 22647 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010633792954712389, + "loss": 1.4927, + "step": 22648 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010632610517254106, + "loss": 1.5256, + "step": 22649 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010631428109447986, + "loss": 1.4586, + "step": 22650 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010630245731302057, + "loss": 1.5632, + "step": 22651 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010629063382824353, + "loss": 1.5457, + "step": 22652 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010627881064022891, + "loss": 1.4549, + "step": 22653 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010626698774905707, + "loss": 1.4875, + "step": 22654 + }, + { + "epoch": 1.78, + "learning_rate": 0.0001062551651548082, + "loss": 1.5048, + "step": 22655 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010624334285756267, + "loss": 1.5346, + "step": 22656 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010623152085740066, + "loss": 1.4566, + "step": 22657 + }, + { + "epoch": 1.78, + "learning_rate": 0.0001062196991544025, + "loss": 1.5029, + "step": 22658 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010620787774864843, + "loss": 1.5195, + "step": 22659 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010619605664021868, + "loss": 1.5459, + "step": 22660 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010618423582919357, + "loss": 1.5148, + "step": 22661 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010617241531565327, + "loss": 1.425, + "step": 22662 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010616059509967811, + "loss": 1.4984, + "step": 22663 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010614877518134833, + "loss": 1.5439, + "step": 22664 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010613695556074413, + "loss": 1.4581, + "step": 22665 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010612513623794582, + "loss": 1.5079, + "step": 22666 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010611331721303364, + "loss": 1.5066, + "step": 22667 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010610149848608778, + "loss": 1.4937, + "step": 22668 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010608968005718855, + "loss": 1.5368, + "step": 22669 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010607786192641615, + "loss": 1.4859, + "step": 22670 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010606604409385077, + "loss": 1.4986, + "step": 22671 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010605422655957276, + "loss": 1.4943, + "step": 22672 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010604240932366233, + "loss": 1.4813, + "step": 22673 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010603059238619964, + "loss": 1.5121, + "step": 22674 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010601877574726497, + "loss": 1.4797, + "step": 22675 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010600695940693858, + "loss": 1.5324, + "step": 22676 + }, + { + "epoch": 1.78, + "learning_rate": 0.0001059951433653006, + "loss": 1.4732, + "step": 22677 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010598332762243139, + "loss": 1.4849, + "step": 22678 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010597151217841103, + "loss": 1.4856, + "step": 22679 + }, + { + "epoch": 1.78, + "learning_rate": 0.0001059596970333198, + "loss": 1.4329, + "step": 22680 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010594788218723797, + "loss": 1.5016, + "step": 22681 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010593606764024567, + "loss": 1.479, + "step": 22682 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010592425339242316, + "loss": 1.4275, + "step": 22683 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010591243944385068, + "loss": 1.5041, + "step": 22684 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010590062579460838, + "loss": 1.5302, + "step": 22685 + }, + { + "epoch": 1.78, + "learning_rate": 0.00010588881244477652, + "loss": 1.4901, + "step": 22686 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010587699939443517, + "loss": 1.4926, + "step": 22687 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010586518664366476, + "loss": 1.5216, + "step": 22688 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010585337419254535, + "loss": 1.4605, + "step": 22689 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010584156204115718, + "loss": 1.5521, + "step": 22690 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010582975018958041, + "loss": 1.5468, + "step": 22691 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010581793863789528, + "loss": 1.5286, + "step": 22692 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010580612738618198, + "loss": 1.4871, + "step": 22693 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010579431643452065, + "loss": 1.5462, + "step": 22694 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010578250578299154, + "loss": 1.5106, + "step": 22695 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010577069543167481, + "loss": 1.4886, + "step": 22696 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010575888538065064, + "loss": 1.501, + "step": 22697 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010574707562999924, + "loss": 1.5218, + "step": 22698 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010573526617980077, + "loss": 1.5093, + "step": 22699 + }, + { + "epoch": 1.79, + "learning_rate": 0.0001057234570301354, + "loss": 1.4758, + "step": 22700 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010571164818108336, + "loss": 1.5314, + "step": 22701 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010569983963272471, + "loss": 1.4941, + "step": 22702 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010568803138513975, + "loss": 1.5097, + "step": 22703 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010567622343840859, + "loss": 1.4647, + "step": 22704 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010566441579261148, + "loss": 1.4662, + "step": 22705 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010565260844782844, + "loss": 1.482, + "step": 22706 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010564080140413978, + "loss": 1.4603, + "step": 22707 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010562899466162556, + "loss": 1.4483, + "step": 22708 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010561718822036597, + "loss": 1.5144, + "step": 22709 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010560538208044122, + "loss": 1.4334, + "step": 22710 + }, + { + "epoch": 1.79, + "learning_rate": 0.0001055935762419314, + "loss": 1.564, + "step": 22711 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010558177070491668, + "loss": 1.448, + "step": 22712 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010556996546947727, + "loss": 1.4851, + "step": 22713 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010555816053569323, + "loss": 1.462, + "step": 22714 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010554635590364478, + "loss": 1.451, + "step": 22715 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010553455157341204, + "loss": 1.4989, + "step": 22716 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010552274754507514, + "loss": 1.5183, + "step": 22717 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010551094381871421, + "loss": 1.4964, + "step": 22718 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010549914039440949, + "loss": 1.4584, + "step": 22719 + }, + { + "epoch": 1.79, + "learning_rate": 0.000105487337272241, + "loss": 1.4742, + "step": 22720 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010547553445228892, + "loss": 1.511, + "step": 22721 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010546373193463346, + "loss": 1.5218, + "step": 22722 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010545192971935461, + "loss": 1.4669, + "step": 22723 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010544012780653259, + "loss": 1.5405, + "step": 22724 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010542832619624755, + "loss": 1.4752, + "step": 22725 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010541652488857955, + "loss": 1.5509, + "step": 22726 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010540472388360876, + "loss": 1.4941, + "step": 22727 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010539292318141526, + "loss": 1.4664, + "step": 22728 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010538112278207921, + "loss": 1.4677, + "step": 22729 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010536932268568071, + "loss": 1.5383, + "step": 22730 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010535752289229988, + "loss": 1.47, + "step": 22731 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010534572340201687, + "loss": 1.4819, + "step": 22732 + }, + { + "epoch": 1.79, + "learning_rate": 0.0001053339242149117, + "loss": 1.4962, + "step": 22733 + }, + { + "epoch": 1.79, + "learning_rate": 0.0001053221253310645, + "loss": 1.5743, + "step": 22734 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010531032675055547, + "loss": 1.4377, + "step": 22735 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010529852847346465, + "loss": 1.4685, + "step": 22736 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010528673049987219, + "loss": 1.5273, + "step": 22737 + }, + { + "epoch": 1.79, + "learning_rate": 0.0001052749328298581, + "loss": 1.4849, + "step": 22738 + }, + { + "epoch": 1.79, + "learning_rate": 0.0001052631354635026, + "loss": 1.5341, + "step": 22739 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010525133840088565, + "loss": 1.4533, + "step": 22740 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010523954164208745, + "loss": 1.4679, + "step": 22741 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010522774518718809, + "loss": 1.5031, + "step": 22742 + }, + { + "epoch": 1.79, + "learning_rate": 0.0001052159490362676, + "loss": 1.4862, + "step": 22743 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010520415318940611, + "loss": 1.478, + "step": 22744 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010519235764668369, + "loss": 1.4957, + "step": 22745 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010518056240818044, + "loss": 1.487, + "step": 22746 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010516876747397645, + "loss": 1.4871, + "step": 22747 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010515697284415177, + "loss": 1.5029, + "step": 22748 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010514517851878647, + "loss": 1.4669, + "step": 22749 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010513338449796069, + "loss": 1.4967, + "step": 22750 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010512159078175449, + "loss": 1.5234, + "step": 22751 + }, + { + "epoch": 1.79, + "learning_rate": 0.0001051097973702479, + "loss": 1.4715, + "step": 22752 + }, + { + "epoch": 1.79, + "learning_rate": 0.000105098004263521, + "loss": 1.4645, + "step": 22753 + }, + { + "epoch": 1.79, + "learning_rate": 0.0001050862114616539, + "loss": 1.5045, + "step": 22754 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010507441896472663, + "loss": 1.4925, + "step": 22755 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010506262677281926, + "loss": 1.5146, + "step": 22756 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010505083488601187, + "loss": 1.5286, + "step": 22757 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010503904330438449, + "loss": 1.4822, + "step": 22758 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010502725202801721, + "loss": 1.4133, + "step": 22759 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010501546105699005, + "loss": 1.5108, + "step": 22760 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010500367039138311, + "loss": 1.4719, + "step": 22761 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010499188003127639, + "loss": 1.4998, + "step": 22762 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010498008997674997, + "loss": 1.4765, + "step": 22763 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010496830022788392, + "loss": 1.5333, + "step": 22764 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010495651078475819, + "loss": 1.5041, + "step": 22765 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010494472164745294, + "loss": 1.4651, + "step": 22766 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010493293281604818, + "loss": 1.4308, + "step": 22767 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010492114429062394, + "loss": 1.5181, + "step": 22768 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010490935607126025, + "loss": 1.4879, + "step": 22769 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010489756815803713, + "loss": 1.4838, + "step": 22770 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010488578055103466, + "loss": 1.5253, + "step": 22771 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010487399325033284, + "loss": 1.4948, + "step": 22772 + }, + { + "epoch": 1.79, + "learning_rate": 0.0001048622062560117, + "loss": 1.5264, + "step": 22773 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010485041956815126, + "loss": 1.4837, + "step": 22774 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010483863318683155, + "loss": 1.4739, + "step": 22775 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010482684711213261, + "loss": 1.5389, + "step": 22776 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010481506134413445, + "loss": 1.4962, + "step": 22777 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010480327588291708, + "loss": 1.4658, + "step": 22778 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010479149072856055, + "loss": 1.469, + "step": 22779 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010477970588114482, + "loss": 1.4517, + "step": 22780 + }, + { + "epoch": 1.79, + "learning_rate": 0.0001047679213407499, + "loss": 1.5454, + "step": 22781 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010475613710745588, + "loss": 1.4624, + "step": 22782 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010474435318134273, + "loss": 1.4844, + "step": 22783 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010473256956249043, + "loss": 1.5321, + "step": 22784 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010472078625097902, + "loss": 1.454, + "step": 22785 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010470900324688847, + "loss": 1.5223, + "step": 22786 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010469722055029879, + "loss": 1.512, + "step": 22787 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010468543816129, + "loss": 1.4963, + "step": 22788 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010467365607994205, + "loss": 1.428, + "step": 22789 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010466187430633499, + "loss": 1.5333, + "step": 22790 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010465009284054878, + "loss": 1.4658, + "step": 22791 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010463831168266339, + "loss": 1.5547, + "step": 22792 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010462653083275886, + "loss": 1.4573, + "step": 22793 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010461475029091513, + "loss": 1.5352, + "step": 22794 + }, + { + "epoch": 1.79, + "learning_rate": 0.0001046029700572122, + "loss": 1.479, + "step": 22795 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010459119013173006, + "loss": 1.4623, + "step": 22796 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010457941051454864, + "loss": 1.5222, + "step": 22797 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010456763120574798, + "loss": 1.4991, + "step": 22798 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010455585220540804, + "loss": 1.4826, + "step": 22799 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010454407351360881, + "loss": 1.5275, + "step": 22800 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010453229513043021, + "loss": 1.5, + "step": 22801 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010452051705595226, + "loss": 1.5034, + "step": 22802 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010450873929025488, + "loss": 1.4893, + "step": 22803 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010449696183341804, + "loss": 1.4802, + "step": 22804 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010448518468552174, + "loss": 1.4957, + "step": 22805 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010447340784664591, + "loss": 1.468, + "step": 22806 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010446163131687053, + "loss": 1.4638, + "step": 22807 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010444985509627555, + "loss": 1.5348, + "step": 22808 + }, + { + "epoch": 1.79, + "learning_rate": 0.0001044380791849409, + "loss": 1.458, + "step": 22809 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010442630358294658, + "loss": 1.5023, + "step": 22810 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010441452829037246, + "loss": 1.4982, + "step": 22811 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010440275330729852, + "loss": 1.4688, + "step": 22812 + }, + { + "epoch": 1.79, + "learning_rate": 0.00010439097863380474, + "loss": 1.4668, + "step": 22813 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010437920426997111, + "loss": 1.4996, + "step": 22814 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010436743021587746, + "loss": 1.4867, + "step": 22815 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010435565647160376, + "loss": 1.4677, + "step": 22816 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010434388303723001, + "loss": 1.4844, + "step": 22817 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010433210991283605, + "loss": 1.5006, + "step": 22818 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010432033709850191, + "loss": 1.511, + "step": 22819 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010430856459430745, + "loss": 1.4673, + "step": 22820 + }, + { + "epoch": 1.8, + "learning_rate": 0.0001042967924003326, + "loss": 1.5142, + "step": 22821 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010428502051665735, + "loss": 1.4542, + "step": 22822 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010427324894336155, + "loss": 1.5123, + "step": 22823 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010426147768052518, + "loss": 1.4775, + "step": 22824 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010424970672822813, + "loss": 1.46, + "step": 22825 + }, + { + "epoch": 1.8, + "learning_rate": 0.0001042379360865503, + "loss": 1.4957, + "step": 22826 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010422616575557168, + "loss": 1.5132, + "step": 22827 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010421439573537203, + "loss": 1.4731, + "step": 22828 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010420262602603147, + "loss": 1.4955, + "step": 22829 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010419085662762976, + "loss": 1.5059, + "step": 22830 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010417908754024688, + "loss": 1.4794, + "step": 22831 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010416731876396267, + "loss": 1.5094, + "step": 22832 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010415555029885711, + "loss": 1.5002, + "step": 22833 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010414378214501009, + "loss": 1.4772, + "step": 22834 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010413201430250144, + "loss": 1.452, + "step": 22835 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010412024677141108, + "loss": 1.4774, + "step": 22836 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010410847955181899, + "loss": 1.4811, + "step": 22837 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010409671264380496, + "loss": 1.4968, + "step": 22838 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010408494604744895, + "loss": 1.5102, + "step": 22839 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010407317976283078, + "loss": 1.4899, + "step": 22840 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010406141379003036, + "loss": 1.4421, + "step": 22841 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010404964812912764, + "loss": 1.4693, + "step": 22842 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010403788278020245, + "loss": 1.5323, + "step": 22843 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010402611774333458, + "loss": 1.5194, + "step": 22844 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010401435301860407, + "loss": 1.5545, + "step": 22845 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010400258860609075, + "loss": 1.4692, + "step": 22846 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010399082450587444, + "loss": 1.4663, + "step": 22847 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010397906071803504, + "loss": 1.4776, + "step": 22848 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010396729724265245, + "loss": 1.4952, + "step": 22849 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010395553407980648, + "loss": 1.4432, + "step": 22850 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010394377122957706, + "loss": 1.4555, + "step": 22851 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010393200869204397, + "loss": 1.4416, + "step": 22852 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010392024646728714, + "loss": 1.483, + "step": 22853 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010390848455538642, + "loss": 1.5144, + "step": 22854 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010389672295642164, + "loss": 1.4468, + "step": 22855 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010388496167047269, + "loss": 1.5179, + "step": 22856 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010387320069761937, + "loss": 1.452, + "step": 22857 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010386144003794156, + "loss": 1.4674, + "step": 22858 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010384967969151907, + "loss": 1.4886, + "step": 22859 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010383791965843186, + "loss": 1.5132, + "step": 22860 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010382615993875968, + "loss": 1.5014, + "step": 22861 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010381440053258241, + "loss": 1.5393, + "step": 22862 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010380264143997986, + "loss": 1.526, + "step": 22863 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010379088266103188, + "loss": 1.4809, + "step": 22864 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010377912419581831, + "loss": 1.4711, + "step": 22865 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010376736604441898, + "loss": 1.5532, + "step": 22866 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010375560820691372, + "loss": 1.4814, + "step": 22867 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010374385068338238, + "loss": 1.4672, + "step": 22868 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010373209347390473, + "loss": 1.4777, + "step": 22869 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010372033657856065, + "loss": 1.5357, + "step": 22870 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010370857999742997, + "loss": 1.4779, + "step": 22871 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010369682373059244, + "loss": 1.4525, + "step": 22872 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010368506777812797, + "loss": 1.4993, + "step": 22873 + }, + { + "epoch": 1.8, + "learning_rate": 0.0001036733121401163, + "loss": 1.4899, + "step": 22874 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010366155681663724, + "loss": 1.534, + "step": 22875 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010364980180777066, + "loss": 1.5109, + "step": 22876 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010363804711359635, + "loss": 1.4721, + "step": 22877 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010362629273419416, + "loss": 1.5575, + "step": 22878 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010361453866964382, + "loss": 1.5054, + "step": 22879 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010360278492002518, + "loss": 1.5069, + "step": 22880 + }, + { + "epoch": 1.8, + "learning_rate": 0.000103591031485418, + "loss": 1.4965, + "step": 22881 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010357927836590211, + "loss": 1.5167, + "step": 22882 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010356752556155733, + "loss": 1.4705, + "step": 22883 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010355577307246342, + "loss": 1.5329, + "step": 22884 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010354402089870018, + "loss": 1.4555, + "step": 22885 + }, + { + "epoch": 1.8, + "learning_rate": 0.0001035322690403474, + "loss": 1.4729, + "step": 22886 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010352051749748484, + "loss": 1.4726, + "step": 22887 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010350876627019237, + "loss": 1.5012, + "step": 22888 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010349701535854967, + "loss": 1.4709, + "step": 22889 + }, + { + "epoch": 1.8, + "learning_rate": 0.0001034852647626366, + "loss": 1.5106, + "step": 22890 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010347351448253285, + "loss": 1.4691, + "step": 22891 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010346176451831834, + "loss": 1.5302, + "step": 22892 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010345001487007275, + "loss": 1.466, + "step": 22893 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010343826553787585, + "loss": 1.5027, + "step": 22894 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010342651652180746, + "loss": 1.4952, + "step": 22895 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010341476782194731, + "loss": 1.4946, + "step": 22896 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010340301943837518, + "loss": 1.4654, + "step": 22897 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010339127137117084, + "loss": 1.5068, + "step": 22898 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010337952362041402, + "loss": 1.508, + "step": 22899 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010336777618618455, + "loss": 1.4684, + "step": 22900 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010335602906856212, + "loss": 1.4587, + "step": 22901 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010334428226762653, + "loss": 1.4956, + "step": 22902 + }, + { + "epoch": 1.8, + "learning_rate": 0.0001033325357834575, + "loss": 1.5032, + "step": 22903 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010332078961613479, + "loss": 1.5001, + "step": 22904 + }, + { + "epoch": 1.8, + "learning_rate": 0.0001033090437657382, + "loss": 1.4814, + "step": 22905 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010329729823234738, + "loss": 1.5568, + "step": 22906 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010328555301604211, + "loss": 1.5091, + "step": 22907 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010327380811690218, + "loss": 1.5406, + "step": 22908 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010326206353500738, + "loss": 1.4809, + "step": 22909 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010325031927043732, + "loss": 1.4833, + "step": 22910 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010323857532327179, + "loss": 1.4426, + "step": 22911 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010322683169359055, + "loss": 1.4682, + "step": 22912 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010321508838147329, + "loss": 1.5285, + "step": 22913 + }, + { + "epoch": 1.8, + "learning_rate": 0.0001032033453869998, + "loss": 1.5218, + "step": 22914 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010319160271024973, + "loss": 1.4553, + "step": 22915 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010317986035130285, + "loss": 1.5579, + "step": 22916 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010316811831023891, + "loss": 1.5168, + "step": 22917 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010315637658713757, + "loss": 1.4908, + "step": 22918 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010314463518207858, + "loss": 1.4826, + "step": 22919 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010313289409514169, + "loss": 1.4761, + "step": 22920 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010312115332640657, + "loss": 1.4753, + "step": 22921 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010310941287595291, + "loss": 1.4427, + "step": 22922 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010309767274386049, + "loss": 1.481, + "step": 22923 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010308593293020902, + "loss": 1.4827, + "step": 22924 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010307419343507815, + "loss": 1.4635, + "step": 22925 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010306245425854764, + "loss": 1.4784, + "step": 22926 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010305071540069714, + "loss": 1.4865, + "step": 22927 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010303897686160636, + "loss": 1.5222, + "step": 22928 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010302723864135504, + "loss": 1.4921, + "step": 22929 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010301550074002281, + "loss": 1.5343, + "step": 22930 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010300376315768943, + "loss": 1.4455, + "step": 22931 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010299202589443458, + "loss": 1.4808, + "step": 22932 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010298028895033789, + "loss": 1.4955, + "step": 22933 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010296855232547914, + "loss": 1.5006, + "step": 22934 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010295681601993794, + "loss": 1.5178, + "step": 22935 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010294508003379398, + "loss": 1.4912, + "step": 22936 + }, + { + "epoch": 1.8, + "learning_rate": 0.000102933344367127, + "loss": 1.525, + "step": 22937 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010292160902001657, + "loss": 1.5018, + "step": 22938 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010290987399254247, + "loss": 1.5116, + "step": 22939 + }, + { + "epoch": 1.8, + "learning_rate": 0.00010289813928478434, + "loss": 1.4678, + "step": 22940 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010288640489682186, + "loss": 1.4764, + "step": 22941 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010287467082873469, + "loss": 1.4457, + "step": 22942 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010286293708060252, + "loss": 1.4873, + "step": 22943 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010285120365250497, + "loss": 1.5063, + "step": 22944 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010283947054452173, + "loss": 1.5344, + "step": 22945 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010282773775673248, + "loss": 1.4949, + "step": 22946 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010281600528921683, + "loss": 1.4459, + "step": 22947 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010280427314205447, + "loss": 1.4492, + "step": 22948 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010279254131532507, + "loss": 1.4217, + "step": 22949 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010278080980910823, + "loss": 1.5072, + "step": 22950 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010276907862348368, + "loss": 1.5213, + "step": 22951 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010275734775853099, + "loss": 1.4951, + "step": 22952 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010274561721432985, + "loss": 1.5847, + "step": 22953 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010273388699095984, + "loss": 1.5048, + "step": 22954 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010272215708850072, + "loss": 1.5439, + "step": 22955 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010271042750703202, + "loss": 1.477, + "step": 22956 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010269869824663344, + "loss": 1.4352, + "step": 22957 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010268696930738464, + "loss": 1.487, + "step": 22958 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010267524068936514, + "loss": 1.4756, + "step": 22959 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010266351239265466, + "loss": 1.4454, + "step": 22960 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010265178441733284, + "loss": 1.4651, + "step": 22961 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010264005676347925, + "loss": 1.4831, + "step": 22962 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010262832943117355, + "loss": 1.4699, + "step": 22963 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010261660242049535, + "loss": 1.508, + "step": 22964 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010260487573152424, + "loss": 1.4717, + "step": 22965 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010259314936433992, + "loss": 1.4451, + "step": 22966 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010258142331902193, + "loss": 1.4724, + "step": 22967 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010256969759564992, + "loss": 1.5254, + "step": 22968 + }, + { + "epoch": 1.81, + "learning_rate": 0.0001025579721943034, + "loss": 1.5293, + "step": 22969 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010254624711506215, + "loss": 1.4848, + "step": 22970 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010253452235800568, + "loss": 1.4734, + "step": 22971 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010252279792321365, + "loss": 1.4733, + "step": 22972 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010251107381076556, + "loss": 1.5553, + "step": 22973 + }, + { + "epoch": 1.81, + "learning_rate": 0.0001024993500207411, + "loss": 1.529, + "step": 22974 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010248762655321987, + "loss": 1.4404, + "step": 22975 + }, + { + "epoch": 1.81, + "learning_rate": 0.0001024759034082814, + "loss": 1.5427, + "step": 22976 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010246418058600531, + "loss": 1.4662, + "step": 22977 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010245245808647124, + "loss": 1.4702, + "step": 22978 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010244073590975871, + "loss": 1.4922, + "step": 22979 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010242901405594737, + "loss": 1.4821, + "step": 22980 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010241729252511675, + "loss": 1.4992, + "step": 22981 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010240557131734644, + "loss": 1.4419, + "step": 22982 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010239385043271608, + "loss": 1.5223, + "step": 22983 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010238212987130517, + "loss": 1.4876, + "step": 22984 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010237040963319328, + "loss": 1.4961, + "step": 22985 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010235868971846006, + "loss": 1.5028, + "step": 22986 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010234697012718507, + "loss": 1.442, + "step": 22987 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010233525085944783, + "loss": 1.4895, + "step": 22988 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010232353191532795, + "loss": 1.4778, + "step": 22989 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010231181329490499, + "loss": 1.4689, + "step": 22990 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010230009499825848, + "loss": 1.5079, + "step": 22991 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010228837702546801, + "loss": 1.4551, + "step": 22992 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010227665937661313, + "loss": 1.496, + "step": 22993 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010226494205177339, + "loss": 1.4893, + "step": 22994 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010225322505102839, + "loss": 1.5217, + "step": 22995 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010224150837445759, + "loss": 1.4603, + "step": 22996 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010222979202214062, + "loss": 1.5026, + "step": 22997 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010221807599415697, + "loss": 1.5203, + "step": 22998 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010220636029058624, + "loss": 1.5108, + "step": 22999 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010219464491150799, + "loss": 1.4758, + "step": 23000 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010218292985700162, + "loss": 1.5473, + "step": 23001 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010217121512714682, + "loss": 1.4933, + "step": 23002 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010215950072202307, + "loss": 1.5054, + "step": 23003 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010214778664170995, + "loss": 1.448, + "step": 23004 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010213607288628692, + "loss": 1.4779, + "step": 23005 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010212435945583352, + "loss": 1.4982, + "step": 23006 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010211264635042933, + "loss": 1.5869, + "step": 23007 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010210093357015384, + "loss": 1.5239, + "step": 23008 + }, + { + "epoch": 1.81, + "learning_rate": 0.0001020892211150866, + "loss": 1.4848, + "step": 23009 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010207750898530707, + "loss": 1.5005, + "step": 23010 + }, + { + "epoch": 1.81, + "learning_rate": 0.0001020657971808948, + "loss": 1.5111, + "step": 23011 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010205408570192937, + "loss": 1.4591, + "step": 23012 + }, + { + "epoch": 1.81, + "learning_rate": 0.0001020423745484902, + "loss": 1.5381, + "step": 23013 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010203066372065684, + "loss": 1.5171, + "step": 23014 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010201895321850883, + "loss": 1.5242, + "step": 23015 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010200724304212562, + "loss": 1.4484, + "step": 23016 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010199553319158671, + "loss": 1.5298, + "step": 23017 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010198382366697168, + "loss": 1.4984, + "step": 23018 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010197211446836002, + "loss": 1.4855, + "step": 23019 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010196040559583115, + "loss": 1.5343, + "step": 23020 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010194869704946465, + "loss": 1.5338, + "step": 23021 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010193698882933998, + "loss": 1.5077, + "step": 23022 + }, + { + "epoch": 1.81, + "learning_rate": 0.0001019252809355366, + "loss": 1.496, + "step": 23023 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010191357336813408, + "loss": 1.4513, + "step": 23024 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010190186612721182, + "loss": 1.4927, + "step": 23025 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010189015921284938, + "loss": 1.5307, + "step": 23026 + }, + { + "epoch": 1.81, + "learning_rate": 0.0001018784526251262, + "loss": 1.4922, + "step": 23027 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010186674636412174, + "loss": 1.5316, + "step": 23028 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010185504042991555, + "loss": 1.4437, + "step": 23029 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010184333482258704, + "loss": 1.5198, + "step": 23030 + }, + { + "epoch": 1.81, + "learning_rate": 0.0001018316295422157, + "loss": 1.5083, + "step": 23031 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010181992458888098, + "loss": 1.4806, + "step": 23032 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010180821996266248, + "loss": 1.5073, + "step": 23033 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010179651566363951, + "loss": 1.467, + "step": 23034 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010178481169189161, + "loss": 1.467, + "step": 23035 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010177310804749827, + "loss": 1.4938, + "step": 23036 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010176140473053887, + "loss": 1.4996, + "step": 23037 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010174970174109293, + "loss": 1.4971, + "step": 23038 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010173799907923988, + "loss": 1.448, + "step": 23039 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010172629674505917, + "loss": 1.5061, + "step": 23040 + }, + { + "epoch": 1.81, + "learning_rate": 0.0001017145947386303, + "loss": 1.4966, + "step": 23041 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010170289306003266, + "loss": 1.4931, + "step": 23042 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010169119170934572, + "loss": 1.5274, + "step": 23043 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010167949068664896, + "loss": 1.4545, + "step": 23044 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010166778999202176, + "loss": 1.4611, + "step": 23045 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010165608962554362, + "loss": 1.4817, + "step": 23046 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010164438958729393, + "loss": 1.4668, + "step": 23047 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010163268987735211, + "loss": 1.5251, + "step": 23048 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010162099049579767, + "loss": 1.4751, + "step": 23049 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010160929144271005, + "loss": 1.5318, + "step": 23050 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010159759271816858, + "loss": 1.4913, + "step": 23051 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010158589432225278, + "loss": 1.5081, + "step": 23052 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010157419625504204, + "loss": 1.4747, + "step": 23053 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010156249851661577, + "loss": 1.494, + "step": 23054 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010155080110705343, + "loss": 1.4563, + "step": 23055 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010153910402643439, + "loss": 1.5073, + "step": 23056 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010152740727483809, + "loss": 1.4669, + "step": 23057 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010151571085234395, + "loss": 1.5015, + "step": 23058 + }, + { + "epoch": 1.81, + "learning_rate": 0.0001015040147590314, + "loss": 1.4809, + "step": 23059 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010149231899497979, + "loss": 1.4894, + "step": 23060 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010148062356026859, + "loss": 1.4793, + "step": 23061 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010146892845497716, + "loss": 1.4813, + "step": 23062 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010145723367918496, + "loss": 1.4445, + "step": 23063 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010144553923297125, + "loss": 1.4913, + "step": 23064 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010143384511641564, + "loss": 1.4849, + "step": 23065 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010142215132959738, + "loss": 1.5091, + "step": 23066 + }, + { + "epoch": 1.81, + "learning_rate": 0.00010141045787259595, + "loss": 1.5116, + "step": 23067 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010139876474549067, + "loss": 1.4573, + "step": 23068 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010138707194836093, + "loss": 1.4778, + "step": 23069 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010137537948128618, + "loss": 1.491, + "step": 23070 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010136368734434576, + "loss": 1.4263, + "step": 23071 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010135199553761906, + "loss": 1.4591, + "step": 23072 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010134030406118548, + "loss": 1.5257, + "step": 23073 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010132861291512436, + "loss": 1.4615, + "step": 23074 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010131692209951513, + "loss": 1.4619, + "step": 23075 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010130523161443708, + "loss": 1.5101, + "step": 23076 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010129354145996967, + "loss": 1.5424, + "step": 23077 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010128185163619227, + "loss": 1.497, + "step": 23078 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010127016214318413, + "loss": 1.548, + "step": 23079 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010125847298102473, + "loss": 1.4805, + "step": 23080 + }, + { + "epoch": 1.82, + "learning_rate": 0.0001012467841497934, + "loss": 1.5035, + "step": 23081 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010123509564956953, + "loss": 1.4556, + "step": 23082 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010122340748043242, + "loss": 1.5092, + "step": 23083 + }, + { + "epoch": 1.82, + "learning_rate": 0.0001012117196424615, + "loss": 1.5532, + "step": 23084 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010120003213573604, + "loss": 1.476, + "step": 23085 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010118834496033542, + "loss": 1.5387, + "step": 23086 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010117665811633905, + "loss": 1.4975, + "step": 23087 + }, + { + "epoch": 1.82, + "learning_rate": 0.0001011649716038262, + "loss": 1.4863, + "step": 23088 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010115328542287622, + "loss": 1.5355, + "step": 23089 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010114159957356854, + "loss": 1.4692, + "step": 23090 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010112991405598238, + "loss": 1.4596, + "step": 23091 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010111822887019717, + "loss": 1.498, + "step": 23092 + }, + { + "epoch": 1.82, + "learning_rate": 0.0001011065440162922, + "loss": 1.4717, + "step": 23093 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010109485949434678, + "loss": 1.519, + "step": 23094 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010108317530444027, + "loss": 1.5225, + "step": 23095 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010107149144665206, + "loss": 1.5158, + "step": 23096 + }, + { + "epoch": 1.82, + "learning_rate": 0.0001010598079210614, + "loss": 1.4734, + "step": 23097 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010104812472774762, + "loss": 1.471, + "step": 23098 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010103644186679009, + "loss": 1.4027, + "step": 23099 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010102475933826809, + "loss": 1.4616, + "step": 23100 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010101307714226093, + "loss": 1.44, + "step": 23101 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010100139527884799, + "loss": 1.4507, + "step": 23102 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010098971374810847, + "loss": 1.5042, + "step": 23103 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010097803255012181, + "loss": 1.4895, + "step": 23104 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010096635168496722, + "loss": 1.5046, + "step": 23105 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010095467115272404, + "loss": 1.4742, + "step": 23106 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010094299095347161, + "loss": 1.5331, + "step": 23107 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010093131108728918, + "loss": 1.4922, + "step": 23108 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010091963155425606, + "loss": 1.4882, + "step": 23109 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010090795235445157, + "loss": 1.5499, + "step": 23110 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010089627348795494, + "loss": 1.4763, + "step": 23111 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010088459495484555, + "loss": 1.5037, + "step": 23112 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010087291675520265, + "loss": 1.4663, + "step": 23113 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010086123888910558, + "loss": 1.5126, + "step": 23114 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010084956135663355, + "loss": 1.492, + "step": 23115 + }, + { + "epoch": 1.82, + "learning_rate": 0.0001008378841578659, + "loss": 1.5243, + "step": 23116 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010082620729288185, + "loss": 1.4971, + "step": 23117 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010081453076176071, + "loss": 1.4985, + "step": 23118 + }, + { + "epoch": 1.82, + "learning_rate": 0.0001008028545645818, + "loss": 1.5018, + "step": 23119 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010079117870142435, + "loss": 1.4952, + "step": 23120 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010077950317236764, + "loss": 1.5402, + "step": 23121 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010076782797749094, + "loss": 1.5079, + "step": 23122 + }, + { + "epoch": 1.82, + "learning_rate": 0.0001007561531168735, + "loss": 1.4781, + "step": 23123 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010074447859059464, + "loss": 1.4385, + "step": 23124 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010073280439873356, + "loss": 1.4781, + "step": 23125 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010072113054136954, + "loss": 1.4826, + "step": 23126 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010070945701858183, + "loss": 1.4774, + "step": 23127 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010069778383044977, + "loss": 1.4778, + "step": 23128 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010068611097705252, + "loss": 1.4795, + "step": 23129 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010067443845846935, + "loss": 1.5305, + "step": 23130 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010066276627477956, + "loss": 1.508, + "step": 23131 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010065109442606234, + "loss": 1.5115, + "step": 23132 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010063942291239697, + "loss": 1.5617, + "step": 23133 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010062775173386266, + "loss": 1.5114, + "step": 23134 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010061608089053865, + "loss": 1.4871, + "step": 23135 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010060441038250424, + "loss": 1.4669, + "step": 23136 + }, + { + "epoch": 1.82, + "learning_rate": 0.0001005927402098386, + "loss": 1.4519, + "step": 23137 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010058107037262102, + "loss": 1.4105, + "step": 23138 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010056940087093068, + "loss": 1.5392, + "step": 23139 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010055773170484681, + "loss": 1.4741, + "step": 23140 + }, + { + "epoch": 1.82, + "learning_rate": 0.0001005460628744487, + "loss": 1.4988, + "step": 23141 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010053439437981544, + "loss": 1.4855, + "step": 23142 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010052272622102644, + "loss": 1.4614, + "step": 23143 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010051105839816078, + "loss": 1.4421, + "step": 23144 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010049939091129776, + "loss": 1.482, + "step": 23145 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010048772376051651, + "loss": 1.4988, + "step": 23146 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010047605694589633, + "loss": 1.4412, + "step": 23147 + }, + { + "epoch": 1.82, + "learning_rate": 0.0001004643904675164, + "loss": 1.4968, + "step": 23148 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010045272432545592, + "loss": 1.5058, + "step": 23149 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010044105851979408, + "loss": 1.512, + "step": 23150 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010042939305061011, + "loss": 1.4854, + "step": 23151 + }, + { + "epoch": 1.82, + "learning_rate": 0.0001004177279179832, + "loss": 1.5431, + "step": 23152 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010040606312199258, + "loss": 1.4484, + "step": 23153 + }, + { + "epoch": 1.82, + "learning_rate": 0.0001003943986627174, + "loss": 1.4796, + "step": 23154 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010038273454023688, + "loss": 1.4992, + "step": 23155 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010037107075463023, + "loss": 1.4708, + "step": 23156 + }, + { + "epoch": 1.82, + "learning_rate": 0.0001003594073059766, + "loss": 1.5394, + "step": 23157 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010034774419435517, + "loss": 1.5295, + "step": 23158 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010033608141984517, + "loss": 1.423, + "step": 23159 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010032441898252584, + "loss": 1.4703, + "step": 23160 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010031275688247622, + "loss": 1.543, + "step": 23161 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010030109511977561, + "loss": 1.4311, + "step": 23162 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010028943369450311, + "loss": 1.5006, + "step": 23163 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010027777260673792, + "loss": 1.4791, + "step": 23164 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010026611185655924, + "loss": 1.5414, + "step": 23165 + }, + { + "epoch": 1.82, + "learning_rate": 0.0001002544514440462, + "loss": 1.4892, + "step": 23166 + }, + { + "epoch": 1.82, + "learning_rate": 0.000100242791369278, + "loss": 1.4704, + "step": 23167 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010023113163233375, + "loss": 1.5016, + "step": 23168 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010021947223329267, + "loss": 1.4912, + "step": 23169 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010020781317223392, + "loss": 1.4829, + "step": 23170 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010019615444923662, + "loss": 1.4721, + "step": 23171 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010018449606437995, + "loss": 1.5134, + "step": 23172 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010017283801774308, + "loss": 1.5038, + "step": 23173 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010016118030940508, + "loss": 1.5026, + "step": 23174 + }, + { + "epoch": 1.82, + "learning_rate": 0.0001001495229394452, + "loss": 1.4628, + "step": 23175 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010013786590794255, + "loss": 1.4898, + "step": 23176 + }, + { + "epoch": 1.82, + "learning_rate": 0.0001001262092149763, + "loss": 1.5195, + "step": 23177 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010011455286062555, + "loss": 1.5194, + "step": 23178 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010010289684496946, + "loss": 1.4768, + "step": 23179 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010009124116808717, + "loss": 1.4865, + "step": 23180 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010007958583005778, + "loss": 1.4597, + "step": 23181 + }, + { + "epoch": 1.82, + "learning_rate": 0.0001000679308309605, + "loss": 1.4952, + "step": 23182 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010005627617087437, + "loss": 1.4849, + "step": 23183 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010004462184987858, + "loss": 1.4883, + "step": 23184 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010003296786805229, + "loss": 1.5479, + "step": 23185 + }, + { + "epoch": 1.82, + "learning_rate": 0.0001000213142254745, + "loss": 1.4993, + "step": 23186 + }, + { + "epoch": 1.82, + "learning_rate": 0.00010000966092222444, + "loss": 1.4793, + "step": 23187 + }, + { + "epoch": 1.82, + "learning_rate": 9.999800795838119e-05, + "loss": 1.4786, + "step": 23188 + }, + { + "epoch": 1.82, + "learning_rate": 9.998635533402383e-05, + "loss": 1.4791, + "step": 23189 + }, + { + "epoch": 1.82, + "learning_rate": 9.997470304923156e-05, + "loss": 1.5096, + "step": 23190 + }, + { + "epoch": 1.82, + "learning_rate": 9.996305110408345e-05, + "loss": 1.4732, + "step": 23191 + }, + { + "epoch": 1.82, + "learning_rate": 9.995139949865862e-05, + "loss": 1.4746, + "step": 23192 + }, + { + "epoch": 1.82, + "learning_rate": 9.993974823303615e-05, + "loss": 1.5067, + "step": 23193 + }, + { + "epoch": 1.82, + "learning_rate": 9.992809730729518e-05, + "loss": 1.4806, + "step": 23194 + }, + { + "epoch": 1.83, + "learning_rate": 9.99164467215148e-05, + "loss": 1.4541, + "step": 23195 + }, + { + "epoch": 1.83, + "learning_rate": 9.990479647577411e-05, + "loss": 1.4791, + "step": 23196 + }, + { + "epoch": 1.83, + "learning_rate": 9.989314657015219e-05, + "loss": 1.528, + "step": 23197 + }, + { + "epoch": 1.83, + "learning_rate": 9.988149700472813e-05, + "loss": 1.5084, + "step": 23198 + }, + { + "epoch": 1.83, + "learning_rate": 9.986984777958112e-05, + "loss": 1.5612, + "step": 23199 + }, + { + "epoch": 1.83, + "learning_rate": 9.985819889479011e-05, + "loss": 1.5408, + "step": 23200 + }, + { + "epoch": 1.83, + "learning_rate": 9.984655035043428e-05, + "loss": 1.5164, + "step": 23201 + }, + { + "epoch": 1.83, + "learning_rate": 9.98349021465927e-05, + "loss": 1.4374, + "step": 23202 + }, + { + "epoch": 1.83, + "learning_rate": 9.982325428334446e-05, + "loss": 1.4252, + "step": 23203 + }, + { + "epoch": 1.83, + "learning_rate": 9.981160676076866e-05, + "loss": 1.4942, + "step": 23204 + }, + { + "epoch": 1.83, + "learning_rate": 9.979995957894424e-05, + "loss": 1.4809, + "step": 23205 + }, + { + "epoch": 1.83, + "learning_rate": 9.978831273795049e-05, + "loss": 1.483, + "step": 23206 + }, + { + "epoch": 1.83, + "learning_rate": 9.977666623786636e-05, + "loss": 1.5499, + "step": 23207 + }, + { + "epoch": 1.83, + "learning_rate": 9.976502007877098e-05, + "loss": 1.4879, + "step": 23208 + }, + { + "epoch": 1.83, + "learning_rate": 9.975337426074335e-05, + "loss": 1.5193, + "step": 23209 + }, + { + "epoch": 1.83, + "learning_rate": 9.97417287838626e-05, + "loss": 1.4998, + "step": 23210 + }, + { + "epoch": 1.83, + "learning_rate": 9.97300836482078e-05, + "loss": 1.5015, + "step": 23211 + }, + { + "epoch": 1.83, + "learning_rate": 9.971843885385795e-05, + "loss": 1.52, + "step": 23212 + }, + { + "epoch": 1.83, + "learning_rate": 9.970679440089218e-05, + "loss": 1.51, + "step": 23213 + }, + { + "epoch": 1.83, + "learning_rate": 9.969515028938954e-05, + "loss": 1.5337, + "step": 23214 + }, + { + "epoch": 1.83, + "learning_rate": 9.968350651942902e-05, + "loss": 1.4732, + "step": 23215 + }, + { + "epoch": 1.83, + "learning_rate": 9.967186309108976e-05, + "loss": 1.5094, + "step": 23216 + }, + { + "epoch": 1.83, + "learning_rate": 9.966022000445076e-05, + "loss": 1.5066, + "step": 23217 + }, + { + "epoch": 1.83, + "learning_rate": 9.964857725959107e-05, + "loss": 1.4778, + "step": 23218 + }, + { + "epoch": 1.83, + "learning_rate": 9.963693485658978e-05, + "loss": 1.4559, + "step": 23219 + }, + { + "epoch": 1.83, + "learning_rate": 9.96252927955259e-05, + "loss": 1.5343, + "step": 23220 + }, + { + "epoch": 1.83, + "learning_rate": 9.961365107647847e-05, + "loss": 1.5254, + "step": 23221 + }, + { + "epoch": 1.83, + "learning_rate": 9.960200969952654e-05, + "loss": 1.4689, + "step": 23222 + }, + { + "epoch": 1.83, + "learning_rate": 9.959036866474917e-05, + "loss": 1.4973, + "step": 23223 + }, + { + "epoch": 1.83, + "learning_rate": 9.957872797222539e-05, + "loss": 1.4738, + "step": 23224 + }, + { + "epoch": 1.83, + "learning_rate": 9.95670876220342e-05, + "loss": 1.5202, + "step": 23225 + }, + { + "epoch": 1.83, + "learning_rate": 9.955544761425468e-05, + "loss": 1.4793, + "step": 23226 + }, + { + "epoch": 1.83, + "learning_rate": 9.954380794896582e-05, + "loss": 1.5485, + "step": 23227 + }, + { + "epoch": 1.83, + "learning_rate": 9.953216862624667e-05, + "loss": 1.4828, + "step": 23228 + }, + { + "epoch": 1.83, + "learning_rate": 9.952052964617624e-05, + "loss": 1.5201, + "step": 23229 + }, + { + "epoch": 1.83, + "learning_rate": 9.950889100883352e-05, + "loss": 1.4719, + "step": 23230 + }, + { + "epoch": 1.83, + "learning_rate": 9.949725271429762e-05, + "loss": 1.4592, + "step": 23231 + }, + { + "epoch": 1.83, + "learning_rate": 9.948561476264749e-05, + "loss": 1.5255, + "step": 23232 + }, + { + "epoch": 1.83, + "learning_rate": 9.947397715396216e-05, + "loss": 1.4423, + "step": 23233 + }, + { + "epoch": 1.83, + "learning_rate": 9.946233988832063e-05, + "loss": 1.4989, + "step": 23234 + }, + { + "epoch": 1.83, + "learning_rate": 9.945070296580192e-05, + "loss": 1.5015, + "step": 23235 + }, + { + "epoch": 1.83, + "learning_rate": 9.943906638648506e-05, + "loss": 1.4783, + "step": 23236 + }, + { + "epoch": 1.83, + "learning_rate": 9.942743015044899e-05, + "loss": 1.5405, + "step": 23237 + }, + { + "epoch": 1.83, + "learning_rate": 9.941579425777279e-05, + "loss": 1.476, + "step": 23238 + }, + { + "epoch": 1.83, + "learning_rate": 9.940415870853542e-05, + "loss": 1.4923, + "step": 23239 + }, + { + "epoch": 1.83, + "learning_rate": 9.939252350281595e-05, + "loss": 1.5342, + "step": 23240 + }, + { + "epoch": 1.83, + "learning_rate": 9.938088864069326e-05, + "loss": 1.4878, + "step": 23241 + }, + { + "epoch": 1.83, + "learning_rate": 9.936925412224642e-05, + "loss": 1.4526, + "step": 23242 + }, + { + "epoch": 1.83, + "learning_rate": 9.935761994755441e-05, + "loss": 1.5063, + "step": 23243 + }, + { + "epoch": 1.83, + "learning_rate": 9.934598611669621e-05, + "loss": 1.4893, + "step": 23244 + }, + { + "epoch": 1.83, + "learning_rate": 9.933435262975082e-05, + "loss": 1.4756, + "step": 23245 + }, + { + "epoch": 1.83, + "learning_rate": 9.93227194867972e-05, + "loss": 1.5063, + "step": 23246 + }, + { + "epoch": 1.83, + "learning_rate": 9.931108668791433e-05, + "loss": 1.4604, + "step": 23247 + }, + { + "epoch": 1.83, + "learning_rate": 9.929945423318127e-05, + "loss": 1.5556, + "step": 23248 + }, + { + "epoch": 1.83, + "learning_rate": 9.92878221226769e-05, + "loss": 1.4782, + "step": 23249 + }, + { + "epoch": 1.83, + "learning_rate": 9.927619035648023e-05, + "loss": 1.4677, + "step": 23250 + }, + { + "epoch": 1.83, + "learning_rate": 9.926455893467024e-05, + "loss": 1.4752, + "step": 23251 + }, + { + "epoch": 1.83, + "learning_rate": 9.925292785732585e-05, + "loss": 1.5321, + "step": 23252 + }, + { + "epoch": 1.83, + "learning_rate": 9.924129712452611e-05, + "loss": 1.4372, + "step": 23253 + }, + { + "epoch": 1.83, + "learning_rate": 9.922966673634995e-05, + "loss": 1.4731, + "step": 23254 + }, + { + "epoch": 1.83, + "learning_rate": 9.921803669287638e-05, + "loss": 1.5141, + "step": 23255 + }, + { + "epoch": 1.83, + "learning_rate": 9.920640699418427e-05, + "loss": 1.5115, + "step": 23256 + }, + { + "epoch": 1.83, + "learning_rate": 9.919477764035266e-05, + "loss": 1.5025, + "step": 23257 + }, + { + "epoch": 1.83, + "learning_rate": 9.918314863146045e-05, + "loss": 1.5393, + "step": 23258 + }, + { + "epoch": 1.83, + "learning_rate": 9.917151996758661e-05, + "loss": 1.4938, + "step": 23259 + }, + { + "epoch": 1.83, + "learning_rate": 9.915989164881013e-05, + "loss": 1.5019, + "step": 23260 + }, + { + "epoch": 1.83, + "learning_rate": 9.91482636752099e-05, + "loss": 1.4829, + "step": 23261 + }, + { + "epoch": 1.83, + "learning_rate": 9.913663604686494e-05, + "loss": 1.5005, + "step": 23262 + }, + { + "epoch": 1.83, + "learning_rate": 9.912500876385411e-05, + "loss": 1.4897, + "step": 23263 + }, + { + "epoch": 1.83, + "learning_rate": 9.911338182625639e-05, + "loss": 1.5313, + "step": 23264 + }, + { + "epoch": 1.83, + "learning_rate": 9.910175523415076e-05, + "loss": 1.4891, + "step": 23265 + }, + { + "epoch": 1.83, + "learning_rate": 9.90901289876161e-05, + "loss": 1.4781, + "step": 23266 + }, + { + "epoch": 1.83, + "learning_rate": 9.907850308673136e-05, + "loss": 1.4773, + "step": 23267 + }, + { + "epoch": 1.83, + "learning_rate": 9.906687753157544e-05, + "loss": 1.447, + "step": 23268 + }, + { + "epoch": 1.83, + "learning_rate": 9.905525232222742e-05, + "loss": 1.5631, + "step": 23269 + }, + { + "epoch": 1.83, + "learning_rate": 9.904362745876608e-05, + "loss": 1.4349, + "step": 23270 + }, + { + "epoch": 1.83, + "learning_rate": 9.903200294127035e-05, + "loss": 1.5655, + "step": 23271 + }, + { + "epoch": 1.83, + "learning_rate": 9.902037876981926e-05, + "loss": 1.4839, + "step": 23272 + }, + { + "epoch": 1.83, + "learning_rate": 9.900875494449162e-05, + "loss": 1.4854, + "step": 23273 + }, + { + "epoch": 1.83, + "learning_rate": 9.899713146536644e-05, + "loss": 1.5485, + "step": 23274 + }, + { + "epoch": 1.83, + "learning_rate": 9.898550833252256e-05, + "loss": 1.5119, + "step": 23275 + }, + { + "epoch": 1.83, + "learning_rate": 9.89738855460389e-05, + "loss": 1.4561, + "step": 23276 + }, + { + "epoch": 1.83, + "learning_rate": 9.896226310599445e-05, + "loss": 1.5289, + "step": 23277 + }, + { + "epoch": 1.83, + "learning_rate": 9.895064101246805e-05, + "loss": 1.4963, + "step": 23278 + }, + { + "epoch": 1.83, + "learning_rate": 9.893901926553862e-05, + "loss": 1.463, + "step": 23279 + }, + { + "epoch": 1.83, + "learning_rate": 9.892739786528508e-05, + "loss": 1.4729, + "step": 23280 + }, + { + "epoch": 1.83, + "learning_rate": 9.891577681178631e-05, + "loss": 1.4852, + "step": 23281 + }, + { + "epoch": 1.83, + "learning_rate": 9.890415610512125e-05, + "loss": 1.4672, + "step": 23282 + }, + { + "epoch": 1.83, + "learning_rate": 9.889253574536874e-05, + "loss": 1.4813, + "step": 23283 + }, + { + "epoch": 1.83, + "learning_rate": 9.888091573260766e-05, + "loss": 1.5023, + "step": 23284 + }, + { + "epoch": 1.83, + "learning_rate": 9.886929606691704e-05, + "loss": 1.4814, + "step": 23285 + }, + { + "epoch": 1.83, + "learning_rate": 9.885767674837566e-05, + "loss": 1.5318, + "step": 23286 + }, + { + "epoch": 1.83, + "learning_rate": 9.884605777706244e-05, + "loss": 1.4603, + "step": 23287 + }, + { + "epoch": 1.83, + "learning_rate": 9.883443915305623e-05, + "loss": 1.4687, + "step": 23288 + }, + { + "epoch": 1.83, + "learning_rate": 9.882282087643597e-05, + "loss": 1.4829, + "step": 23289 + }, + { + "epoch": 1.83, + "learning_rate": 9.881120294728052e-05, + "loss": 1.4893, + "step": 23290 + }, + { + "epoch": 1.83, + "learning_rate": 9.879958536566875e-05, + "loss": 1.5107, + "step": 23291 + }, + { + "epoch": 1.83, + "learning_rate": 9.878796813167952e-05, + "loss": 1.4976, + "step": 23292 + }, + { + "epoch": 1.83, + "learning_rate": 9.877635124539173e-05, + "loss": 1.5122, + "step": 23293 + }, + { + "epoch": 1.83, + "learning_rate": 9.876473470688426e-05, + "loss": 1.4882, + "step": 23294 + }, + { + "epoch": 1.83, + "learning_rate": 9.875311851623596e-05, + "loss": 1.4889, + "step": 23295 + }, + { + "epoch": 1.83, + "learning_rate": 9.87415026735257e-05, + "loss": 1.4956, + "step": 23296 + }, + { + "epoch": 1.83, + "learning_rate": 9.872988717883239e-05, + "loss": 1.4513, + "step": 23297 + }, + { + "epoch": 1.83, + "learning_rate": 9.87182720322348e-05, + "loss": 1.5278, + "step": 23298 + }, + { + "epoch": 1.83, + "learning_rate": 9.870665723381182e-05, + "loss": 1.5456, + "step": 23299 + }, + { + "epoch": 1.83, + "learning_rate": 9.869504278364238e-05, + "loss": 1.5336, + "step": 23300 + }, + { + "epoch": 1.83, + "learning_rate": 9.86834286818053e-05, + "loss": 1.4963, + "step": 23301 + }, + { + "epoch": 1.83, + "learning_rate": 9.867181492837938e-05, + "loss": 1.5211, + "step": 23302 + }, + { + "epoch": 1.83, + "learning_rate": 9.866020152344354e-05, + "loss": 1.5356, + "step": 23303 + }, + { + "epoch": 1.83, + "learning_rate": 9.86485884670766e-05, + "loss": 1.505, + "step": 23304 + }, + { + "epoch": 1.83, + "learning_rate": 9.863697575935738e-05, + "loss": 1.4933, + "step": 23305 + }, + { + "epoch": 1.83, + "learning_rate": 9.862536340036478e-05, + "loss": 1.5003, + "step": 23306 + }, + { + "epoch": 1.83, + "learning_rate": 9.861375139017762e-05, + "loss": 1.524, + "step": 23307 + }, + { + "epoch": 1.83, + "learning_rate": 9.860213972887469e-05, + "loss": 1.4502, + "step": 23308 + }, + { + "epoch": 1.83, + "learning_rate": 9.859052841653492e-05, + "loss": 1.5013, + "step": 23309 + }, + { + "epoch": 1.83, + "learning_rate": 9.857891745323704e-05, + "loss": 1.489, + "step": 23310 + }, + { + "epoch": 1.83, + "learning_rate": 9.856730683905997e-05, + "loss": 1.4755, + "step": 23311 + }, + { + "epoch": 1.83, + "learning_rate": 9.855569657408248e-05, + "loss": 1.4971, + "step": 23312 + }, + { + "epoch": 1.83, + "learning_rate": 9.854408665838343e-05, + "loss": 1.5056, + "step": 23313 + }, + { + "epoch": 1.83, + "learning_rate": 9.853247709204165e-05, + "loss": 1.5129, + "step": 23314 + }, + { + "epoch": 1.83, + "learning_rate": 9.852086787513589e-05, + "loss": 1.4901, + "step": 23315 + }, + { + "epoch": 1.83, + "learning_rate": 9.850925900774508e-05, + "loss": 1.4541, + "step": 23316 + }, + { + "epoch": 1.83, + "learning_rate": 9.849765048994796e-05, + "loss": 1.4747, + "step": 23317 + }, + { + "epoch": 1.83, + "learning_rate": 9.848604232182342e-05, + "loss": 1.4944, + "step": 23318 + }, + { + "epoch": 1.83, + "learning_rate": 9.847443450345018e-05, + "loss": 1.482, + "step": 23319 + }, + { + "epoch": 1.83, + "learning_rate": 9.846282703490715e-05, + "loss": 1.4598, + "step": 23320 + }, + { + "epoch": 1.83, + "learning_rate": 9.8451219916273e-05, + "loss": 1.4648, + "step": 23321 + }, + { + "epoch": 1.84, + "learning_rate": 9.843961314762668e-05, + "loss": 1.5068, + "step": 23322 + }, + { + "epoch": 1.84, + "learning_rate": 9.842800672904693e-05, + "loss": 1.4899, + "step": 23323 + }, + { + "epoch": 1.84, + "learning_rate": 9.841640066061254e-05, + "loss": 1.4411, + "step": 23324 + }, + { + "epoch": 1.84, + "learning_rate": 9.840479494240231e-05, + "loss": 1.4817, + "step": 23325 + }, + { + "epoch": 1.84, + "learning_rate": 9.839318957449509e-05, + "loss": 1.5139, + "step": 23326 + }, + { + "epoch": 1.84, + "learning_rate": 9.83815845569696e-05, + "loss": 1.5073, + "step": 23327 + }, + { + "epoch": 1.84, + "learning_rate": 9.83699798899047e-05, + "loss": 1.5103, + "step": 23328 + }, + { + "epoch": 1.84, + "learning_rate": 9.83583755733791e-05, + "loss": 1.4886, + "step": 23329 + }, + { + "epoch": 1.84, + "learning_rate": 9.834677160747164e-05, + "loss": 1.5074, + "step": 23330 + }, + { + "epoch": 1.84, + "learning_rate": 9.833516799226107e-05, + "loss": 1.4846, + "step": 23331 + }, + { + "epoch": 1.84, + "learning_rate": 9.832356472782626e-05, + "loss": 1.5083, + "step": 23332 + }, + { + "epoch": 1.84, + "learning_rate": 9.83119618142459e-05, + "loss": 1.4695, + "step": 23333 + }, + { + "epoch": 1.84, + "learning_rate": 9.83003592515988e-05, + "loss": 1.4922, + "step": 23334 + }, + { + "epoch": 1.84, + "learning_rate": 9.828875703996372e-05, + "loss": 1.4509, + "step": 23335 + }, + { + "epoch": 1.84, + "learning_rate": 9.827715517941945e-05, + "loss": 1.4694, + "step": 23336 + }, + { + "epoch": 1.84, + "learning_rate": 9.826555367004476e-05, + "loss": 1.5196, + "step": 23337 + }, + { + "epoch": 1.84, + "learning_rate": 9.825395251191842e-05, + "loss": 1.4977, + "step": 23338 + }, + { + "epoch": 1.84, + "learning_rate": 9.824235170511917e-05, + "loss": 1.4824, + "step": 23339 + }, + { + "epoch": 1.84, + "learning_rate": 9.823075124972583e-05, + "loss": 1.4403, + "step": 23340 + }, + { + "epoch": 1.84, + "learning_rate": 9.821915114581706e-05, + "loss": 1.4389, + "step": 23341 + }, + { + "epoch": 1.84, + "learning_rate": 9.82075513934717e-05, + "loss": 1.5082, + "step": 23342 + }, + { + "epoch": 1.84, + "learning_rate": 9.81959519927685e-05, + "loss": 1.4626, + "step": 23343 + }, + { + "epoch": 1.84, + "learning_rate": 9.818435294378617e-05, + "loss": 1.4829, + "step": 23344 + }, + { + "epoch": 1.84, + "learning_rate": 9.817275424660352e-05, + "loss": 1.5267, + "step": 23345 + }, + { + "epoch": 1.84, + "learning_rate": 9.816115590129925e-05, + "loss": 1.4914, + "step": 23346 + }, + { + "epoch": 1.84, + "learning_rate": 9.814955790795211e-05, + "loss": 1.4862, + "step": 23347 + }, + { + "epoch": 1.84, + "learning_rate": 9.813796026664086e-05, + "loss": 1.5304, + "step": 23348 + }, + { + "epoch": 1.84, + "learning_rate": 9.812636297744427e-05, + "loss": 1.4628, + "step": 23349 + }, + { + "epoch": 1.84, + "learning_rate": 9.811476604044102e-05, + "loss": 1.4947, + "step": 23350 + }, + { + "epoch": 1.84, + "learning_rate": 9.81031694557099e-05, + "loss": 1.5369, + "step": 23351 + }, + { + "epoch": 1.84, + "learning_rate": 9.809157322332962e-05, + "loss": 1.4544, + "step": 23352 + }, + { + "epoch": 1.84, + "learning_rate": 9.80799773433789e-05, + "loss": 1.4716, + "step": 23353 + }, + { + "epoch": 1.84, + "learning_rate": 9.806838181593648e-05, + "loss": 1.5128, + "step": 23354 + }, + { + "epoch": 1.84, + "learning_rate": 9.80567866410811e-05, + "loss": 1.4711, + "step": 23355 + }, + { + "epoch": 1.84, + "learning_rate": 9.804519181889146e-05, + "loss": 1.5027, + "step": 23356 + }, + { + "epoch": 1.84, + "learning_rate": 9.803359734944633e-05, + "loss": 1.4414, + "step": 23357 + }, + { + "epoch": 1.84, + "learning_rate": 9.802200323282436e-05, + "loss": 1.4758, + "step": 23358 + }, + { + "epoch": 1.84, + "learning_rate": 9.801040946910431e-05, + "loss": 1.4998, + "step": 23359 + }, + { + "epoch": 1.84, + "learning_rate": 9.799881605836493e-05, + "loss": 1.5293, + "step": 23360 + }, + { + "epoch": 1.84, + "learning_rate": 9.798722300068482e-05, + "loss": 1.4766, + "step": 23361 + }, + { + "epoch": 1.84, + "learning_rate": 9.797563029614278e-05, + "loss": 1.4813, + "step": 23362 + }, + { + "epoch": 1.84, + "learning_rate": 9.796403794481751e-05, + "loss": 1.4586, + "step": 23363 + }, + { + "epoch": 1.84, + "learning_rate": 9.795244594678774e-05, + "loss": 1.4692, + "step": 23364 + }, + { + "epoch": 1.84, + "learning_rate": 9.79408543021321e-05, + "loss": 1.461, + "step": 23365 + }, + { + "epoch": 1.84, + "learning_rate": 9.792926301092934e-05, + "loss": 1.492, + "step": 23366 + }, + { + "epoch": 1.84, + "learning_rate": 9.791767207325819e-05, + "loss": 1.5019, + "step": 23367 + }, + { + "epoch": 1.84, + "learning_rate": 9.790608148919726e-05, + "loss": 1.4644, + "step": 23368 + }, + { + "epoch": 1.84, + "learning_rate": 9.789449125882531e-05, + "loss": 1.4834, + "step": 23369 + }, + { + "epoch": 1.84, + "learning_rate": 9.7882901382221e-05, + "loss": 1.4351, + "step": 23370 + }, + { + "epoch": 1.84, + "learning_rate": 9.787131185946303e-05, + "loss": 1.4679, + "step": 23371 + }, + { + "epoch": 1.84, + "learning_rate": 9.78597226906301e-05, + "loss": 1.4277, + "step": 23372 + }, + { + "epoch": 1.84, + "learning_rate": 9.784813387580086e-05, + "loss": 1.494, + "step": 23373 + }, + { + "epoch": 1.84, + "learning_rate": 9.783654541505404e-05, + "loss": 1.4189, + "step": 23374 + }, + { + "epoch": 1.84, + "learning_rate": 9.782495730846825e-05, + "loss": 1.4776, + "step": 23375 + }, + { + "epoch": 1.84, + "learning_rate": 9.781336955612222e-05, + "loss": 1.4519, + "step": 23376 + }, + { + "epoch": 1.84, + "learning_rate": 9.780178215809465e-05, + "loss": 1.4571, + "step": 23377 + }, + { + "epoch": 1.84, + "learning_rate": 9.779019511446409e-05, + "loss": 1.4977, + "step": 23378 + }, + { + "epoch": 1.84, + "learning_rate": 9.777860842530933e-05, + "loss": 1.4889, + "step": 23379 + }, + { + "epoch": 1.84, + "learning_rate": 9.776702209070901e-05, + "loss": 1.5173, + "step": 23380 + }, + { + "epoch": 1.84, + "learning_rate": 9.77554361107418e-05, + "loss": 1.4579, + "step": 23381 + }, + { + "epoch": 1.84, + "learning_rate": 9.774385048548635e-05, + "loss": 1.4513, + "step": 23382 + }, + { + "epoch": 1.84, + "learning_rate": 9.773226521502128e-05, + "loss": 1.4969, + "step": 23383 + }, + { + "epoch": 1.84, + "learning_rate": 9.772068029942533e-05, + "loss": 1.4716, + "step": 23384 + }, + { + "epoch": 1.84, + "learning_rate": 9.770909573877709e-05, + "loss": 1.5082, + "step": 23385 + }, + { + "epoch": 1.84, + "learning_rate": 9.769751153315525e-05, + "loss": 1.4596, + "step": 23386 + }, + { + "epoch": 1.84, + "learning_rate": 9.768592768263843e-05, + "loss": 1.4261, + "step": 23387 + }, + { + "epoch": 1.84, + "learning_rate": 9.767434418730527e-05, + "loss": 1.5104, + "step": 23388 + }, + { + "epoch": 1.84, + "learning_rate": 9.766276104723447e-05, + "loss": 1.4805, + "step": 23389 + }, + { + "epoch": 1.84, + "learning_rate": 9.765117826250463e-05, + "loss": 1.512, + "step": 23390 + }, + { + "epoch": 1.84, + "learning_rate": 9.763959583319439e-05, + "loss": 1.4795, + "step": 23391 + }, + { + "epoch": 1.84, + "learning_rate": 9.762801375938244e-05, + "loss": 1.5051, + "step": 23392 + }, + { + "epoch": 1.84, + "learning_rate": 9.761643204114733e-05, + "loss": 1.4243, + "step": 23393 + }, + { + "epoch": 1.84, + "learning_rate": 9.760485067856772e-05, + "loss": 1.5309, + "step": 23394 + }, + { + "epoch": 1.84, + "learning_rate": 9.759326967172228e-05, + "loss": 1.5165, + "step": 23395 + }, + { + "epoch": 1.84, + "learning_rate": 9.758168902068965e-05, + "loss": 1.465, + "step": 23396 + }, + { + "epoch": 1.84, + "learning_rate": 9.75701087255484e-05, + "loss": 1.5044, + "step": 23397 + }, + { + "epoch": 1.84, + "learning_rate": 9.755852878637721e-05, + "loss": 1.5182, + "step": 23398 + }, + { + "epoch": 1.84, + "learning_rate": 9.754694920325463e-05, + "loss": 1.4665, + "step": 23399 + }, + { + "epoch": 1.84, + "learning_rate": 9.753536997625933e-05, + "loss": 1.5361, + "step": 23400 + }, + { + "epoch": 1.84, + "learning_rate": 9.752379110546993e-05, + "loss": 1.4974, + "step": 23401 + }, + { + "epoch": 1.84, + "learning_rate": 9.751221259096503e-05, + "loss": 1.512, + "step": 23402 + }, + { + "epoch": 1.84, + "learning_rate": 9.750063443282322e-05, + "loss": 1.4664, + "step": 23403 + }, + { + "epoch": 1.84, + "learning_rate": 9.748905663112313e-05, + "loss": 1.5198, + "step": 23404 + }, + { + "epoch": 1.84, + "learning_rate": 9.747747918594338e-05, + "loss": 1.5047, + "step": 23405 + }, + { + "epoch": 1.84, + "learning_rate": 9.746590209736259e-05, + "loss": 1.4858, + "step": 23406 + }, + { + "epoch": 1.84, + "learning_rate": 9.745432536545929e-05, + "loss": 1.4792, + "step": 23407 + }, + { + "epoch": 1.84, + "learning_rate": 9.744274899031213e-05, + "loss": 1.4798, + "step": 23408 + }, + { + "epoch": 1.84, + "learning_rate": 9.743117297199966e-05, + "loss": 1.4948, + "step": 23409 + }, + { + "epoch": 1.84, + "learning_rate": 9.74195973106006e-05, + "loss": 1.4942, + "step": 23410 + }, + { + "epoch": 1.84, + "learning_rate": 9.74080220061934e-05, + "loss": 1.5059, + "step": 23411 + }, + { + "epoch": 1.84, + "learning_rate": 9.739644705885673e-05, + "loss": 1.5608, + "step": 23412 + }, + { + "epoch": 1.84, + "learning_rate": 9.738487246866916e-05, + "loss": 1.4676, + "step": 23413 + }, + { + "epoch": 1.84, + "learning_rate": 9.737329823570927e-05, + "loss": 1.499, + "step": 23414 + }, + { + "epoch": 1.84, + "learning_rate": 9.736172436005567e-05, + "loss": 1.4901, + "step": 23415 + }, + { + "epoch": 1.84, + "learning_rate": 9.735015084178685e-05, + "loss": 1.5026, + "step": 23416 + }, + { + "epoch": 1.84, + "learning_rate": 9.73385776809815e-05, + "loss": 1.5026, + "step": 23417 + }, + { + "epoch": 1.84, + "learning_rate": 9.732700487771814e-05, + "loss": 1.4818, + "step": 23418 + }, + { + "epoch": 1.84, + "learning_rate": 9.731543243207534e-05, + "loss": 1.4671, + "step": 23419 + }, + { + "epoch": 1.84, + "learning_rate": 9.730386034413166e-05, + "loss": 1.5509, + "step": 23420 + }, + { + "epoch": 1.84, + "learning_rate": 9.729228861396574e-05, + "loss": 1.5083, + "step": 23421 + }, + { + "epoch": 1.84, + "learning_rate": 9.728071724165603e-05, + "loss": 1.4984, + "step": 23422 + }, + { + "epoch": 1.84, + "learning_rate": 9.726914622728121e-05, + "loss": 1.5074, + "step": 23423 + }, + { + "epoch": 1.84, + "learning_rate": 9.725757557091978e-05, + "loss": 1.4909, + "step": 23424 + }, + { + "epoch": 1.84, + "learning_rate": 9.724600527265025e-05, + "loss": 1.5224, + "step": 23425 + }, + { + "epoch": 1.84, + "learning_rate": 9.723443533255126e-05, + "loss": 1.4898, + "step": 23426 + }, + { + "epoch": 1.84, + "learning_rate": 9.722286575070138e-05, + "loss": 1.4639, + "step": 23427 + }, + { + "epoch": 1.84, + "learning_rate": 9.721129652717906e-05, + "loss": 1.4479, + "step": 23428 + }, + { + "epoch": 1.84, + "learning_rate": 9.719972766206294e-05, + "loss": 1.4637, + "step": 23429 + }, + { + "epoch": 1.84, + "learning_rate": 9.718815915543153e-05, + "loss": 1.4653, + "step": 23430 + }, + { + "epoch": 1.84, + "learning_rate": 9.717659100736338e-05, + "loss": 1.4824, + "step": 23431 + }, + { + "epoch": 1.84, + "learning_rate": 9.716502321793702e-05, + "loss": 1.5005, + "step": 23432 + }, + { + "epoch": 1.84, + "learning_rate": 9.715345578723099e-05, + "loss": 1.5072, + "step": 23433 + }, + { + "epoch": 1.84, + "learning_rate": 9.714188871532382e-05, + "loss": 1.45, + "step": 23434 + }, + { + "epoch": 1.84, + "learning_rate": 9.713032200229409e-05, + "loss": 1.5104, + "step": 23435 + }, + { + "epoch": 1.84, + "learning_rate": 9.711875564822027e-05, + "loss": 1.569, + "step": 23436 + }, + { + "epoch": 1.84, + "learning_rate": 9.710718965318093e-05, + "loss": 1.5614, + "step": 23437 + }, + { + "epoch": 1.84, + "learning_rate": 9.70956240172546e-05, + "loss": 1.5018, + "step": 23438 + }, + { + "epoch": 1.84, + "learning_rate": 9.708405874051977e-05, + "loss": 1.4734, + "step": 23439 + }, + { + "epoch": 1.84, + "learning_rate": 9.707249382305499e-05, + "loss": 1.4676, + "step": 23440 + }, + { + "epoch": 1.84, + "learning_rate": 9.706092926493868e-05, + "loss": 1.4999, + "step": 23441 + }, + { + "epoch": 1.84, + "learning_rate": 9.704936506624954e-05, + "loss": 1.4864, + "step": 23442 + }, + { + "epoch": 1.84, + "learning_rate": 9.703780122706598e-05, + "loss": 1.4717, + "step": 23443 + }, + { + "epoch": 1.84, + "learning_rate": 9.702623774746652e-05, + "loss": 1.4734, + "step": 23444 + }, + { + "epoch": 1.84, + "learning_rate": 9.701467462752967e-05, + "loss": 1.4778, + "step": 23445 + }, + { + "epoch": 1.84, + "learning_rate": 9.700311186733391e-05, + "loss": 1.5141, + "step": 23446 + }, + { + "epoch": 1.84, + "learning_rate": 9.699154946695782e-05, + "loss": 1.4717, + "step": 23447 + }, + { + "epoch": 1.84, + "learning_rate": 9.697998742647985e-05, + "loss": 1.5033, + "step": 23448 + }, + { + "epoch": 1.84, + "learning_rate": 9.696842574597847e-05, + "loss": 1.4964, + "step": 23449 + }, + { + "epoch": 1.85, + "learning_rate": 9.695686442553226e-05, + "loss": 1.4609, + "step": 23450 + }, + { + "epoch": 1.85, + "learning_rate": 9.694530346521963e-05, + "loss": 1.4683, + "step": 23451 + }, + { + "epoch": 1.85, + "learning_rate": 9.693374286511915e-05, + "loss": 1.5289, + "step": 23452 + }, + { + "epoch": 1.85, + "learning_rate": 9.692218262530925e-05, + "loss": 1.494, + "step": 23453 + }, + { + "epoch": 1.85, + "learning_rate": 9.691062274586841e-05, + "loss": 1.5068, + "step": 23454 + }, + { + "epoch": 1.85, + "learning_rate": 9.68990632268752e-05, + "loss": 1.4706, + "step": 23455 + }, + { + "epoch": 1.85, + "learning_rate": 9.688750406840802e-05, + "loss": 1.5269, + "step": 23456 + }, + { + "epoch": 1.85, + "learning_rate": 9.687594527054533e-05, + "loss": 1.4539, + "step": 23457 + }, + { + "epoch": 1.85, + "learning_rate": 9.686438683336571e-05, + "loss": 1.5188, + "step": 23458 + }, + { + "epoch": 1.85, + "learning_rate": 9.68528287569476e-05, + "loss": 1.4609, + "step": 23459 + }, + { + "epoch": 1.85, + "learning_rate": 9.68412710413694e-05, + "loss": 1.4507, + "step": 23460 + }, + { + "epoch": 1.85, + "learning_rate": 9.68297136867097e-05, + "loss": 1.4885, + "step": 23461 + }, + { + "epoch": 1.85, + "learning_rate": 9.681815669304685e-05, + "loss": 1.5065, + "step": 23462 + }, + { + "epoch": 1.85, + "learning_rate": 9.680660006045938e-05, + "loss": 1.4876, + "step": 23463 + }, + { + "epoch": 1.85, + "learning_rate": 9.679504378902576e-05, + "loss": 1.5133, + "step": 23464 + }, + { + "epoch": 1.85, + "learning_rate": 9.67834878788244e-05, + "loss": 1.4907, + "step": 23465 + }, + { + "epoch": 1.85, + "learning_rate": 9.677193232993378e-05, + "loss": 1.5112, + "step": 23466 + }, + { + "epoch": 1.85, + "learning_rate": 9.676037714243243e-05, + "loss": 1.4446, + "step": 23467 + }, + { + "epoch": 1.85, + "learning_rate": 9.674882231639869e-05, + "loss": 1.5131, + "step": 23468 + }, + { + "epoch": 1.85, + "learning_rate": 9.67372678519111e-05, + "loss": 1.442, + "step": 23469 + }, + { + "epoch": 1.85, + "learning_rate": 9.672571374904803e-05, + "loss": 1.4759, + "step": 23470 + }, + { + "epoch": 1.85, + "learning_rate": 9.671416000788796e-05, + "loss": 1.4635, + "step": 23471 + }, + { + "epoch": 1.85, + "learning_rate": 9.67026066285093e-05, + "loss": 1.4882, + "step": 23472 + }, + { + "epoch": 1.85, + "learning_rate": 9.669105361099062e-05, + "loss": 1.478, + "step": 23473 + }, + { + "epoch": 1.85, + "learning_rate": 9.667950095541021e-05, + "loss": 1.4503, + "step": 23474 + }, + { + "epoch": 1.85, + "learning_rate": 9.666794866184656e-05, + "loss": 1.4998, + "step": 23475 + }, + { + "epoch": 1.85, + "learning_rate": 9.665639673037815e-05, + "loss": 1.4393, + "step": 23476 + }, + { + "epoch": 1.85, + "learning_rate": 9.664484516108335e-05, + "loss": 1.5105, + "step": 23477 + }, + { + "epoch": 1.85, + "learning_rate": 9.66332939540406e-05, + "loss": 1.4936, + "step": 23478 + }, + { + "epoch": 1.85, + "learning_rate": 9.662174310932835e-05, + "loss": 1.5446, + "step": 23479 + }, + { + "epoch": 1.85, + "learning_rate": 9.661019262702499e-05, + "loss": 1.5527, + "step": 23480 + }, + { + "epoch": 1.85, + "learning_rate": 9.6598642507209e-05, + "loss": 1.4658, + "step": 23481 + }, + { + "epoch": 1.85, + "learning_rate": 9.65870927499587e-05, + "loss": 1.5304, + "step": 23482 + }, + { + "epoch": 1.85, + "learning_rate": 9.657554335535259e-05, + "loss": 1.4681, + "step": 23483 + }, + { + "epoch": 1.85, + "learning_rate": 9.656399432346908e-05, + "loss": 1.4807, + "step": 23484 + }, + { + "epoch": 1.85, + "learning_rate": 9.655244565438653e-05, + "loss": 1.4582, + "step": 23485 + }, + { + "epoch": 1.85, + "learning_rate": 9.654089734818341e-05, + "loss": 1.5132, + "step": 23486 + }, + { + "epoch": 1.85, + "learning_rate": 9.652934940493806e-05, + "loss": 1.4245, + "step": 23487 + }, + { + "epoch": 1.85, + "learning_rate": 9.651780182472888e-05, + "loss": 1.5041, + "step": 23488 + }, + { + "epoch": 1.85, + "learning_rate": 9.650625460763437e-05, + "loss": 1.4644, + "step": 23489 + }, + { + "epoch": 1.85, + "learning_rate": 9.649470775373283e-05, + "loss": 1.4746, + "step": 23490 + }, + { + "epoch": 1.85, + "learning_rate": 9.648316126310278e-05, + "loss": 1.5013, + "step": 23491 + }, + { + "epoch": 1.85, + "learning_rate": 9.647161513582248e-05, + "loss": 1.502, + "step": 23492 + }, + { + "epoch": 1.85, + "learning_rate": 9.646006937197039e-05, + "loss": 1.513, + "step": 23493 + }, + { + "epoch": 1.85, + "learning_rate": 9.644852397162487e-05, + "loss": 1.4957, + "step": 23494 + }, + { + "epoch": 1.85, + "learning_rate": 9.64369789348643e-05, + "loss": 1.4874, + "step": 23495 + }, + { + "epoch": 1.85, + "learning_rate": 9.642543426176714e-05, + "loss": 1.4818, + "step": 23496 + }, + { + "epoch": 1.85, + "learning_rate": 9.641388995241166e-05, + "loss": 1.512, + "step": 23497 + }, + { + "epoch": 1.85, + "learning_rate": 9.640234600687635e-05, + "loss": 1.5519, + "step": 23498 + }, + { + "epoch": 1.85, + "learning_rate": 9.639080242523949e-05, + "loss": 1.4904, + "step": 23499 + }, + { + "epoch": 1.85, + "learning_rate": 9.637925920757949e-05, + "loss": 1.4725, + "step": 23500 + }, + { + "epoch": 1.85, + "learning_rate": 9.636771635397479e-05, + "loss": 1.4727, + "step": 23501 + }, + { + "epoch": 1.85, + "learning_rate": 9.635617386450364e-05, + "loss": 1.5369, + "step": 23502 + }, + { + "epoch": 1.85, + "learning_rate": 9.634463173924448e-05, + "loss": 1.5091, + "step": 23503 + }, + { + "epoch": 1.85, + "learning_rate": 9.633308997827562e-05, + "loss": 1.4908, + "step": 23504 + }, + { + "epoch": 1.85, + "learning_rate": 9.632154858167553e-05, + "loss": 1.5146, + "step": 23505 + }, + { + "epoch": 1.85, + "learning_rate": 9.631000754952248e-05, + "loss": 1.4644, + "step": 23506 + }, + { + "epoch": 1.85, + "learning_rate": 9.629846688189484e-05, + "loss": 1.4562, + "step": 23507 + }, + { + "epoch": 1.85, + "learning_rate": 9.628692657887101e-05, + "loss": 1.4431, + "step": 23508 + }, + { + "epoch": 1.85, + "learning_rate": 9.627538664052927e-05, + "loss": 1.5275, + "step": 23509 + }, + { + "epoch": 1.85, + "learning_rate": 9.626384706694805e-05, + "loss": 1.4235, + "step": 23510 + }, + { + "epoch": 1.85, + "learning_rate": 9.62523078582056e-05, + "loss": 1.5252, + "step": 23511 + }, + { + "epoch": 1.85, + "learning_rate": 9.624076901438035e-05, + "loss": 1.452, + "step": 23512 + }, + { + "epoch": 1.85, + "learning_rate": 9.622923053555063e-05, + "loss": 1.4467, + "step": 23513 + }, + { + "epoch": 1.85, + "learning_rate": 9.621769242179472e-05, + "loss": 1.4812, + "step": 23514 + }, + { + "epoch": 1.85, + "learning_rate": 9.620615467319104e-05, + "loss": 1.5035, + "step": 23515 + }, + { + "epoch": 1.85, + "learning_rate": 9.619461728981785e-05, + "loss": 1.4396, + "step": 23516 + }, + { + "epoch": 1.85, + "learning_rate": 9.618308027175352e-05, + "loss": 1.5053, + "step": 23517 + }, + { + "epoch": 1.85, + "learning_rate": 9.61715436190764e-05, + "loss": 1.4416, + "step": 23518 + }, + { + "epoch": 1.85, + "learning_rate": 9.61600073318647e-05, + "loss": 1.5473, + "step": 23519 + }, + { + "epoch": 1.85, + "learning_rate": 9.614847141019694e-05, + "loss": 1.4474, + "step": 23520 + }, + { + "epoch": 1.85, + "learning_rate": 9.613693585415131e-05, + "loss": 1.5306, + "step": 23521 + }, + { + "epoch": 1.85, + "learning_rate": 9.61254006638062e-05, + "loss": 1.4738, + "step": 23522 + }, + { + "epoch": 1.85, + "learning_rate": 9.611386583923984e-05, + "loss": 1.5181, + "step": 23523 + }, + { + "epoch": 1.85, + "learning_rate": 9.61023313805306e-05, + "loss": 1.4235, + "step": 23524 + }, + { + "epoch": 1.85, + "learning_rate": 9.609079728775682e-05, + "loss": 1.497, + "step": 23525 + }, + { + "epoch": 1.85, + "learning_rate": 9.607926356099676e-05, + "loss": 1.4572, + "step": 23526 + }, + { + "epoch": 1.85, + "learning_rate": 9.606773020032875e-05, + "loss": 1.5303, + "step": 23527 + }, + { + "epoch": 1.85, + "learning_rate": 9.605619720583108e-05, + "loss": 1.4556, + "step": 23528 + }, + { + "epoch": 1.85, + "learning_rate": 9.604466457758203e-05, + "loss": 1.4738, + "step": 23529 + }, + { + "epoch": 1.85, + "learning_rate": 9.603313231565998e-05, + "loss": 1.4825, + "step": 23530 + }, + { + "epoch": 1.85, + "learning_rate": 9.602160042014319e-05, + "loss": 1.4584, + "step": 23531 + }, + { + "epoch": 1.85, + "learning_rate": 9.60100688911099e-05, + "loss": 1.468, + "step": 23532 + }, + { + "epoch": 1.85, + "learning_rate": 9.599853772863848e-05, + "loss": 1.4435, + "step": 23533 + }, + { + "epoch": 1.85, + "learning_rate": 9.598700693280717e-05, + "loss": 1.4681, + "step": 23534 + }, + { + "epoch": 1.85, + "learning_rate": 9.597547650369425e-05, + "loss": 1.5119, + "step": 23535 + }, + { + "epoch": 1.85, + "learning_rate": 9.596394644137803e-05, + "loss": 1.4876, + "step": 23536 + }, + { + "epoch": 1.85, + "learning_rate": 9.595241674593688e-05, + "loss": 1.5052, + "step": 23537 + }, + { + "epoch": 1.85, + "learning_rate": 9.594088741744893e-05, + "loss": 1.5067, + "step": 23538 + }, + { + "epoch": 1.85, + "learning_rate": 9.592935845599255e-05, + "loss": 1.4693, + "step": 23539 + }, + { + "epoch": 1.85, + "learning_rate": 9.591782986164596e-05, + "loss": 1.4888, + "step": 23540 + }, + { + "epoch": 1.85, + "learning_rate": 9.590630163448746e-05, + "loss": 1.452, + "step": 23541 + }, + { + "epoch": 1.85, + "learning_rate": 9.589477377459534e-05, + "loss": 1.4813, + "step": 23542 + }, + { + "epoch": 1.85, + "learning_rate": 9.588324628204785e-05, + "loss": 1.5142, + "step": 23543 + }, + { + "epoch": 1.85, + "learning_rate": 9.587171915692328e-05, + "loss": 1.4436, + "step": 23544 + }, + { + "epoch": 1.85, + "learning_rate": 9.586019239929981e-05, + "loss": 1.4372, + "step": 23545 + }, + { + "epoch": 1.85, + "learning_rate": 9.584866600925576e-05, + "loss": 1.4905, + "step": 23546 + }, + { + "epoch": 1.85, + "learning_rate": 9.583713998686944e-05, + "loss": 1.478, + "step": 23547 + }, + { + "epoch": 1.85, + "learning_rate": 9.582561433221899e-05, + "loss": 1.4551, + "step": 23548 + }, + { + "epoch": 1.85, + "learning_rate": 9.581408904538274e-05, + "loss": 1.4336, + "step": 23549 + }, + { + "epoch": 1.85, + "learning_rate": 9.580256412643894e-05, + "loss": 1.4936, + "step": 23550 + }, + { + "epoch": 1.85, + "learning_rate": 9.579103957546578e-05, + "loss": 1.5043, + "step": 23551 + }, + { + "epoch": 1.85, + "learning_rate": 9.577951539254157e-05, + "loss": 1.4979, + "step": 23552 + }, + { + "epoch": 1.85, + "learning_rate": 9.576799157774453e-05, + "loss": 1.4802, + "step": 23553 + }, + { + "epoch": 1.85, + "learning_rate": 9.575646813115292e-05, + "loss": 1.495, + "step": 23554 + }, + { + "epoch": 1.85, + "learning_rate": 9.574494505284492e-05, + "loss": 1.4412, + "step": 23555 + }, + { + "epoch": 1.85, + "learning_rate": 9.573342234289885e-05, + "loss": 1.5015, + "step": 23556 + }, + { + "epoch": 1.85, + "learning_rate": 9.572190000139286e-05, + "loss": 1.4885, + "step": 23557 + }, + { + "epoch": 1.85, + "learning_rate": 9.571037802840523e-05, + "loss": 1.4574, + "step": 23558 + }, + { + "epoch": 1.85, + "learning_rate": 9.569885642401419e-05, + "loss": 1.471, + "step": 23559 + }, + { + "epoch": 1.85, + "learning_rate": 9.568733518829791e-05, + "loss": 1.4651, + "step": 23560 + }, + { + "epoch": 1.85, + "learning_rate": 9.567581432133466e-05, + "loss": 1.4582, + "step": 23561 + }, + { + "epoch": 1.85, + "learning_rate": 9.566429382320268e-05, + "loss": 1.493, + "step": 23562 + }, + { + "epoch": 1.85, + "learning_rate": 9.565277369398015e-05, + "loss": 1.5855, + "step": 23563 + }, + { + "epoch": 1.85, + "learning_rate": 9.564125393374529e-05, + "loss": 1.447, + "step": 23564 + }, + { + "epoch": 1.85, + "learning_rate": 9.56297345425763e-05, + "loss": 1.4764, + "step": 23565 + }, + { + "epoch": 1.85, + "learning_rate": 9.561821552055143e-05, + "loss": 1.5262, + "step": 23566 + }, + { + "epoch": 1.85, + "learning_rate": 9.560669686774883e-05, + "loss": 1.4928, + "step": 23567 + }, + { + "epoch": 1.85, + "learning_rate": 9.559517858424678e-05, + "loss": 1.5065, + "step": 23568 + }, + { + "epoch": 1.85, + "learning_rate": 9.558366067012344e-05, + "loss": 1.52, + "step": 23569 + }, + { + "epoch": 1.85, + "learning_rate": 9.557214312545699e-05, + "loss": 1.5201, + "step": 23570 + }, + { + "epoch": 1.85, + "learning_rate": 9.55606259503257e-05, + "loss": 1.5057, + "step": 23571 + }, + { + "epoch": 1.85, + "learning_rate": 9.554910914480768e-05, + "loss": 1.4658, + "step": 23572 + }, + { + "epoch": 1.85, + "learning_rate": 9.553759270898117e-05, + "loss": 1.4834, + "step": 23573 + }, + { + "epoch": 1.85, + "learning_rate": 9.552607664292438e-05, + "loss": 1.5121, + "step": 23574 + }, + { + "epoch": 1.85, + "learning_rate": 9.551456094671542e-05, + "loss": 1.4826, + "step": 23575 + }, + { + "epoch": 1.85, + "learning_rate": 9.550304562043257e-05, + "loss": 1.4776, + "step": 23576 + }, + { + "epoch": 1.86, + "learning_rate": 9.549153066415392e-05, + "loss": 1.5163, + "step": 23577 + }, + { + "epoch": 1.86, + "learning_rate": 9.548001607795772e-05, + "loss": 1.533, + "step": 23578 + }, + { + "epoch": 1.86, + "learning_rate": 9.546850186192214e-05, + "loss": 1.5099, + "step": 23579 + }, + { + "epoch": 1.86, + "learning_rate": 9.545698801612531e-05, + "loss": 1.4913, + "step": 23580 + }, + { + "epoch": 1.86, + "learning_rate": 9.544547454064547e-05, + "loss": 1.5181, + "step": 23581 + }, + { + "epoch": 1.86, + "learning_rate": 9.543396143556066e-05, + "loss": 1.4623, + "step": 23582 + }, + { + "epoch": 1.86, + "learning_rate": 9.542244870094922e-05, + "loss": 1.4998, + "step": 23583 + }, + { + "epoch": 1.86, + "learning_rate": 9.54109363368892e-05, + "loss": 1.4998, + "step": 23584 + }, + { + "epoch": 1.86, + "learning_rate": 9.539942434345884e-05, + "loss": 1.5091, + "step": 23585 + }, + { + "epoch": 1.86, + "learning_rate": 9.538791272073623e-05, + "loss": 1.5311, + "step": 23586 + }, + { + "epoch": 1.86, + "learning_rate": 9.537640146879956e-05, + "loss": 1.4796, + "step": 23587 + }, + { + "epoch": 1.86, + "learning_rate": 9.536489058772701e-05, + "loss": 1.4939, + "step": 23588 + }, + { + "epoch": 1.86, + "learning_rate": 9.535338007759665e-05, + "loss": 1.4796, + "step": 23589 + }, + { + "epoch": 1.86, + "learning_rate": 9.53418699384867e-05, + "loss": 1.4879, + "step": 23590 + }, + { + "epoch": 1.86, + "learning_rate": 9.533036017047531e-05, + "loss": 1.4894, + "step": 23591 + }, + { + "epoch": 1.86, + "learning_rate": 9.531885077364058e-05, + "loss": 1.4679, + "step": 23592 + }, + { + "epoch": 1.86, + "learning_rate": 9.530734174806072e-05, + "loss": 1.5209, + "step": 23593 + }, + { + "epoch": 1.86, + "learning_rate": 9.529583309381378e-05, + "loss": 1.5179, + "step": 23594 + }, + { + "epoch": 1.86, + "learning_rate": 9.528432481097796e-05, + "loss": 1.5434, + "step": 23595 + }, + { + "epoch": 1.86, + "learning_rate": 9.527281689963141e-05, + "loss": 1.4933, + "step": 23596 + }, + { + "epoch": 1.86, + "learning_rate": 9.526130935985218e-05, + "loss": 1.5067, + "step": 23597 + }, + { + "epoch": 1.86, + "learning_rate": 9.524980219171844e-05, + "loss": 1.4881, + "step": 23598 + }, + { + "epoch": 1.86, + "learning_rate": 9.523829539530836e-05, + "loss": 1.4715, + "step": 23599 + }, + { + "epoch": 1.86, + "learning_rate": 9.522678897070006e-05, + "loss": 1.4894, + "step": 23600 + }, + { + "epoch": 1.86, + "learning_rate": 9.521528291797162e-05, + "loss": 1.4632, + "step": 23601 + }, + { + "epoch": 1.86, + "learning_rate": 9.520377723720116e-05, + "loss": 1.4526, + "step": 23602 + }, + { + "epoch": 1.86, + "learning_rate": 9.519227192846684e-05, + "loss": 1.4627, + "step": 23603 + }, + { + "epoch": 1.86, + "learning_rate": 9.518076699184674e-05, + "loss": 1.5444, + "step": 23604 + }, + { + "epoch": 1.86, + "learning_rate": 9.516926242741898e-05, + "loss": 1.4769, + "step": 23605 + }, + { + "epoch": 1.86, + "learning_rate": 9.515775823526166e-05, + "loss": 1.4415, + "step": 23606 + }, + { + "epoch": 1.86, + "learning_rate": 9.514625441545288e-05, + "loss": 1.5127, + "step": 23607 + }, + { + "epoch": 1.86, + "learning_rate": 9.513475096807081e-05, + "loss": 1.476, + "step": 23608 + }, + { + "epoch": 1.86, + "learning_rate": 9.512324789319347e-05, + "loss": 1.4854, + "step": 23609 + }, + { + "epoch": 1.86, + "learning_rate": 9.511174519089904e-05, + "loss": 1.4735, + "step": 23610 + }, + { + "epoch": 1.86, + "learning_rate": 9.51002428612655e-05, + "loss": 1.5474, + "step": 23611 + }, + { + "epoch": 1.86, + "learning_rate": 9.508874090437105e-05, + "loss": 1.4386, + "step": 23612 + }, + { + "epoch": 1.86, + "learning_rate": 9.507723932029376e-05, + "loss": 1.4908, + "step": 23613 + }, + { + "epoch": 1.86, + "learning_rate": 9.506573810911164e-05, + "loss": 1.4969, + "step": 23614 + }, + { + "epoch": 1.86, + "learning_rate": 9.50542372709029e-05, + "loss": 1.4543, + "step": 23615 + }, + { + "epoch": 1.86, + "learning_rate": 9.504273680574554e-05, + "loss": 1.4916, + "step": 23616 + }, + { + "epoch": 1.86, + "learning_rate": 9.503123671371772e-05, + "loss": 1.4834, + "step": 23617 + }, + { + "epoch": 1.86, + "learning_rate": 9.501973699489742e-05, + "loss": 1.4565, + "step": 23618 + }, + { + "epoch": 1.86, + "learning_rate": 9.500823764936276e-05, + "loss": 1.5081, + "step": 23619 + }, + { + "epoch": 1.86, + "learning_rate": 9.499673867719188e-05, + "loss": 1.4898, + "step": 23620 + }, + { + "epoch": 1.86, + "learning_rate": 9.498524007846274e-05, + "loss": 1.467, + "step": 23621 + }, + { + "epoch": 1.86, + "learning_rate": 9.497374185325348e-05, + "loss": 1.5156, + "step": 23622 + }, + { + "epoch": 1.86, + "learning_rate": 9.496224400164212e-05, + "loss": 1.4746, + "step": 23623 + }, + { + "epoch": 1.86, + "learning_rate": 9.495074652370677e-05, + "loss": 1.4703, + "step": 23624 + }, + { + "epoch": 1.86, + "learning_rate": 9.49392494195255e-05, + "loss": 1.4819, + "step": 23625 + }, + { + "epoch": 1.86, + "learning_rate": 9.492775268917631e-05, + "loss": 1.5061, + "step": 23626 + }, + { + "epoch": 1.86, + "learning_rate": 9.49162563327373e-05, + "loss": 1.47, + "step": 23627 + }, + { + "epoch": 1.86, + "learning_rate": 9.49047603502865e-05, + "loss": 1.483, + "step": 23628 + }, + { + "epoch": 1.86, + "learning_rate": 9.489326474190196e-05, + "loss": 1.4706, + "step": 23629 + }, + { + "epoch": 1.86, + "learning_rate": 9.488176950766173e-05, + "loss": 1.5115, + "step": 23630 + }, + { + "epoch": 1.86, + "learning_rate": 9.487027464764389e-05, + "loss": 1.5075, + "step": 23631 + }, + { + "epoch": 1.86, + "learning_rate": 9.485878016192648e-05, + "loss": 1.4894, + "step": 23632 + }, + { + "epoch": 1.86, + "learning_rate": 9.484728605058752e-05, + "loss": 1.5018, + "step": 23633 + }, + { + "epoch": 1.86, + "learning_rate": 9.483579231370505e-05, + "loss": 1.4826, + "step": 23634 + }, + { + "epoch": 1.86, + "learning_rate": 9.48242989513571e-05, + "loss": 1.5101, + "step": 23635 + }, + { + "epoch": 1.86, + "learning_rate": 9.481280596362171e-05, + "loss": 1.527, + "step": 23636 + }, + { + "epoch": 1.86, + "learning_rate": 9.480131335057693e-05, + "loss": 1.5015, + "step": 23637 + }, + { + "epoch": 1.86, + "learning_rate": 9.478982111230076e-05, + "loss": 1.5156, + "step": 23638 + }, + { + "epoch": 1.86, + "learning_rate": 9.477832924887127e-05, + "loss": 1.5122, + "step": 23639 + }, + { + "epoch": 1.86, + "learning_rate": 9.47668377603664e-05, + "loss": 1.4471, + "step": 23640 + }, + { + "epoch": 1.86, + "learning_rate": 9.475534664686423e-05, + "loss": 1.5034, + "step": 23641 + }, + { + "epoch": 1.86, + "learning_rate": 9.474385590844279e-05, + "loss": 1.5269, + "step": 23642 + }, + { + "epoch": 1.86, + "learning_rate": 9.473236554518005e-05, + "loss": 1.5017, + "step": 23643 + }, + { + "epoch": 1.86, + "learning_rate": 9.472087555715407e-05, + "loss": 1.5045, + "step": 23644 + }, + { + "epoch": 1.86, + "learning_rate": 9.470938594444279e-05, + "loss": 1.4714, + "step": 23645 + }, + { + "epoch": 1.86, + "learning_rate": 9.469789670712432e-05, + "loss": 1.4572, + "step": 23646 + }, + { + "epoch": 1.86, + "learning_rate": 9.468640784527657e-05, + "loss": 1.4937, + "step": 23647 + }, + { + "epoch": 1.86, + "learning_rate": 9.467491935897763e-05, + "loss": 1.4554, + "step": 23648 + }, + { + "epoch": 1.86, + "learning_rate": 9.466343124830546e-05, + "loss": 1.4765, + "step": 23649 + }, + { + "epoch": 1.86, + "learning_rate": 9.465194351333803e-05, + "loss": 1.4685, + "step": 23650 + }, + { + "epoch": 1.86, + "learning_rate": 9.464045615415338e-05, + "loss": 1.503, + "step": 23651 + }, + { + "epoch": 1.86, + "learning_rate": 9.462896917082948e-05, + "loss": 1.468, + "step": 23652 + }, + { + "epoch": 1.86, + "learning_rate": 9.46174825634443e-05, + "loss": 1.5024, + "step": 23653 + }, + { + "epoch": 1.86, + "learning_rate": 9.460599633207588e-05, + "loss": 1.5179, + "step": 23654 + }, + { + "epoch": 1.86, + "learning_rate": 9.459451047680216e-05, + "loss": 1.4898, + "step": 23655 + }, + { + "epoch": 1.86, + "learning_rate": 9.458302499770116e-05, + "loss": 1.4681, + "step": 23656 + }, + { + "epoch": 1.86, + "learning_rate": 9.45715398948508e-05, + "loss": 1.474, + "step": 23657 + }, + { + "epoch": 1.86, + "learning_rate": 9.456005516832911e-05, + "loss": 1.4729, + "step": 23658 + }, + { + "epoch": 1.86, + "learning_rate": 9.454857081821408e-05, + "loss": 1.5008, + "step": 23659 + }, + { + "epoch": 1.86, + "learning_rate": 9.453708684458361e-05, + "loss": 1.4698, + "step": 23660 + }, + { + "epoch": 1.86, + "learning_rate": 9.45256032475157e-05, + "loss": 1.5035, + "step": 23661 + }, + { + "epoch": 1.86, + "learning_rate": 9.451412002708835e-05, + "loss": 1.4384, + "step": 23662 + }, + { + "epoch": 1.86, + "learning_rate": 9.450263718337954e-05, + "loss": 1.4966, + "step": 23663 + }, + { + "epoch": 1.86, + "learning_rate": 9.449115471646718e-05, + "loss": 1.5169, + "step": 23664 + }, + { + "epoch": 1.86, + "learning_rate": 9.447967262642922e-05, + "loss": 1.4934, + "step": 23665 + }, + { + "epoch": 1.86, + "learning_rate": 9.44681909133437e-05, + "loss": 1.4796, + "step": 23666 + }, + { + "epoch": 1.86, + "learning_rate": 9.445670957728848e-05, + "loss": 1.4497, + "step": 23667 + }, + { + "epoch": 1.86, + "learning_rate": 9.444522861834158e-05, + "loss": 1.5203, + "step": 23668 + }, + { + "epoch": 1.86, + "learning_rate": 9.443374803658087e-05, + "loss": 1.5002, + "step": 23669 + }, + { + "epoch": 1.86, + "learning_rate": 9.442226783208438e-05, + "loss": 1.4514, + "step": 23670 + }, + { + "epoch": 1.86, + "learning_rate": 9.441078800493002e-05, + "loss": 1.4279, + "step": 23671 + }, + { + "epoch": 1.86, + "learning_rate": 9.439930855519572e-05, + "loss": 1.4601, + "step": 23672 + }, + { + "epoch": 1.86, + "learning_rate": 9.438782948295944e-05, + "loss": 1.5167, + "step": 23673 + }, + { + "epoch": 1.86, + "learning_rate": 9.437635078829914e-05, + "loss": 1.4628, + "step": 23674 + }, + { + "epoch": 1.86, + "learning_rate": 9.436487247129266e-05, + "loss": 1.483, + "step": 23675 + }, + { + "epoch": 1.86, + "learning_rate": 9.435339453201805e-05, + "loss": 1.4381, + "step": 23676 + }, + { + "epoch": 1.86, + "learning_rate": 9.434191697055309e-05, + "loss": 1.5191, + "step": 23677 + }, + { + "epoch": 1.86, + "learning_rate": 9.433043978697589e-05, + "loss": 1.4998, + "step": 23678 + }, + { + "epoch": 1.86, + "learning_rate": 9.431896298136425e-05, + "loss": 1.5158, + "step": 23679 + }, + { + "epoch": 1.86, + "learning_rate": 9.430748655379616e-05, + "loss": 1.5019, + "step": 23680 + }, + { + "epoch": 1.86, + "learning_rate": 9.429601050434946e-05, + "loss": 1.496, + "step": 23681 + }, + { + "epoch": 1.86, + "learning_rate": 9.428453483310212e-05, + "loss": 1.4946, + "step": 23682 + }, + { + "epoch": 1.86, + "learning_rate": 9.427305954013206e-05, + "loss": 1.48, + "step": 23683 + }, + { + "epoch": 1.86, + "learning_rate": 9.426158462551716e-05, + "loss": 1.4658, + "step": 23684 + }, + { + "epoch": 1.86, + "learning_rate": 9.425011008933531e-05, + "loss": 1.5141, + "step": 23685 + }, + { + "epoch": 1.86, + "learning_rate": 9.423863593166452e-05, + "loss": 1.4942, + "step": 23686 + }, + { + "epoch": 1.86, + "learning_rate": 9.422716215258256e-05, + "loss": 1.5162, + "step": 23687 + }, + { + "epoch": 1.86, + "learning_rate": 9.421568875216745e-05, + "loss": 1.5083, + "step": 23688 + }, + { + "epoch": 1.86, + "learning_rate": 9.420421573049696e-05, + "loss": 1.506, + "step": 23689 + }, + { + "epoch": 1.86, + "learning_rate": 9.419274308764907e-05, + "loss": 1.5304, + "step": 23690 + }, + { + "epoch": 1.86, + "learning_rate": 9.418127082370169e-05, + "loss": 1.4864, + "step": 23691 + }, + { + "epoch": 1.86, + "learning_rate": 9.416979893873262e-05, + "loss": 1.5016, + "step": 23692 + }, + { + "epoch": 1.86, + "learning_rate": 9.415832743281985e-05, + "loss": 1.5017, + "step": 23693 + }, + { + "epoch": 1.86, + "learning_rate": 9.41468563060412e-05, + "loss": 1.4913, + "step": 23694 + }, + { + "epoch": 1.86, + "learning_rate": 9.413538555847461e-05, + "loss": 1.4618, + "step": 23695 + }, + { + "epoch": 1.86, + "learning_rate": 9.41239151901979e-05, + "loss": 1.4556, + "step": 23696 + }, + { + "epoch": 1.86, + "learning_rate": 9.411244520128898e-05, + "loss": 1.4496, + "step": 23697 + }, + { + "epoch": 1.86, + "learning_rate": 9.41009755918257e-05, + "loss": 1.4804, + "step": 23698 + }, + { + "epoch": 1.86, + "learning_rate": 9.408950636188595e-05, + "loss": 1.5475, + "step": 23699 + }, + { + "epoch": 1.86, + "learning_rate": 9.407803751154762e-05, + "loss": 1.4681, + "step": 23700 + }, + { + "epoch": 1.86, + "learning_rate": 9.406656904088854e-05, + "loss": 1.4479, + "step": 23701 + }, + { + "epoch": 1.86, + "learning_rate": 9.405510094998658e-05, + "loss": 1.4703, + "step": 23702 + }, + { + "epoch": 1.86, + "learning_rate": 9.404363323891964e-05, + "loss": 1.4669, + "step": 23703 + }, + { + "epoch": 1.87, + "learning_rate": 9.403216590776554e-05, + "loss": 1.5315, + "step": 23704 + }, + { + "epoch": 1.87, + "learning_rate": 9.402069895660215e-05, + "loss": 1.4958, + "step": 23705 + }, + { + "epoch": 1.87, + "learning_rate": 9.40092323855073e-05, + "loss": 1.4878, + "step": 23706 + }, + { + "epoch": 1.87, + "learning_rate": 9.399776619455886e-05, + "loss": 1.5716, + "step": 23707 + }, + { + "epoch": 1.87, + "learning_rate": 9.398630038383466e-05, + "loss": 1.457, + "step": 23708 + }, + { + "epoch": 1.87, + "learning_rate": 9.397483495341263e-05, + "loss": 1.4601, + "step": 23709 + }, + { + "epoch": 1.87, + "learning_rate": 9.396336990337053e-05, + "loss": 1.464, + "step": 23710 + }, + { + "epoch": 1.87, + "learning_rate": 9.39519052337862e-05, + "loss": 1.4566, + "step": 23711 + }, + { + "epoch": 1.87, + "learning_rate": 9.394044094473756e-05, + "loss": 1.5046, + "step": 23712 + }, + { + "epoch": 1.87, + "learning_rate": 9.392897703630235e-05, + "loss": 1.5005, + "step": 23713 + }, + { + "epoch": 1.87, + "learning_rate": 9.391751350855843e-05, + "loss": 1.5003, + "step": 23714 + }, + { + "epoch": 1.87, + "learning_rate": 9.39060503615837e-05, + "loss": 1.4742, + "step": 23715 + }, + { + "epoch": 1.87, + "learning_rate": 9.38945875954559e-05, + "loss": 1.4918, + "step": 23716 + }, + { + "epoch": 1.87, + "learning_rate": 9.38831252102529e-05, + "loss": 1.4754, + "step": 23717 + }, + { + "epoch": 1.87, + "learning_rate": 9.387166320605249e-05, + "loss": 1.5211, + "step": 23718 + }, + { + "epoch": 1.87, + "learning_rate": 9.386020158293253e-05, + "loss": 1.4687, + "step": 23719 + }, + { + "epoch": 1.87, + "learning_rate": 9.384874034097083e-05, + "loss": 1.4933, + "step": 23720 + }, + { + "epoch": 1.87, + "learning_rate": 9.383727948024516e-05, + "loss": 1.5117, + "step": 23721 + }, + { + "epoch": 1.87, + "learning_rate": 9.38258190008334e-05, + "loss": 1.5352, + "step": 23722 + }, + { + "epoch": 1.87, + "learning_rate": 9.381435890281332e-05, + "loss": 1.5244, + "step": 23723 + }, + { + "epoch": 1.87, + "learning_rate": 9.38028991862627e-05, + "loss": 1.4292, + "step": 23724 + }, + { + "epoch": 1.87, + "learning_rate": 9.37914398512594e-05, + "loss": 1.4568, + "step": 23725 + }, + { + "epoch": 1.87, + "learning_rate": 9.377998089788126e-05, + "loss": 1.461, + "step": 23726 + }, + { + "epoch": 1.87, + "learning_rate": 9.376852232620597e-05, + "loss": 1.468, + "step": 23727 + }, + { + "epoch": 1.87, + "learning_rate": 9.37570641363114e-05, + "loss": 1.4589, + "step": 23728 + }, + { + "epoch": 1.87, + "learning_rate": 9.374560632827535e-05, + "loss": 1.4847, + "step": 23729 + }, + { + "epoch": 1.87, + "learning_rate": 9.373414890217554e-05, + "loss": 1.5068, + "step": 23730 + }, + { + "epoch": 1.87, + "learning_rate": 9.372269185808983e-05, + "loss": 1.4905, + "step": 23731 + }, + { + "epoch": 1.87, + "learning_rate": 9.371123519609602e-05, + "loss": 1.5539, + "step": 23732 + }, + { + "epoch": 1.87, + "learning_rate": 9.369977891627183e-05, + "loss": 1.496, + "step": 23733 + }, + { + "epoch": 1.87, + "learning_rate": 9.368832301869507e-05, + "loss": 1.4659, + "step": 23734 + }, + { + "epoch": 1.87, + "learning_rate": 9.367686750344354e-05, + "loss": 1.4869, + "step": 23735 + }, + { + "epoch": 1.87, + "learning_rate": 9.366541237059498e-05, + "loss": 1.4965, + "step": 23736 + }, + { + "epoch": 1.87, + "learning_rate": 9.365395762022721e-05, + "loss": 1.4868, + "step": 23737 + }, + { + "epoch": 1.87, + "learning_rate": 9.364250325241792e-05, + "loss": 1.5095, + "step": 23738 + }, + { + "epoch": 1.87, + "learning_rate": 9.3631049267245e-05, + "loss": 1.4701, + "step": 23739 + }, + { + "epoch": 1.87, + "learning_rate": 9.361959566478602e-05, + "loss": 1.4996, + "step": 23740 + }, + { + "epoch": 1.87, + "learning_rate": 9.360814244511899e-05, + "loss": 1.5192, + "step": 23741 + }, + { + "epoch": 1.87, + "learning_rate": 9.359668960832153e-05, + "loss": 1.5127, + "step": 23742 + }, + { + "epoch": 1.87, + "learning_rate": 9.35852371544714e-05, + "loss": 1.4697, + "step": 23743 + }, + { + "epoch": 1.87, + "learning_rate": 9.35737850836464e-05, + "loss": 1.5386, + "step": 23744 + }, + { + "epoch": 1.87, + "learning_rate": 9.356233339592425e-05, + "loss": 1.5076, + "step": 23745 + }, + { + "epoch": 1.87, + "learning_rate": 9.355088209138275e-05, + "loss": 1.5276, + "step": 23746 + }, + { + "epoch": 1.87, + "learning_rate": 9.353943117009957e-05, + "loss": 1.4573, + "step": 23747 + }, + { + "epoch": 1.87, + "learning_rate": 9.352798063215248e-05, + "loss": 1.4793, + "step": 23748 + }, + { + "epoch": 1.87, + "learning_rate": 9.351653047761929e-05, + "loss": 1.4331, + "step": 23749 + }, + { + "epoch": 1.87, + "learning_rate": 9.350508070657764e-05, + "loss": 1.5628, + "step": 23750 + }, + { + "epoch": 1.87, + "learning_rate": 9.349363131910534e-05, + "loss": 1.4968, + "step": 23751 + }, + { + "epoch": 1.87, + "learning_rate": 9.348218231528011e-05, + "loss": 1.5699, + "step": 23752 + }, + { + "epoch": 1.87, + "learning_rate": 9.347073369517963e-05, + "loss": 1.4692, + "step": 23753 + }, + { + "epoch": 1.87, + "learning_rate": 9.345928545888171e-05, + "loss": 1.4807, + "step": 23754 + }, + { + "epoch": 1.87, + "learning_rate": 9.3447837606464e-05, + "loss": 1.5306, + "step": 23755 + }, + { + "epoch": 1.87, + "learning_rate": 9.343639013800429e-05, + "loss": 1.4465, + "step": 23756 + }, + { + "epoch": 1.87, + "learning_rate": 9.342494305358026e-05, + "loss": 1.4665, + "step": 23757 + }, + { + "epoch": 1.87, + "learning_rate": 9.34134963532697e-05, + "loss": 1.4899, + "step": 23758 + }, + { + "epoch": 1.87, + "learning_rate": 9.340205003715022e-05, + "loss": 1.4399, + "step": 23759 + }, + { + "epoch": 1.87, + "learning_rate": 9.33906041052996e-05, + "loss": 1.4809, + "step": 23760 + }, + { + "epoch": 1.87, + "learning_rate": 9.337915855779556e-05, + "loss": 1.4921, + "step": 23761 + }, + { + "epoch": 1.87, + "learning_rate": 9.336771339471577e-05, + "loss": 1.4811, + "step": 23762 + }, + { + "epoch": 1.87, + "learning_rate": 9.335626861613798e-05, + "loss": 1.5417, + "step": 23763 + }, + { + "epoch": 1.87, + "learning_rate": 9.334482422213982e-05, + "loss": 1.4367, + "step": 23764 + }, + { + "epoch": 1.87, + "learning_rate": 9.333338021279905e-05, + "loss": 1.478, + "step": 23765 + }, + { + "epoch": 1.87, + "learning_rate": 9.332193658819338e-05, + "loss": 1.4487, + "step": 23766 + }, + { + "epoch": 1.87, + "learning_rate": 9.331049334840048e-05, + "loss": 1.4496, + "step": 23767 + }, + { + "epoch": 1.87, + "learning_rate": 9.329905049349802e-05, + "loss": 1.5131, + "step": 23768 + }, + { + "epoch": 1.87, + "learning_rate": 9.328760802356375e-05, + "loss": 1.4727, + "step": 23769 + }, + { + "epoch": 1.87, + "learning_rate": 9.327616593867532e-05, + "loss": 1.5027, + "step": 23770 + }, + { + "epoch": 1.87, + "learning_rate": 9.326472423891035e-05, + "loss": 1.5027, + "step": 23771 + }, + { + "epoch": 1.87, + "learning_rate": 9.325328292434665e-05, + "loss": 1.5356, + "step": 23772 + }, + { + "epoch": 1.87, + "learning_rate": 9.324184199506186e-05, + "loss": 1.5191, + "step": 23773 + }, + { + "epoch": 1.87, + "learning_rate": 9.323040145113362e-05, + "loss": 1.4605, + "step": 23774 + }, + { + "epoch": 1.87, + "learning_rate": 9.321896129263966e-05, + "loss": 1.4655, + "step": 23775 + }, + { + "epoch": 1.87, + "learning_rate": 9.32075215196576e-05, + "loss": 1.4509, + "step": 23776 + }, + { + "epoch": 1.87, + "learning_rate": 9.31960821322651e-05, + "loss": 1.484, + "step": 23777 + }, + { + "epoch": 1.87, + "learning_rate": 9.318464313053989e-05, + "loss": 1.4689, + "step": 23778 + }, + { + "epoch": 1.87, + "learning_rate": 9.317320451455958e-05, + "loss": 1.526, + "step": 23779 + }, + { + "epoch": 1.87, + "learning_rate": 9.316176628440188e-05, + "loss": 1.4229, + "step": 23780 + }, + { + "epoch": 1.87, + "learning_rate": 9.315032844014439e-05, + "loss": 1.4469, + "step": 23781 + }, + { + "epoch": 1.87, + "learning_rate": 9.31388909818648e-05, + "loss": 1.5076, + "step": 23782 + }, + { + "epoch": 1.87, + "learning_rate": 9.312745390964078e-05, + "loss": 1.4774, + "step": 23783 + }, + { + "epoch": 1.87, + "learning_rate": 9.311601722354996e-05, + "loss": 1.4736, + "step": 23784 + }, + { + "epoch": 1.87, + "learning_rate": 9.310458092366996e-05, + "loss": 1.4782, + "step": 23785 + }, + { + "epoch": 1.87, + "learning_rate": 9.30931450100785e-05, + "loss": 1.5026, + "step": 23786 + }, + { + "epoch": 1.87, + "learning_rate": 9.308170948285312e-05, + "loss": 1.4867, + "step": 23787 + }, + { + "epoch": 1.87, + "learning_rate": 9.307027434207156e-05, + "loss": 1.5132, + "step": 23788 + }, + { + "epoch": 1.87, + "learning_rate": 9.305883958781141e-05, + "loss": 1.5112, + "step": 23789 + }, + { + "epoch": 1.87, + "learning_rate": 9.304740522015035e-05, + "loss": 1.4623, + "step": 23790 + }, + { + "epoch": 1.87, + "learning_rate": 9.303597123916596e-05, + "loss": 1.4409, + "step": 23791 + }, + { + "epoch": 1.87, + "learning_rate": 9.30245376449359e-05, + "loss": 1.5075, + "step": 23792 + }, + { + "epoch": 1.87, + "learning_rate": 9.301310443753777e-05, + "loss": 1.5217, + "step": 23793 + }, + { + "epoch": 1.87, + "learning_rate": 9.300167161704922e-05, + "loss": 1.4766, + "step": 23794 + }, + { + "epoch": 1.87, + "learning_rate": 9.299023918354789e-05, + "loss": 1.5221, + "step": 23795 + }, + { + "epoch": 1.87, + "learning_rate": 9.297880713711134e-05, + "loss": 1.4978, + "step": 23796 + }, + { + "epoch": 1.87, + "learning_rate": 9.296737547781723e-05, + "loss": 1.4537, + "step": 23797 + }, + { + "epoch": 1.87, + "learning_rate": 9.295594420574321e-05, + "loss": 1.5163, + "step": 23798 + }, + { + "epoch": 1.87, + "learning_rate": 9.294451332096678e-05, + "loss": 1.5412, + "step": 23799 + }, + { + "epoch": 1.87, + "learning_rate": 9.293308282356567e-05, + "loss": 1.4259, + "step": 23800 + }, + { + "epoch": 1.87, + "learning_rate": 9.292165271361741e-05, + "loss": 1.4663, + "step": 23801 + }, + { + "epoch": 1.87, + "learning_rate": 9.29102229911996e-05, + "loss": 1.497, + "step": 23802 + }, + { + "epoch": 1.87, + "learning_rate": 9.289879365638989e-05, + "loss": 1.4627, + "step": 23803 + }, + { + "epoch": 1.87, + "learning_rate": 9.288736470926593e-05, + "loss": 1.4462, + "step": 23804 + }, + { + "epoch": 1.87, + "learning_rate": 9.287593614990516e-05, + "loss": 1.4496, + "step": 23805 + }, + { + "epoch": 1.87, + "learning_rate": 9.286450797838529e-05, + "loss": 1.479, + "step": 23806 + }, + { + "epoch": 1.87, + "learning_rate": 9.285308019478389e-05, + "loss": 1.501, + "step": 23807 + }, + { + "epoch": 1.87, + "learning_rate": 9.284165279917855e-05, + "loss": 1.4425, + "step": 23808 + }, + { + "epoch": 1.87, + "learning_rate": 9.283022579164684e-05, + "loss": 1.4799, + "step": 23809 + }, + { + "epoch": 1.87, + "learning_rate": 9.28187991722663e-05, + "loss": 1.4861, + "step": 23810 + }, + { + "epoch": 1.87, + "learning_rate": 9.28073729411146e-05, + "loss": 1.4645, + "step": 23811 + }, + { + "epoch": 1.87, + "learning_rate": 9.279594709826931e-05, + "loss": 1.4083, + "step": 23812 + }, + { + "epoch": 1.87, + "learning_rate": 9.278452164380791e-05, + "loss": 1.4579, + "step": 23813 + }, + { + "epoch": 1.87, + "learning_rate": 9.277309657780805e-05, + "loss": 1.4722, + "step": 23814 + }, + { + "epoch": 1.87, + "learning_rate": 9.27616719003473e-05, + "loss": 1.4563, + "step": 23815 + }, + { + "epoch": 1.87, + "learning_rate": 9.27502476115032e-05, + "loss": 1.4633, + "step": 23816 + }, + { + "epoch": 1.87, + "learning_rate": 9.273882371135335e-05, + "loss": 1.5143, + "step": 23817 + }, + { + "epoch": 1.87, + "learning_rate": 9.272740019997519e-05, + "loss": 1.4736, + "step": 23818 + }, + { + "epoch": 1.87, + "learning_rate": 9.27159770774465e-05, + "loss": 1.5386, + "step": 23819 + }, + { + "epoch": 1.87, + "learning_rate": 9.270455434384463e-05, + "loss": 1.4594, + "step": 23820 + }, + { + "epoch": 1.87, + "learning_rate": 9.269313199924728e-05, + "loss": 1.5193, + "step": 23821 + }, + { + "epoch": 1.87, + "learning_rate": 9.268171004373189e-05, + "loss": 1.4662, + "step": 23822 + }, + { + "epoch": 1.87, + "learning_rate": 9.267028847737608e-05, + "loss": 1.4491, + "step": 23823 + }, + { + "epoch": 1.87, + "learning_rate": 9.265886730025739e-05, + "loss": 1.5192, + "step": 23824 + }, + { + "epoch": 1.87, + "learning_rate": 9.264744651245334e-05, + "loss": 1.4667, + "step": 23825 + }, + { + "epoch": 1.87, + "learning_rate": 9.263602611404146e-05, + "loss": 1.4898, + "step": 23826 + }, + { + "epoch": 1.87, + "learning_rate": 9.262460610509932e-05, + "loss": 1.4932, + "step": 23827 + }, + { + "epoch": 1.87, + "learning_rate": 9.261318648570444e-05, + "loss": 1.4804, + "step": 23828 + }, + { + "epoch": 1.87, + "learning_rate": 9.260176725593438e-05, + "loss": 1.459, + "step": 23829 + }, + { + "epoch": 1.87, + "learning_rate": 9.259034841586661e-05, + "loss": 1.5337, + "step": 23830 + }, + { + "epoch": 1.88, + "learning_rate": 9.257892996557869e-05, + "loss": 1.4955, + "step": 23831 + }, + { + "epoch": 1.88, + "learning_rate": 9.256751190514818e-05, + "loss": 1.5221, + "step": 23832 + }, + { + "epoch": 1.88, + "learning_rate": 9.255609423465255e-05, + "loss": 1.4736, + "step": 23833 + }, + { + "epoch": 1.88, + "learning_rate": 9.254467695416929e-05, + "loss": 1.4622, + "step": 23834 + }, + { + "epoch": 1.88, + "learning_rate": 9.2533260063776e-05, + "loss": 1.4668, + "step": 23835 + }, + { + "epoch": 1.88, + "learning_rate": 9.252184356355021e-05, + "loss": 1.5239, + "step": 23836 + }, + { + "epoch": 1.88, + "learning_rate": 9.251042745356933e-05, + "loss": 1.4742, + "step": 23837 + }, + { + "epoch": 1.88, + "learning_rate": 9.249901173391099e-05, + "loss": 1.5122, + "step": 23838 + }, + { + "epoch": 1.88, + "learning_rate": 9.248759640465258e-05, + "loss": 1.4742, + "step": 23839 + }, + { + "epoch": 1.88, + "learning_rate": 9.247618146587164e-05, + "loss": 1.5387, + "step": 23840 + }, + { + "epoch": 1.88, + "learning_rate": 9.246476691764571e-05, + "loss": 1.4543, + "step": 23841 + }, + { + "epoch": 1.88, + "learning_rate": 9.245335276005224e-05, + "loss": 1.4745, + "step": 23842 + }, + { + "epoch": 1.88, + "learning_rate": 9.244193899316876e-05, + "loss": 1.4979, + "step": 23843 + }, + { + "epoch": 1.88, + "learning_rate": 9.243052561707277e-05, + "loss": 1.4632, + "step": 23844 + }, + { + "epoch": 1.88, + "learning_rate": 9.24191126318417e-05, + "loss": 1.5334, + "step": 23845 + }, + { + "epoch": 1.88, + "learning_rate": 9.240770003755312e-05, + "loss": 1.4532, + "step": 23846 + }, + { + "epoch": 1.88, + "learning_rate": 9.239628783428446e-05, + "loss": 1.4758, + "step": 23847 + }, + { + "epoch": 1.88, + "learning_rate": 9.23848760221132e-05, + "loss": 1.5103, + "step": 23848 + }, + { + "epoch": 1.88, + "learning_rate": 9.237346460111687e-05, + "loss": 1.4991, + "step": 23849 + }, + { + "epoch": 1.88, + "learning_rate": 9.236205357137286e-05, + "loss": 1.4902, + "step": 23850 + }, + { + "epoch": 1.88, + "learning_rate": 9.235064293295871e-05, + "loss": 1.457, + "step": 23851 + }, + { + "epoch": 1.88, + "learning_rate": 9.233923268595191e-05, + "loss": 1.4968, + "step": 23852 + }, + { + "epoch": 1.88, + "learning_rate": 9.232782283042992e-05, + "loss": 1.4332, + "step": 23853 + }, + { + "epoch": 1.88, + "learning_rate": 9.231641336647014e-05, + "loss": 1.484, + "step": 23854 + }, + { + "epoch": 1.88, + "learning_rate": 9.230500429415008e-05, + "loss": 1.4599, + "step": 23855 + }, + { + "epoch": 1.88, + "learning_rate": 9.229359561354726e-05, + "loss": 1.4621, + "step": 23856 + }, + { + "epoch": 1.88, + "learning_rate": 9.228218732473904e-05, + "loss": 1.4847, + "step": 23857 + }, + { + "epoch": 1.88, + "learning_rate": 9.227077942780295e-05, + "loss": 1.4436, + "step": 23858 + }, + { + "epoch": 1.88, + "learning_rate": 9.225937192281636e-05, + "loss": 1.4831, + "step": 23859 + }, + { + "epoch": 1.88, + "learning_rate": 9.224796480985678e-05, + "loss": 1.5593, + "step": 23860 + }, + { + "epoch": 1.88, + "learning_rate": 9.223655808900169e-05, + "loss": 1.5644, + "step": 23861 + }, + { + "epoch": 1.88, + "learning_rate": 9.222515176032846e-05, + "loss": 1.5173, + "step": 23862 + }, + { + "epoch": 1.88, + "learning_rate": 9.22137458239146e-05, + "loss": 1.4468, + "step": 23863 + }, + { + "epoch": 1.88, + "learning_rate": 9.220234027983748e-05, + "loss": 1.4944, + "step": 23864 + }, + { + "epoch": 1.88, + "learning_rate": 9.219093512817453e-05, + "loss": 1.4428, + "step": 23865 + }, + { + "epoch": 1.88, + "learning_rate": 9.217953036900327e-05, + "loss": 1.5095, + "step": 23866 + }, + { + "epoch": 1.88, + "learning_rate": 9.21681260024011e-05, + "loss": 1.47, + "step": 23867 + }, + { + "epoch": 1.88, + "learning_rate": 9.215672202844547e-05, + "loss": 1.4878, + "step": 23868 + }, + { + "epoch": 1.88, + "learning_rate": 9.214531844721373e-05, + "loss": 1.4404, + "step": 23869 + }, + { + "epoch": 1.88, + "learning_rate": 9.21339152587834e-05, + "loss": 1.5205, + "step": 23870 + }, + { + "epoch": 1.88, + "learning_rate": 9.212251246323181e-05, + "loss": 1.4825, + "step": 23871 + }, + { + "epoch": 1.88, + "learning_rate": 9.211111006063641e-05, + "loss": 1.4892, + "step": 23872 + }, + { + "epoch": 1.88, + "learning_rate": 9.20997080510747e-05, + "loss": 1.495, + "step": 23873 + }, + { + "epoch": 1.88, + "learning_rate": 9.208830643462395e-05, + "loss": 1.5124, + "step": 23874 + }, + { + "epoch": 1.88, + "learning_rate": 9.207690521136168e-05, + "loss": 1.4798, + "step": 23875 + }, + { + "epoch": 1.88, + "learning_rate": 9.206550438136524e-05, + "loss": 1.5016, + "step": 23876 + }, + { + "epoch": 1.88, + "learning_rate": 9.205410394471205e-05, + "loss": 1.5329, + "step": 23877 + }, + { + "epoch": 1.88, + "learning_rate": 9.204270390147953e-05, + "loss": 1.5119, + "step": 23878 + }, + { + "epoch": 1.88, + "learning_rate": 9.203130425174505e-05, + "loss": 1.5135, + "step": 23879 + }, + { + "epoch": 1.88, + "learning_rate": 9.201990499558604e-05, + "loss": 1.4969, + "step": 23880 + }, + { + "epoch": 1.88, + "learning_rate": 9.200850613307981e-05, + "loss": 1.4691, + "step": 23881 + }, + { + "epoch": 1.88, + "learning_rate": 9.199710766430393e-05, + "loss": 1.4822, + "step": 23882 + }, + { + "epoch": 1.88, + "learning_rate": 9.198570958933561e-05, + "loss": 1.5163, + "step": 23883 + }, + { + "epoch": 1.88, + "learning_rate": 9.197431190825234e-05, + "loss": 1.5059, + "step": 23884 + }, + { + "epoch": 1.88, + "learning_rate": 9.196291462113146e-05, + "loss": 1.4289, + "step": 23885 + }, + { + "epoch": 1.88, + "learning_rate": 9.195151772805036e-05, + "loss": 1.5112, + "step": 23886 + }, + { + "epoch": 1.88, + "learning_rate": 9.194012122908647e-05, + "loss": 1.4121, + "step": 23887 + }, + { + "epoch": 1.88, + "learning_rate": 9.192872512431704e-05, + "loss": 1.5058, + "step": 23888 + }, + { + "epoch": 1.88, + "learning_rate": 9.191732941381957e-05, + "loss": 1.4845, + "step": 23889 + }, + { + "epoch": 1.88, + "learning_rate": 9.190593409767137e-05, + "loss": 1.538, + "step": 23890 + }, + { + "epoch": 1.88, + "learning_rate": 9.189453917594982e-05, + "loss": 1.4666, + "step": 23891 + }, + { + "epoch": 1.88, + "learning_rate": 9.188314464873227e-05, + "loss": 1.4324, + "step": 23892 + }, + { + "epoch": 1.88, + "learning_rate": 9.187175051609609e-05, + "loss": 1.4943, + "step": 23893 + }, + { + "epoch": 1.88, + "learning_rate": 9.186035677811865e-05, + "loss": 1.4852, + "step": 23894 + }, + { + "epoch": 1.88, + "learning_rate": 9.184896343487733e-05, + "loss": 1.4973, + "step": 23895 + }, + { + "epoch": 1.88, + "learning_rate": 9.183757048644943e-05, + "loss": 1.476, + "step": 23896 + }, + { + "epoch": 1.88, + "learning_rate": 9.182617793291231e-05, + "loss": 1.556, + "step": 23897 + }, + { + "epoch": 1.88, + "learning_rate": 9.181478577434336e-05, + "loss": 1.504, + "step": 23898 + }, + { + "epoch": 1.88, + "learning_rate": 9.180339401081993e-05, + "loss": 1.4643, + "step": 23899 + }, + { + "epoch": 1.88, + "learning_rate": 9.17920026424193e-05, + "loss": 1.4244, + "step": 23900 + }, + { + "epoch": 1.88, + "learning_rate": 9.178061166921889e-05, + "loss": 1.4973, + "step": 23901 + }, + { + "epoch": 1.88, + "learning_rate": 9.176922109129597e-05, + "loss": 1.4411, + "step": 23902 + }, + { + "epoch": 1.88, + "learning_rate": 9.175783090872791e-05, + "loss": 1.5305, + "step": 23903 + }, + { + "epoch": 1.88, + "learning_rate": 9.174644112159208e-05, + "loss": 1.5078, + "step": 23904 + }, + { + "epoch": 1.88, + "learning_rate": 9.173505172996573e-05, + "loss": 1.4977, + "step": 23905 + }, + { + "epoch": 1.88, + "learning_rate": 9.172366273392621e-05, + "loss": 1.5094, + "step": 23906 + }, + { + "epoch": 1.88, + "learning_rate": 9.17122741335509e-05, + "loss": 1.4453, + "step": 23907 + }, + { + "epoch": 1.88, + "learning_rate": 9.170088592891704e-05, + "loss": 1.5058, + "step": 23908 + }, + { + "epoch": 1.88, + "learning_rate": 9.1689498120102e-05, + "loss": 1.536, + "step": 23909 + }, + { + "epoch": 1.88, + "learning_rate": 9.167811070718312e-05, + "loss": 1.5331, + "step": 23910 + }, + { + "epoch": 1.88, + "learning_rate": 9.166672369023766e-05, + "loss": 1.4465, + "step": 23911 + }, + { + "epoch": 1.88, + "learning_rate": 9.165533706934293e-05, + "loss": 1.4734, + "step": 23912 + }, + { + "epoch": 1.88, + "learning_rate": 9.164395084457628e-05, + "loss": 1.4782, + "step": 23913 + }, + { + "epoch": 1.88, + "learning_rate": 9.163256501601503e-05, + "loss": 1.5023, + "step": 23914 + }, + { + "epoch": 1.88, + "learning_rate": 9.162117958373643e-05, + "loss": 1.4937, + "step": 23915 + }, + { + "epoch": 1.88, + "learning_rate": 9.160979454781782e-05, + "loss": 1.4907, + "step": 23916 + }, + { + "epoch": 1.88, + "learning_rate": 9.15984099083365e-05, + "loss": 1.4839, + "step": 23917 + }, + { + "epoch": 1.88, + "learning_rate": 9.15870256653697e-05, + "loss": 1.5095, + "step": 23918 + }, + { + "epoch": 1.88, + "learning_rate": 9.15756418189948e-05, + "loss": 1.4809, + "step": 23919 + }, + { + "epoch": 1.88, + "learning_rate": 9.156425836928902e-05, + "loss": 1.4629, + "step": 23920 + }, + { + "epoch": 1.88, + "learning_rate": 9.155287531632972e-05, + "loss": 1.4828, + "step": 23921 + }, + { + "epoch": 1.88, + "learning_rate": 9.15414926601941e-05, + "loss": 1.5247, + "step": 23922 + }, + { + "epoch": 1.88, + "learning_rate": 9.153011040095949e-05, + "loss": 1.4758, + "step": 23923 + }, + { + "epoch": 1.88, + "learning_rate": 9.151872853870319e-05, + "loss": 1.475, + "step": 23924 + }, + { + "epoch": 1.88, + "learning_rate": 9.150734707350243e-05, + "loss": 1.5095, + "step": 23925 + }, + { + "epoch": 1.88, + "learning_rate": 9.14959660054345e-05, + "loss": 1.507, + "step": 23926 + }, + { + "epoch": 1.88, + "learning_rate": 9.148458533457671e-05, + "loss": 1.4804, + "step": 23927 + }, + { + "epoch": 1.88, + "learning_rate": 9.147320506100624e-05, + "loss": 1.4402, + "step": 23928 + }, + { + "epoch": 1.88, + "learning_rate": 9.146182518480041e-05, + "loss": 1.4994, + "step": 23929 + }, + { + "epoch": 1.88, + "learning_rate": 9.145044570603652e-05, + "loss": 1.4882, + "step": 23930 + }, + { + "epoch": 1.88, + "learning_rate": 9.143906662479179e-05, + "loss": 1.5402, + "step": 23931 + }, + { + "epoch": 1.88, + "learning_rate": 9.142768794114348e-05, + "loss": 1.473, + "step": 23932 + }, + { + "epoch": 1.88, + "learning_rate": 9.141630965516886e-05, + "loss": 1.4819, + "step": 23933 + }, + { + "epoch": 1.88, + "learning_rate": 9.140493176694514e-05, + "loss": 1.5005, + "step": 23934 + }, + { + "epoch": 1.88, + "learning_rate": 9.13935542765496e-05, + "loss": 1.533, + "step": 23935 + }, + { + "epoch": 1.88, + "learning_rate": 9.138217718405953e-05, + "loss": 1.4831, + "step": 23936 + }, + { + "epoch": 1.88, + "learning_rate": 9.137080048955206e-05, + "loss": 1.489, + "step": 23937 + }, + { + "epoch": 1.88, + "learning_rate": 9.135942419310453e-05, + "loss": 1.5341, + "step": 23938 + }, + { + "epoch": 1.88, + "learning_rate": 9.134804829479417e-05, + "loss": 1.4614, + "step": 23939 + }, + { + "epoch": 1.88, + "learning_rate": 9.133667279469819e-05, + "loss": 1.4967, + "step": 23940 + }, + { + "epoch": 1.88, + "learning_rate": 9.132529769289382e-05, + "loss": 1.4846, + "step": 23941 + }, + { + "epoch": 1.88, + "learning_rate": 9.131392298945827e-05, + "loss": 1.4762, + "step": 23942 + }, + { + "epoch": 1.88, + "learning_rate": 9.130254868446883e-05, + "loss": 1.5195, + "step": 23943 + }, + { + "epoch": 1.88, + "learning_rate": 9.129117477800264e-05, + "loss": 1.5096, + "step": 23944 + }, + { + "epoch": 1.88, + "learning_rate": 9.127980127013704e-05, + "loss": 1.5297, + "step": 23945 + }, + { + "epoch": 1.88, + "learning_rate": 9.126842816094915e-05, + "loss": 1.4609, + "step": 23946 + }, + { + "epoch": 1.88, + "learning_rate": 9.125705545051622e-05, + "loss": 1.4828, + "step": 23947 + }, + { + "epoch": 1.88, + "learning_rate": 9.124568313891552e-05, + "loss": 1.4889, + "step": 23948 + }, + { + "epoch": 1.88, + "learning_rate": 9.123431122622416e-05, + "loss": 1.4879, + "step": 23949 + }, + { + "epoch": 1.88, + "learning_rate": 9.12229397125194e-05, + "loss": 1.4758, + "step": 23950 + }, + { + "epoch": 1.88, + "learning_rate": 9.121156859787848e-05, + "loss": 1.4925, + "step": 23951 + }, + { + "epoch": 1.88, + "learning_rate": 9.120019788237853e-05, + "loss": 1.4751, + "step": 23952 + }, + { + "epoch": 1.88, + "learning_rate": 9.118882756609681e-05, + "loss": 1.491, + "step": 23953 + }, + { + "epoch": 1.88, + "learning_rate": 9.117745764911049e-05, + "loss": 1.4986, + "step": 23954 + }, + { + "epoch": 1.88, + "learning_rate": 9.116608813149674e-05, + "loss": 1.4934, + "step": 23955 + }, + { + "epoch": 1.88, + "learning_rate": 9.115471901333284e-05, + "loss": 1.4749, + "step": 23956 + }, + { + "epoch": 1.88, + "learning_rate": 9.114335029469588e-05, + "loss": 1.5112, + "step": 23957 + }, + { + "epoch": 1.89, + "learning_rate": 9.113198197566312e-05, + "loss": 1.4979, + "step": 23958 + }, + { + "epoch": 1.89, + "learning_rate": 9.11206140563117e-05, + "loss": 1.4843, + "step": 23959 + }, + { + "epoch": 1.89, + "learning_rate": 9.110924653671879e-05, + "loss": 1.484, + "step": 23960 + }, + { + "epoch": 1.89, + "learning_rate": 9.10978794169616e-05, + "loss": 1.4861, + "step": 23961 + }, + { + "epoch": 1.89, + "learning_rate": 9.108651269711735e-05, + "loss": 1.5132, + "step": 23962 + }, + { + "epoch": 1.89, + "learning_rate": 9.107514637726315e-05, + "loss": 1.4995, + "step": 23963 + }, + { + "epoch": 1.89, + "learning_rate": 9.106378045747617e-05, + "loss": 1.5152, + "step": 23964 + }, + { + "epoch": 1.89, + "learning_rate": 9.105241493783363e-05, + "loss": 1.4364, + "step": 23965 + }, + { + "epoch": 1.89, + "learning_rate": 9.104104981841266e-05, + "loss": 1.511, + "step": 23966 + }, + { + "epoch": 1.89, + "learning_rate": 9.102968509929038e-05, + "loss": 1.4797, + "step": 23967 + }, + { + "epoch": 1.89, + "learning_rate": 9.101832078054406e-05, + "loss": 1.4761, + "step": 23968 + }, + { + "epoch": 1.89, + "learning_rate": 9.100695686225075e-05, + "loss": 1.5036, + "step": 23969 + }, + { + "epoch": 1.89, + "learning_rate": 9.099559334448767e-05, + "loss": 1.4583, + "step": 23970 + }, + { + "epoch": 1.89, + "learning_rate": 9.098423022733194e-05, + "loss": 1.5036, + "step": 23971 + }, + { + "epoch": 1.89, + "learning_rate": 9.097286751086071e-05, + "loss": 1.5441, + "step": 23972 + }, + { + "epoch": 1.89, + "learning_rate": 9.096150519515117e-05, + "loss": 1.5074, + "step": 23973 + }, + { + "epoch": 1.89, + "learning_rate": 9.09501432802804e-05, + "loss": 1.5034, + "step": 23974 + }, + { + "epoch": 1.89, + "learning_rate": 9.093878176632553e-05, + "loss": 1.4477, + "step": 23975 + }, + { + "epoch": 1.89, + "learning_rate": 9.092742065336376e-05, + "loss": 1.4769, + "step": 23976 + }, + { + "epoch": 1.89, + "learning_rate": 9.091605994147226e-05, + "loss": 1.5192, + "step": 23977 + }, + { + "epoch": 1.89, + "learning_rate": 9.090469963072806e-05, + "loss": 1.4702, + "step": 23978 + }, + { + "epoch": 1.89, + "learning_rate": 9.089333972120836e-05, + "loss": 1.4311, + "step": 23979 + }, + { + "epoch": 1.89, + "learning_rate": 9.088198021299026e-05, + "loss": 1.5035, + "step": 23980 + }, + { + "epoch": 1.89, + "learning_rate": 9.087062110615089e-05, + "loss": 1.518, + "step": 23981 + }, + { + "epoch": 1.89, + "learning_rate": 9.085926240076738e-05, + "loss": 1.4625, + "step": 23982 + }, + { + "epoch": 1.89, + "learning_rate": 9.084790409691684e-05, + "loss": 1.51, + "step": 23983 + }, + { + "epoch": 1.89, + "learning_rate": 9.083654619467637e-05, + "loss": 1.4675, + "step": 23984 + }, + { + "epoch": 1.89, + "learning_rate": 9.082518869412314e-05, + "loss": 1.4465, + "step": 23985 + }, + { + "epoch": 1.89, + "learning_rate": 9.081383159533419e-05, + "loss": 1.4992, + "step": 23986 + }, + { + "epoch": 1.89, + "learning_rate": 9.080247489838668e-05, + "loss": 1.4512, + "step": 23987 + }, + { + "epoch": 1.89, + "learning_rate": 9.079111860335769e-05, + "loss": 1.4538, + "step": 23988 + }, + { + "epoch": 1.89, + "learning_rate": 9.077976271032431e-05, + "loss": 1.5056, + "step": 23989 + }, + { + "epoch": 1.89, + "learning_rate": 9.076840721936371e-05, + "loss": 1.4619, + "step": 23990 + }, + { + "epoch": 1.89, + "learning_rate": 9.075705213055286e-05, + "loss": 1.4871, + "step": 23991 + }, + { + "epoch": 1.89, + "learning_rate": 9.074569744396896e-05, + "loss": 1.4958, + "step": 23992 + }, + { + "epoch": 1.89, + "learning_rate": 9.07343431596891e-05, + "loss": 1.4515, + "step": 23993 + }, + { + "epoch": 1.89, + "learning_rate": 9.072298927779036e-05, + "loss": 1.4322, + "step": 23994 + }, + { + "epoch": 1.89, + "learning_rate": 9.071163579834977e-05, + "loss": 1.4871, + "step": 23995 + }, + { + "epoch": 1.89, + "learning_rate": 9.070028272144448e-05, + "loss": 1.4984, + "step": 23996 + }, + { + "epoch": 1.89, + "learning_rate": 9.068893004715155e-05, + "loss": 1.4409, + "step": 23997 + }, + { + "epoch": 1.89, + "learning_rate": 9.067757777554805e-05, + "loss": 1.4564, + "step": 23998 + }, + { + "epoch": 1.89, + "learning_rate": 9.066622590671108e-05, + "loss": 1.4936, + "step": 23999 + }, + { + "epoch": 1.89, + "learning_rate": 9.065487444071766e-05, + "loss": 1.4891, + "step": 24000 + }, + { + "epoch": 1.89, + "learning_rate": 9.064352337764487e-05, + "loss": 1.5119, + "step": 24001 + }, + { + "epoch": 1.89, + "learning_rate": 9.063217271756986e-05, + "loss": 1.4685, + "step": 24002 + }, + { + "epoch": 1.89, + "learning_rate": 9.062082246056962e-05, + "loss": 1.4967, + "step": 24003 + }, + { + "epoch": 1.89, + "learning_rate": 9.060947260672123e-05, + "loss": 1.5252, + "step": 24004 + }, + { + "epoch": 1.89, + "learning_rate": 9.05981231561017e-05, + "loss": 1.473, + "step": 24005 + }, + { + "epoch": 1.89, + "learning_rate": 9.058677410878818e-05, + "loss": 1.4425, + "step": 24006 + }, + { + "epoch": 1.89, + "learning_rate": 9.057542546485762e-05, + "loss": 1.5045, + "step": 24007 + }, + { + "epoch": 1.89, + "learning_rate": 9.056407722438716e-05, + "loss": 1.4706, + "step": 24008 + }, + { + "epoch": 1.89, + "learning_rate": 9.055272938745385e-05, + "loss": 1.4383, + "step": 24009 + }, + { + "epoch": 1.89, + "learning_rate": 9.054138195413467e-05, + "loss": 1.497, + "step": 24010 + }, + { + "epoch": 1.89, + "learning_rate": 9.053003492450672e-05, + "loss": 1.5409, + "step": 24011 + }, + { + "epoch": 1.89, + "learning_rate": 9.051868829864698e-05, + "loss": 1.4933, + "step": 24012 + }, + { + "epoch": 1.89, + "learning_rate": 9.050734207663253e-05, + "loss": 1.5171, + "step": 24013 + }, + { + "epoch": 1.89, + "learning_rate": 9.049599625854043e-05, + "loss": 1.5332, + "step": 24014 + }, + { + "epoch": 1.89, + "learning_rate": 9.048465084444765e-05, + "loss": 1.4475, + "step": 24015 + }, + { + "epoch": 1.89, + "learning_rate": 9.047330583443127e-05, + "loss": 1.4653, + "step": 24016 + }, + { + "epoch": 1.89, + "learning_rate": 9.046196122856827e-05, + "loss": 1.4629, + "step": 24017 + }, + { + "epoch": 1.89, + "learning_rate": 9.04506170269357e-05, + "loss": 1.4827, + "step": 24018 + }, + { + "epoch": 1.89, + "learning_rate": 9.043927322961059e-05, + "loss": 1.4931, + "step": 24019 + }, + { + "epoch": 1.89, + "learning_rate": 9.042792983666993e-05, + "loss": 1.4209, + "step": 24020 + }, + { + "epoch": 1.89, + "learning_rate": 9.041658684819074e-05, + "loss": 1.516, + "step": 24021 + }, + { + "epoch": 1.89, + "learning_rate": 9.040524426425003e-05, + "loss": 1.476, + "step": 24022 + }, + { + "epoch": 1.89, + "learning_rate": 9.039390208492488e-05, + "loss": 1.4628, + "step": 24023 + }, + { + "epoch": 1.89, + "learning_rate": 9.038256031029221e-05, + "loss": 1.4772, + "step": 24024 + }, + { + "epoch": 1.89, + "learning_rate": 9.037121894042905e-05, + "loss": 1.4913, + "step": 24025 + }, + { + "epoch": 1.89, + "learning_rate": 9.035987797541246e-05, + "loss": 1.5127, + "step": 24026 + }, + { + "epoch": 1.89, + "learning_rate": 9.034853741531933e-05, + "loss": 1.5762, + "step": 24027 + }, + { + "epoch": 1.89, + "learning_rate": 9.033719726022676e-05, + "loss": 1.4936, + "step": 24028 + }, + { + "epoch": 1.89, + "learning_rate": 9.032585751021166e-05, + "loss": 1.4939, + "step": 24029 + }, + { + "epoch": 1.89, + "learning_rate": 9.031451816535106e-05, + "loss": 1.4577, + "step": 24030 + }, + { + "epoch": 1.89, + "learning_rate": 9.030317922572196e-05, + "loss": 1.5092, + "step": 24031 + }, + { + "epoch": 1.89, + "learning_rate": 9.029184069140131e-05, + "loss": 1.4612, + "step": 24032 + }, + { + "epoch": 1.89, + "learning_rate": 9.028050256246615e-05, + "loss": 1.5588, + "step": 24033 + }, + { + "epoch": 1.89, + "learning_rate": 9.026916483899338e-05, + "loss": 1.4946, + "step": 24034 + }, + { + "epoch": 1.89, + "learning_rate": 9.025782752106002e-05, + "loss": 1.4503, + "step": 24035 + }, + { + "epoch": 1.89, + "learning_rate": 9.024649060874309e-05, + "loss": 1.4781, + "step": 24036 + }, + { + "epoch": 1.89, + "learning_rate": 9.023515410211944e-05, + "loss": 1.4777, + "step": 24037 + }, + { + "epoch": 1.89, + "learning_rate": 9.022381800126612e-05, + "loss": 1.5185, + "step": 24038 + }, + { + "epoch": 1.89, + "learning_rate": 9.021248230626013e-05, + "loss": 1.445, + "step": 24039 + }, + { + "epoch": 1.89, + "learning_rate": 9.020114701717839e-05, + "loss": 1.4879, + "step": 24040 + }, + { + "epoch": 1.89, + "learning_rate": 9.018981213409785e-05, + "loss": 1.4154, + "step": 24041 + }, + { + "epoch": 1.89, + "learning_rate": 9.017847765709545e-05, + "loss": 1.4389, + "step": 24042 + }, + { + "epoch": 1.89, + "learning_rate": 9.016714358624824e-05, + "loss": 1.5091, + "step": 24043 + }, + { + "epoch": 1.89, + "learning_rate": 9.015580992163306e-05, + "loss": 1.4793, + "step": 24044 + }, + { + "epoch": 1.89, + "learning_rate": 9.014447666332694e-05, + "loss": 1.4628, + "step": 24045 + }, + { + "epoch": 1.89, + "learning_rate": 9.013314381140677e-05, + "loss": 1.4901, + "step": 24046 + }, + { + "epoch": 1.89, + "learning_rate": 9.01218113659495e-05, + "loss": 1.4701, + "step": 24047 + }, + { + "epoch": 1.89, + "learning_rate": 9.011047932703213e-05, + "loss": 1.5002, + "step": 24048 + }, + { + "epoch": 1.89, + "learning_rate": 9.009914769473153e-05, + "loss": 1.5172, + "step": 24049 + }, + { + "epoch": 1.89, + "learning_rate": 9.008781646912466e-05, + "loss": 1.4886, + "step": 24050 + }, + { + "epoch": 1.89, + "learning_rate": 9.007648565028845e-05, + "loss": 1.4519, + "step": 24051 + }, + { + "epoch": 1.89, + "learning_rate": 9.006515523829985e-05, + "loss": 1.4335, + "step": 24052 + }, + { + "epoch": 1.89, + "learning_rate": 9.005382523323576e-05, + "loss": 1.5332, + "step": 24053 + }, + { + "epoch": 1.89, + "learning_rate": 9.004249563517306e-05, + "loss": 1.5175, + "step": 24054 + }, + { + "epoch": 1.89, + "learning_rate": 9.00311664441888e-05, + "loss": 1.4868, + "step": 24055 + }, + { + "epoch": 1.89, + "learning_rate": 9.001983766035981e-05, + "loss": 1.5179, + "step": 24056 + }, + { + "epoch": 1.89, + "learning_rate": 9.000850928376304e-05, + "loss": 1.4798, + "step": 24057 + }, + { + "epoch": 1.89, + "learning_rate": 8.999718131447536e-05, + "loss": 1.4414, + "step": 24058 + }, + { + "epoch": 1.89, + "learning_rate": 8.998585375257371e-05, + "loss": 1.5221, + "step": 24059 + }, + { + "epoch": 1.89, + "learning_rate": 8.997452659813501e-05, + "loss": 1.5341, + "step": 24060 + }, + { + "epoch": 1.89, + "learning_rate": 8.996319985123612e-05, + "loss": 1.4804, + "step": 24061 + }, + { + "epoch": 1.89, + "learning_rate": 8.995187351195399e-05, + "loss": 1.4423, + "step": 24062 + }, + { + "epoch": 1.89, + "learning_rate": 8.994054758036553e-05, + "loss": 1.4869, + "step": 24063 + }, + { + "epoch": 1.89, + "learning_rate": 8.992922205654757e-05, + "loss": 1.4883, + "step": 24064 + }, + { + "epoch": 1.89, + "learning_rate": 8.991789694057707e-05, + "loss": 1.5262, + "step": 24065 + }, + { + "epoch": 1.89, + "learning_rate": 8.990657223253088e-05, + "loss": 1.5153, + "step": 24066 + }, + { + "epoch": 1.89, + "learning_rate": 8.98952479324859e-05, + "loss": 1.4889, + "step": 24067 + }, + { + "epoch": 1.89, + "learning_rate": 8.988392404051902e-05, + "loss": 1.5229, + "step": 24068 + }, + { + "epoch": 1.89, + "learning_rate": 8.987260055670712e-05, + "loss": 1.4873, + "step": 24069 + }, + { + "epoch": 1.89, + "learning_rate": 8.986127748112704e-05, + "loss": 1.4684, + "step": 24070 + }, + { + "epoch": 1.89, + "learning_rate": 8.984995481385573e-05, + "loss": 1.4908, + "step": 24071 + }, + { + "epoch": 1.89, + "learning_rate": 8.983863255497005e-05, + "loss": 1.4888, + "step": 24072 + }, + { + "epoch": 1.89, + "learning_rate": 8.982731070454684e-05, + "loss": 1.4786, + "step": 24073 + }, + { + "epoch": 1.89, + "learning_rate": 8.981598926266302e-05, + "loss": 1.4742, + "step": 24074 + }, + { + "epoch": 1.89, + "learning_rate": 8.980466822939537e-05, + "loss": 1.4877, + "step": 24075 + }, + { + "epoch": 1.89, + "learning_rate": 8.979334760482082e-05, + "loss": 1.4301, + "step": 24076 + }, + { + "epoch": 1.89, + "learning_rate": 8.978202738901624e-05, + "loss": 1.4516, + "step": 24077 + }, + { + "epoch": 1.89, + "learning_rate": 8.977070758205845e-05, + "loss": 1.471, + "step": 24078 + }, + { + "epoch": 1.89, + "learning_rate": 8.975938818402428e-05, + "loss": 1.4707, + "step": 24079 + }, + { + "epoch": 1.89, + "learning_rate": 8.974806919499069e-05, + "loss": 1.4295, + "step": 24080 + }, + { + "epoch": 1.89, + "learning_rate": 8.97367506150344e-05, + "loss": 1.4508, + "step": 24081 + }, + { + "epoch": 1.89, + "learning_rate": 8.972543244423236e-05, + "loss": 1.4577, + "step": 24082 + }, + { + "epoch": 1.89, + "learning_rate": 8.971411468266136e-05, + "loss": 1.4563, + "step": 24083 + }, + { + "epoch": 1.89, + "learning_rate": 8.970279733039823e-05, + "loss": 1.4694, + "step": 24084 + }, + { + "epoch": 1.9, + "learning_rate": 8.969148038751981e-05, + "loss": 1.4914, + "step": 24085 + }, + { + "epoch": 1.9, + "learning_rate": 8.968016385410301e-05, + "loss": 1.5038, + "step": 24086 + }, + { + "epoch": 1.9, + "learning_rate": 8.966884773022458e-05, + "loss": 1.4647, + "step": 24087 + }, + { + "epoch": 1.9, + "learning_rate": 8.96575320159614e-05, + "loss": 1.4883, + "step": 24088 + }, + { + "epoch": 1.9, + "learning_rate": 8.964621671139029e-05, + "loss": 1.4838, + "step": 24089 + }, + { + "epoch": 1.9, + "learning_rate": 8.963490181658803e-05, + "loss": 1.5443, + "step": 24090 + }, + { + "epoch": 1.9, + "learning_rate": 8.962358733163148e-05, + "loss": 1.4505, + "step": 24091 + }, + { + "epoch": 1.9, + "learning_rate": 8.961227325659748e-05, + "loss": 1.4497, + "step": 24092 + }, + { + "epoch": 1.9, + "learning_rate": 8.96009595915628e-05, + "loss": 1.4848, + "step": 24093 + }, + { + "epoch": 1.9, + "learning_rate": 8.958964633660429e-05, + "loss": 1.5056, + "step": 24094 + }, + { + "epoch": 1.9, + "learning_rate": 8.957833349179871e-05, + "loss": 1.5048, + "step": 24095 + }, + { + "epoch": 1.9, + "learning_rate": 8.956702105722293e-05, + "loss": 1.5127, + "step": 24096 + }, + { + "epoch": 1.9, + "learning_rate": 8.955570903295373e-05, + "loss": 1.4919, + "step": 24097 + }, + { + "epoch": 1.9, + "learning_rate": 8.95443974190679e-05, + "loss": 1.4467, + "step": 24098 + }, + { + "epoch": 1.9, + "learning_rate": 8.953308621564226e-05, + "loss": 1.4803, + "step": 24099 + }, + { + "epoch": 1.9, + "learning_rate": 8.952177542275357e-05, + "loss": 1.492, + "step": 24100 + }, + { + "epoch": 1.9, + "learning_rate": 8.951046504047863e-05, + "loss": 1.4445, + "step": 24101 + }, + { + "epoch": 1.9, + "learning_rate": 8.949915506889428e-05, + "loss": 1.5179, + "step": 24102 + }, + { + "epoch": 1.9, + "learning_rate": 8.948784550807731e-05, + "loss": 1.5102, + "step": 24103 + }, + { + "epoch": 1.9, + "learning_rate": 8.947653635810444e-05, + "loss": 1.4911, + "step": 24104 + }, + { + "epoch": 1.9, + "learning_rate": 8.946522761905248e-05, + "loss": 1.5527, + "step": 24105 + }, + { + "epoch": 1.9, + "learning_rate": 8.945391929099828e-05, + "loss": 1.4633, + "step": 24106 + }, + { + "epoch": 1.9, + "learning_rate": 8.94426113740185e-05, + "loss": 1.4792, + "step": 24107 + }, + { + "epoch": 1.9, + "learning_rate": 8.943130386818999e-05, + "loss": 1.5127, + "step": 24108 + }, + { + "epoch": 1.9, + "learning_rate": 8.94199967735895e-05, + "loss": 1.5, + "step": 24109 + }, + { + "epoch": 1.9, + "learning_rate": 8.94086900902938e-05, + "loss": 1.5141, + "step": 24110 + }, + { + "epoch": 1.9, + "learning_rate": 8.939738381837966e-05, + "loss": 1.4688, + "step": 24111 + }, + { + "epoch": 1.9, + "learning_rate": 8.938607795792384e-05, + "loss": 1.4375, + "step": 24112 + }, + { + "epoch": 1.9, + "learning_rate": 8.937477250900308e-05, + "loss": 1.4993, + "step": 24113 + }, + { + "epoch": 1.9, + "learning_rate": 8.93634674716942e-05, + "loss": 1.4501, + "step": 24114 + }, + { + "epoch": 1.9, + "learning_rate": 8.935216284607389e-05, + "loss": 1.5125, + "step": 24115 + }, + { + "epoch": 1.9, + "learning_rate": 8.934085863221894e-05, + "loss": 1.5187, + "step": 24116 + }, + { + "epoch": 1.9, + "learning_rate": 8.9329554830206e-05, + "loss": 1.4809, + "step": 24117 + }, + { + "epoch": 1.9, + "learning_rate": 8.9318251440112e-05, + "loss": 1.4737, + "step": 24118 + }, + { + "epoch": 1.9, + "learning_rate": 8.930694846201355e-05, + "loss": 1.5312, + "step": 24119 + }, + { + "epoch": 1.9, + "learning_rate": 8.929564589598743e-05, + "loss": 1.5136, + "step": 24120 + }, + { + "epoch": 1.9, + "learning_rate": 8.928434374211039e-05, + "loss": 1.4486, + "step": 24121 + }, + { + "epoch": 1.9, + "learning_rate": 8.927304200045915e-05, + "loss": 1.4801, + "step": 24122 + }, + { + "epoch": 1.9, + "learning_rate": 8.926174067111043e-05, + "loss": 1.4748, + "step": 24123 + }, + { + "epoch": 1.9, + "learning_rate": 8.9250439754141e-05, + "loss": 1.5004, + "step": 24124 + }, + { + "epoch": 1.9, + "learning_rate": 8.923913924962751e-05, + "loss": 1.4864, + "step": 24125 + }, + { + "epoch": 1.9, + "learning_rate": 8.922783915764678e-05, + "loss": 1.4961, + "step": 24126 + }, + { + "epoch": 1.9, + "learning_rate": 8.921653947827545e-05, + "loss": 1.4617, + "step": 24127 + }, + { + "epoch": 1.9, + "learning_rate": 8.920524021159031e-05, + "loss": 1.5361, + "step": 24128 + }, + { + "epoch": 1.9, + "learning_rate": 8.919394135766803e-05, + "loss": 1.4682, + "step": 24129 + }, + { + "epoch": 1.9, + "learning_rate": 8.918264291658531e-05, + "loss": 1.5132, + "step": 24130 + }, + { + "epoch": 1.9, + "learning_rate": 8.917134488841891e-05, + "loss": 1.513, + "step": 24131 + }, + { + "epoch": 1.9, + "learning_rate": 8.916004727324545e-05, + "loss": 1.4824, + "step": 24132 + }, + { + "epoch": 1.9, + "learning_rate": 8.914875007114173e-05, + "loss": 1.4616, + "step": 24133 + }, + { + "epoch": 1.9, + "learning_rate": 8.913745328218444e-05, + "loss": 1.504, + "step": 24134 + }, + { + "epoch": 1.9, + "learning_rate": 8.912615690645024e-05, + "loss": 1.466, + "step": 24135 + }, + { + "epoch": 1.9, + "learning_rate": 8.911486094401584e-05, + "loss": 1.4754, + "step": 24136 + }, + { + "epoch": 1.9, + "learning_rate": 8.910356539495792e-05, + "loss": 1.5432, + "step": 24137 + }, + { + "epoch": 1.9, + "learning_rate": 8.909227025935323e-05, + "loss": 1.4662, + "step": 24138 + }, + { + "epoch": 1.9, + "learning_rate": 8.908097553727838e-05, + "loss": 1.4872, + "step": 24139 + }, + { + "epoch": 1.9, + "learning_rate": 8.906968122881013e-05, + "loss": 1.5041, + "step": 24140 + }, + { + "epoch": 1.9, + "learning_rate": 8.905838733402507e-05, + "loss": 1.5077, + "step": 24141 + }, + { + "epoch": 1.9, + "learning_rate": 8.904709385299993e-05, + "loss": 1.4851, + "step": 24142 + }, + { + "epoch": 1.9, + "learning_rate": 8.903580078581142e-05, + "loss": 1.4696, + "step": 24143 + }, + { + "epoch": 1.9, + "learning_rate": 8.902450813253615e-05, + "loss": 1.4654, + "step": 24144 + }, + { + "epoch": 1.9, + "learning_rate": 8.901321589325082e-05, + "loss": 1.5286, + "step": 24145 + }, + { + "epoch": 1.9, + "learning_rate": 8.900192406803215e-05, + "loss": 1.516, + "step": 24146 + }, + { + "epoch": 1.9, + "learning_rate": 8.89906326569567e-05, + "loss": 1.5013, + "step": 24147 + }, + { + "epoch": 1.9, + "learning_rate": 8.897934166010116e-05, + "loss": 1.476, + "step": 24148 + }, + { + "epoch": 1.9, + "learning_rate": 8.896805107754225e-05, + "loss": 1.474, + "step": 24149 + }, + { + "epoch": 1.9, + "learning_rate": 8.895676090935662e-05, + "loss": 1.57, + "step": 24150 + }, + { + "epoch": 1.9, + "learning_rate": 8.894547115562088e-05, + "loss": 1.5029, + "step": 24151 + }, + { + "epoch": 1.9, + "learning_rate": 8.893418181641171e-05, + "loss": 1.4511, + "step": 24152 + }, + { + "epoch": 1.9, + "learning_rate": 8.892289289180573e-05, + "loss": 1.502, + "step": 24153 + }, + { + "epoch": 1.9, + "learning_rate": 8.891160438187957e-05, + "loss": 1.4996, + "step": 24154 + }, + { + "epoch": 1.9, + "learning_rate": 8.890031628670998e-05, + "loss": 1.4952, + "step": 24155 + }, + { + "epoch": 1.9, + "learning_rate": 8.888902860637346e-05, + "loss": 1.5299, + "step": 24156 + }, + { + "epoch": 1.9, + "learning_rate": 8.887774134094677e-05, + "loss": 1.488, + "step": 24157 + }, + { + "epoch": 1.9, + "learning_rate": 8.886645449050643e-05, + "loss": 1.4931, + "step": 24158 + }, + { + "epoch": 1.9, + "learning_rate": 8.885516805512914e-05, + "loss": 1.4803, + "step": 24159 + }, + { + "epoch": 1.9, + "learning_rate": 8.884388203489157e-05, + "loss": 1.4876, + "step": 24160 + }, + { + "epoch": 1.9, + "learning_rate": 8.883259642987023e-05, + "loss": 1.4319, + "step": 24161 + }, + { + "epoch": 1.9, + "learning_rate": 8.88213112401418e-05, + "loss": 1.4927, + "step": 24162 + }, + { + "epoch": 1.9, + "learning_rate": 8.881002646578297e-05, + "loss": 1.4841, + "step": 24163 + }, + { + "epoch": 1.9, + "learning_rate": 8.879874210687022e-05, + "loss": 1.4905, + "step": 24164 + }, + { + "epoch": 1.9, + "learning_rate": 8.878745816348025e-05, + "loss": 1.4925, + "step": 24165 + }, + { + "epoch": 1.9, + "learning_rate": 8.877617463568966e-05, + "loss": 1.4587, + "step": 24166 + }, + { + "epoch": 1.9, + "learning_rate": 8.87648915235751e-05, + "loss": 1.4487, + "step": 24167 + }, + { + "epoch": 1.9, + "learning_rate": 8.875360882721311e-05, + "loss": 1.4251, + "step": 24168 + }, + { + "epoch": 1.9, + "learning_rate": 8.874232654668033e-05, + "loss": 1.5304, + "step": 24169 + }, + { + "epoch": 1.9, + "learning_rate": 8.873104468205335e-05, + "loss": 1.5663, + "step": 24170 + }, + { + "epoch": 1.9, + "learning_rate": 8.871976323340873e-05, + "loss": 1.525, + "step": 24171 + }, + { + "epoch": 1.9, + "learning_rate": 8.870848220082314e-05, + "loss": 1.5112, + "step": 24172 + }, + { + "epoch": 1.9, + "learning_rate": 8.86972015843731e-05, + "loss": 1.4883, + "step": 24173 + }, + { + "epoch": 1.9, + "learning_rate": 8.868592138413524e-05, + "loss": 1.4824, + "step": 24174 + }, + { + "epoch": 1.9, + "learning_rate": 8.867464160018617e-05, + "loss": 1.5145, + "step": 24175 + }, + { + "epoch": 1.9, + "learning_rate": 8.866336223260242e-05, + "loss": 1.4521, + "step": 24176 + }, + { + "epoch": 1.9, + "learning_rate": 8.865208328146059e-05, + "loss": 1.4846, + "step": 24177 + }, + { + "epoch": 1.9, + "learning_rate": 8.864080474683726e-05, + "loss": 1.5179, + "step": 24178 + }, + { + "epoch": 1.9, + "learning_rate": 8.8629526628809e-05, + "loss": 1.523, + "step": 24179 + }, + { + "epoch": 1.9, + "learning_rate": 8.861824892745235e-05, + "loss": 1.4261, + "step": 24180 + }, + { + "epoch": 1.9, + "learning_rate": 8.860697164284397e-05, + "loss": 1.4949, + "step": 24181 + }, + { + "epoch": 1.9, + "learning_rate": 8.859569477506035e-05, + "loss": 1.5082, + "step": 24182 + }, + { + "epoch": 1.9, + "learning_rate": 8.858441832417809e-05, + "loss": 1.5369, + "step": 24183 + }, + { + "epoch": 1.9, + "learning_rate": 8.857314229027374e-05, + "loss": 1.505, + "step": 24184 + }, + { + "epoch": 1.9, + "learning_rate": 8.856186667342383e-05, + "loss": 1.5105, + "step": 24185 + }, + { + "epoch": 1.9, + "learning_rate": 8.8550591473705e-05, + "loss": 1.4519, + "step": 24186 + }, + { + "epoch": 1.9, + "learning_rate": 8.85393166911937e-05, + "loss": 1.4614, + "step": 24187 + }, + { + "epoch": 1.9, + "learning_rate": 8.852804232596652e-05, + "loss": 1.4924, + "step": 24188 + }, + { + "epoch": 1.9, + "learning_rate": 8.851676837810003e-05, + "loss": 1.5013, + "step": 24189 + }, + { + "epoch": 1.9, + "learning_rate": 8.850549484767073e-05, + "loss": 1.5413, + "step": 24190 + }, + { + "epoch": 1.9, + "learning_rate": 8.849422173475519e-05, + "loss": 1.5119, + "step": 24191 + }, + { + "epoch": 1.9, + "learning_rate": 8.848294903942997e-05, + "loss": 1.4676, + "step": 24192 + }, + { + "epoch": 1.9, + "learning_rate": 8.847167676177154e-05, + "loss": 1.49, + "step": 24193 + }, + { + "epoch": 1.9, + "learning_rate": 8.84604049018565e-05, + "loss": 1.4887, + "step": 24194 + }, + { + "epoch": 1.9, + "learning_rate": 8.844913345976127e-05, + "loss": 1.4882, + "step": 24195 + }, + { + "epoch": 1.9, + "learning_rate": 8.843786243556256e-05, + "loss": 1.482, + "step": 24196 + }, + { + "epoch": 1.9, + "learning_rate": 8.842659182933673e-05, + "loss": 1.4918, + "step": 24197 + }, + { + "epoch": 1.9, + "learning_rate": 8.841532164116041e-05, + "loss": 1.4517, + "step": 24198 + }, + { + "epoch": 1.9, + "learning_rate": 8.840405187111004e-05, + "loss": 1.4837, + "step": 24199 + }, + { + "epoch": 1.9, + "learning_rate": 8.839278251926217e-05, + "loss": 1.4377, + "step": 24200 + }, + { + "epoch": 1.9, + "learning_rate": 8.838151358569333e-05, + "loss": 1.427, + "step": 24201 + }, + { + "epoch": 1.9, + "learning_rate": 8.837024507047999e-05, + "loss": 1.5423, + "step": 24202 + }, + { + "epoch": 1.9, + "learning_rate": 8.835897697369866e-05, + "loss": 1.4865, + "step": 24203 + }, + { + "epoch": 1.9, + "learning_rate": 8.83477092954259e-05, + "loss": 1.4584, + "step": 24204 + }, + { + "epoch": 1.9, + "learning_rate": 8.833644203573815e-05, + "loss": 1.4953, + "step": 24205 + }, + { + "epoch": 1.9, + "learning_rate": 8.832517519471195e-05, + "loss": 1.4728, + "step": 24206 + }, + { + "epoch": 1.9, + "learning_rate": 8.831390877242375e-05, + "loss": 1.477, + "step": 24207 + }, + { + "epoch": 1.9, + "learning_rate": 8.830264276895005e-05, + "loss": 1.4474, + "step": 24208 + }, + { + "epoch": 1.9, + "learning_rate": 8.829137718436741e-05, + "loss": 1.4784, + "step": 24209 + }, + { + "epoch": 1.9, + "learning_rate": 8.828011201875224e-05, + "loss": 1.4759, + "step": 24210 + }, + { + "epoch": 1.9, + "learning_rate": 8.826884727218099e-05, + "loss": 1.4727, + "step": 24211 + }, + { + "epoch": 1.91, + "learning_rate": 8.825758294473025e-05, + "loss": 1.4902, + "step": 24212 + }, + { + "epoch": 1.91, + "learning_rate": 8.824631903647647e-05, + "loss": 1.5376, + "step": 24213 + }, + { + "epoch": 1.91, + "learning_rate": 8.823505554749608e-05, + "loss": 1.4215, + "step": 24214 + }, + { + "epoch": 1.91, + "learning_rate": 8.822379247786562e-05, + "loss": 1.4649, + "step": 24215 + }, + { + "epoch": 1.91, + "learning_rate": 8.821252982766148e-05, + "loss": 1.4872, + "step": 24216 + }, + { + "epoch": 1.91, + "learning_rate": 8.820126759696017e-05, + "loss": 1.4778, + "step": 24217 + }, + { + "epoch": 1.91, + "learning_rate": 8.819000578583817e-05, + "loss": 1.5351, + "step": 24218 + }, + { + "epoch": 1.91, + "learning_rate": 8.81787443943719e-05, + "loss": 1.4541, + "step": 24219 + }, + { + "epoch": 1.91, + "learning_rate": 8.816748342263783e-05, + "loss": 1.553, + "step": 24220 + }, + { + "epoch": 1.91, + "learning_rate": 8.815622287071247e-05, + "loss": 1.4637, + "step": 24221 + }, + { + "epoch": 1.91, + "learning_rate": 8.814496273867219e-05, + "loss": 1.519, + "step": 24222 + }, + { + "epoch": 1.91, + "learning_rate": 8.81337030265935e-05, + "loss": 1.4798, + "step": 24223 + }, + { + "epoch": 1.91, + "learning_rate": 8.81224437345528e-05, + "loss": 1.4856, + "step": 24224 + }, + { + "epoch": 1.91, + "learning_rate": 8.811118486262656e-05, + "loss": 1.444, + "step": 24225 + }, + { + "epoch": 1.91, + "learning_rate": 8.809992641089126e-05, + "loss": 1.5221, + "step": 24226 + }, + { + "epoch": 1.91, + "learning_rate": 8.808866837942325e-05, + "loss": 1.4696, + "step": 24227 + }, + { + "epoch": 1.91, + "learning_rate": 8.8077410768299e-05, + "loss": 1.533, + "step": 24228 + }, + { + "epoch": 1.91, + "learning_rate": 8.8066153577595e-05, + "loss": 1.4718, + "step": 24229 + }, + { + "epoch": 1.91, + "learning_rate": 8.805489680738766e-05, + "loss": 1.488, + "step": 24230 + }, + { + "epoch": 1.91, + "learning_rate": 8.804364045775337e-05, + "loss": 1.4706, + "step": 24231 + }, + { + "epoch": 1.91, + "learning_rate": 8.803238452876857e-05, + "loss": 1.4831, + "step": 24232 + }, + { + "epoch": 1.91, + "learning_rate": 8.802112902050968e-05, + "loss": 1.4621, + "step": 24233 + }, + { + "epoch": 1.91, + "learning_rate": 8.800987393305311e-05, + "loss": 1.5091, + "step": 24234 + }, + { + "epoch": 1.91, + "learning_rate": 8.799861926647532e-05, + "loss": 1.5367, + "step": 24235 + }, + { + "epoch": 1.91, + "learning_rate": 8.798736502085265e-05, + "loss": 1.4395, + "step": 24236 + }, + { + "epoch": 1.91, + "learning_rate": 8.797611119626156e-05, + "loss": 1.4836, + "step": 24237 + }, + { + "epoch": 1.91, + "learning_rate": 8.796485779277849e-05, + "loss": 1.4785, + "step": 24238 + }, + { + "epoch": 1.91, + "learning_rate": 8.795360481047975e-05, + "loss": 1.4857, + "step": 24239 + }, + { + "epoch": 1.91, + "learning_rate": 8.794235224944183e-05, + "loss": 1.5083, + "step": 24240 + }, + { + "epoch": 1.91, + "learning_rate": 8.793110010974108e-05, + "loss": 1.4951, + "step": 24241 + }, + { + "epoch": 1.91, + "learning_rate": 8.791984839145385e-05, + "loss": 1.4795, + "step": 24242 + }, + { + "epoch": 1.91, + "learning_rate": 8.790859709465664e-05, + "loss": 1.5029, + "step": 24243 + }, + { + "epoch": 1.91, + "learning_rate": 8.789734621942578e-05, + "loss": 1.5129, + "step": 24244 + }, + { + "epoch": 1.91, + "learning_rate": 8.788609576583769e-05, + "loss": 1.4797, + "step": 24245 + }, + { + "epoch": 1.91, + "learning_rate": 8.787484573396873e-05, + "loss": 1.5111, + "step": 24246 + }, + { + "epoch": 1.91, + "learning_rate": 8.786359612389528e-05, + "loss": 1.5351, + "step": 24247 + }, + { + "epoch": 1.91, + "learning_rate": 8.785234693569371e-05, + "loss": 1.4886, + "step": 24248 + }, + { + "epoch": 1.91, + "learning_rate": 8.78410981694404e-05, + "loss": 1.4581, + "step": 24249 + }, + { + "epoch": 1.91, + "learning_rate": 8.782984982521178e-05, + "loss": 1.4729, + "step": 24250 + }, + { + "epoch": 1.91, + "learning_rate": 8.781860190308414e-05, + "loss": 1.4775, + "step": 24251 + }, + { + "epoch": 1.91, + "learning_rate": 8.78073544031339e-05, + "loss": 1.4553, + "step": 24252 + }, + { + "epoch": 1.91, + "learning_rate": 8.779610732543735e-05, + "loss": 1.5403, + "step": 24253 + }, + { + "epoch": 1.91, + "learning_rate": 8.778486067007094e-05, + "loss": 1.468, + "step": 24254 + }, + { + "epoch": 1.91, + "learning_rate": 8.777361443711101e-05, + "loss": 1.4837, + "step": 24255 + }, + { + "epoch": 1.91, + "learning_rate": 8.776236862663386e-05, + "loss": 1.4533, + "step": 24256 + }, + { + "epoch": 1.91, + "learning_rate": 8.77511232387159e-05, + "loss": 1.4878, + "step": 24257 + }, + { + "epoch": 1.91, + "learning_rate": 8.773987827343341e-05, + "loss": 1.515, + "step": 24258 + }, + { + "epoch": 1.91, + "learning_rate": 8.772863373086287e-05, + "loss": 1.4717, + "step": 24259 + }, + { + "epoch": 1.91, + "learning_rate": 8.77173896110805e-05, + "loss": 1.4985, + "step": 24260 + }, + { + "epoch": 1.91, + "learning_rate": 8.770614591416269e-05, + "loss": 1.4528, + "step": 24261 + }, + { + "epoch": 1.91, + "learning_rate": 8.769490264018579e-05, + "loss": 1.45, + "step": 24262 + }, + { + "epoch": 1.91, + "learning_rate": 8.76836597892261e-05, + "loss": 1.4852, + "step": 24263 + }, + { + "epoch": 1.91, + "learning_rate": 8.767241736136e-05, + "loss": 1.5282, + "step": 24264 + }, + { + "epoch": 1.91, + "learning_rate": 8.766117535666376e-05, + "loss": 1.4585, + "step": 24265 + }, + { + "epoch": 1.91, + "learning_rate": 8.764993377521374e-05, + "loss": 1.4559, + "step": 24266 + }, + { + "epoch": 1.91, + "learning_rate": 8.763869261708629e-05, + "loss": 1.4526, + "step": 24267 + }, + { + "epoch": 1.91, + "learning_rate": 8.762745188235766e-05, + "loss": 1.483, + "step": 24268 + }, + { + "epoch": 1.91, + "learning_rate": 8.761621157110426e-05, + "loss": 1.4916, + "step": 24269 + }, + { + "epoch": 1.91, + "learning_rate": 8.760497168340232e-05, + "loss": 1.4741, + "step": 24270 + }, + { + "epoch": 1.91, + "learning_rate": 8.759373221932819e-05, + "loss": 1.5096, + "step": 24271 + }, + { + "epoch": 1.91, + "learning_rate": 8.758249317895822e-05, + "loss": 1.513, + "step": 24272 + }, + { + "epoch": 1.91, + "learning_rate": 8.757125456236863e-05, + "loss": 1.4871, + "step": 24273 + }, + { + "epoch": 1.91, + "learning_rate": 8.756001636963576e-05, + "loss": 1.4279, + "step": 24274 + }, + { + "epoch": 1.91, + "learning_rate": 8.754877860083597e-05, + "loss": 1.5045, + "step": 24275 + }, + { + "epoch": 1.91, + "learning_rate": 8.753754125604543e-05, + "loss": 1.4854, + "step": 24276 + }, + { + "epoch": 1.91, + "learning_rate": 8.752630433534061e-05, + "loss": 1.4405, + "step": 24277 + }, + { + "epoch": 1.91, + "learning_rate": 8.75150678387977e-05, + "loss": 1.5058, + "step": 24278 + }, + { + "epoch": 1.91, + "learning_rate": 8.750383176649291e-05, + "loss": 1.4845, + "step": 24279 + }, + { + "epoch": 1.91, + "learning_rate": 8.749259611850269e-05, + "loss": 1.4817, + "step": 24280 + }, + { + "epoch": 1.91, + "learning_rate": 8.748136089490325e-05, + "loss": 1.4792, + "step": 24281 + }, + { + "epoch": 1.91, + "learning_rate": 8.747012609577082e-05, + "loss": 1.5027, + "step": 24282 + }, + { + "epoch": 1.91, + "learning_rate": 8.745889172118177e-05, + "loss": 1.5188, + "step": 24283 + }, + { + "epoch": 1.91, + "learning_rate": 8.744765777121235e-05, + "loss": 1.4977, + "step": 24284 + }, + { + "epoch": 1.91, + "learning_rate": 8.74364242459388e-05, + "loss": 1.5101, + "step": 24285 + }, + { + "epoch": 1.91, + "learning_rate": 8.742519114543735e-05, + "loss": 1.4758, + "step": 24286 + }, + { + "epoch": 1.91, + "learning_rate": 8.741395846978439e-05, + "loss": 1.4678, + "step": 24287 + }, + { + "epoch": 1.91, + "learning_rate": 8.74027262190561e-05, + "loss": 1.5102, + "step": 24288 + }, + { + "epoch": 1.91, + "learning_rate": 8.739149439332868e-05, + "loss": 1.4579, + "step": 24289 + }, + { + "epoch": 1.91, + "learning_rate": 8.738026299267849e-05, + "loss": 1.4929, + "step": 24290 + }, + { + "epoch": 1.91, + "learning_rate": 8.736903201718179e-05, + "loss": 1.4606, + "step": 24291 + }, + { + "epoch": 1.91, + "learning_rate": 8.735780146691485e-05, + "loss": 1.4884, + "step": 24292 + }, + { + "epoch": 1.91, + "learning_rate": 8.734657134195376e-05, + "loss": 1.5173, + "step": 24293 + }, + { + "epoch": 1.91, + "learning_rate": 8.733534164237496e-05, + "loss": 1.5334, + "step": 24294 + }, + { + "epoch": 1.91, + "learning_rate": 8.73241123682546e-05, + "loss": 1.4909, + "step": 24295 + }, + { + "epoch": 1.91, + "learning_rate": 8.731288351966888e-05, + "loss": 1.4448, + "step": 24296 + }, + { + "epoch": 1.91, + "learning_rate": 8.730165509669413e-05, + "loss": 1.4828, + "step": 24297 + }, + { + "epoch": 1.91, + "learning_rate": 8.729042709940654e-05, + "loss": 1.4922, + "step": 24298 + }, + { + "epoch": 1.91, + "learning_rate": 8.727919952788231e-05, + "loss": 1.4059, + "step": 24299 + }, + { + "epoch": 1.91, + "learning_rate": 8.726797238219775e-05, + "loss": 1.4244, + "step": 24300 + }, + { + "epoch": 1.91, + "learning_rate": 8.725674566242904e-05, + "loss": 1.4391, + "step": 24301 + }, + { + "epoch": 1.91, + "learning_rate": 8.72455193686524e-05, + "loss": 1.4566, + "step": 24302 + }, + { + "epoch": 1.91, + "learning_rate": 8.723429350094398e-05, + "loss": 1.4875, + "step": 24303 + }, + { + "epoch": 1.91, + "learning_rate": 8.722306805938014e-05, + "loss": 1.4921, + "step": 24304 + }, + { + "epoch": 1.91, + "learning_rate": 8.721184304403697e-05, + "loss": 1.4189, + "step": 24305 + }, + { + "epoch": 1.91, + "learning_rate": 8.72006184549908e-05, + "loss": 1.5493, + "step": 24306 + }, + { + "epoch": 1.91, + "learning_rate": 8.71893942923177e-05, + "loss": 1.4602, + "step": 24307 + }, + { + "epoch": 1.91, + "learning_rate": 8.717817055609401e-05, + "loss": 1.506, + "step": 24308 + }, + { + "epoch": 1.91, + "learning_rate": 8.716694724639589e-05, + "loss": 1.5242, + "step": 24309 + }, + { + "epoch": 1.91, + "learning_rate": 8.715572436329946e-05, + "loss": 1.5221, + "step": 24310 + }, + { + "epoch": 1.91, + "learning_rate": 8.714450190688104e-05, + "loss": 1.5043, + "step": 24311 + }, + { + "epoch": 1.91, + "learning_rate": 8.713327987721677e-05, + "loss": 1.4906, + "step": 24312 + }, + { + "epoch": 1.91, + "learning_rate": 8.712205827438277e-05, + "loss": 1.4725, + "step": 24313 + }, + { + "epoch": 1.91, + "learning_rate": 8.711083709845534e-05, + "loss": 1.4664, + "step": 24314 + }, + { + "epoch": 1.91, + "learning_rate": 8.709961634951064e-05, + "loss": 1.4454, + "step": 24315 + }, + { + "epoch": 1.91, + "learning_rate": 8.708839602762477e-05, + "loss": 1.4767, + "step": 24316 + }, + { + "epoch": 1.91, + "learning_rate": 8.707717613287407e-05, + "loss": 1.4569, + "step": 24317 + }, + { + "epoch": 1.91, + "learning_rate": 8.706595666533456e-05, + "loss": 1.4442, + "step": 24318 + }, + { + "epoch": 1.91, + "learning_rate": 8.705473762508244e-05, + "loss": 1.5116, + "step": 24319 + }, + { + "epoch": 1.91, + "learning_rate": 8.704351901219398e-05, + "loss": 1.5092, + "step": 24320 + }, + { + "epoch": 1.91, + "learning_rate": 8.703230082674523e-05, + "loss": 1.499, + "step": 24321 + }, + { + "epoch": 1.91, + "learning_rate": 8.702108306881244e-05, + "loss": 1.487, + "step": 24322 + }, + { + "epoch": 1.91, + "learning_rate": 8.700986573847171e-05, + "loss": 1.5369, + "step": 24323 + }, + { + "epoch": 1.91, + "learning_rate": 8.699864883579928e-05, + "loss": 1.5105, + "step": 24324 + }, + { + "epoch": 1.91, + "learning_rate": 8.698743236087125e-05, + "loss": 1.511, + "step": 24325 + }, + { + "epoch": 1.91, + "learning_rate": 8.697621631376378e-05, + "loss": 1.461, + "step": 24326 + }, + { + "epoch": 1.91, + "learning_rate": 8.6965000694553e-05, + "loss": 1.5106, + "step": 24327 + }, + { + "epoch": 1.91, + "learning_rate": 8.695378550331508e-05, + "loss": 1.5158, + "step": 24328 + }, + { + "epoch": 1.91, + "learning_rate": 8.694257074012622e-05, + "loss": 1.4911, + "step": 24329 + }, + { + "epoch": 1.91, + "learning_rate": 8.693135640506242e-05, + "loss": 1.4849, + "step": 24330 + }, + { + "epoch": 1.91, + "learning_rate": 8.692014249819995e-05, + "loss": 1.4602, + "step": 24331 + }, + { + "epoch": 1.91, + "learning_rate": 8.690892901961491e-05, + "loss": 1.4484, + "step": 24332 + }, + { + "epoch": 1.91, + "learning_rate": 8.689771596938338e-05, + "loss": 1.5066, + "step": 24333 + }, + { + "epoch": 1.91, + "learning_rate": 8.68865033475816e-05, + "loss": 1.454, + "step": 24334 + }, + { + "epoch": 1.91, + "learning_rate": 8.687529115428563e-05, + "loss": 1.4626, + "step": 24335 + }, + { + "epoch": 1.91, + "learning_rate": 8.686407938957152e-05, + "loss": 1.4992, + "step": 24336 + }, + { + "epoch": 1.91, + "learning_rate": 8.685286805351549e-05, + "loss": 1.4525, + "step": 24337 + }, + { + "epoch": 1.91, + "learning_rate": 8.68416571461937e-05, + "loss": 1.4694, + "step": 24338 + }, + { + "epoch": 1.92, + "learning_rate": 8.683044666768218e-05, + "loss": 1.5133, + "step": 24339 + }, + { + "epoch": 1.92, + "learning_rate": 8.681923661805701e-05, + "loss": 1.4637, + "step": 24340 + }, + { + "epoch": 1.92, + "learning_rate": 8.680802699739443e-05, + "loss": 1.4798, + "step": 24341 + }, + { + "epoch": 1.92, + "learning_rate": 8.679681780577046e-05, + "loss": 1.5459, + "step": 24342 + }, + { + "epoch": 1.92, + "learning_rate": 8.678560904326125e-05, + "loss": 1.5057, + "step": 24343 + }, + { + "epoch": 1.92, + "learning_rate": 8.677440070994279e-05, + "loss": 1.4671, + "step": 24344 + }, + { + "epoch": 1.92, + "learning_rate": 8.676319280589134e-05, + "loss": 1.4705, + "step": 24345 + }, + { + "epoch": 1.92, + "learning_rate": 8.675198533118288e-05, + "loss": 1.4514, + "step": 24346 + }, + { + "epoch": 1.92, + "learning_rate": 8.67407782858935e-05, + "loss": 1.483, + "step": 24347 + }, + { + "epoch": 1.92, + "learning_rate": 8.672957167009936e-05, + "loss": 1.5204, + "step": 24348 + }, + { + "epoch": 1.92, + "learning_rate": 8.671836548387654e-05, + "loss": 1.5205, + "step": 24349 + }, + { + "epoch": 1.92, + "learning_rate": 8.670715972730101e-05, + "loss": 1.4852, + "step": 24350 + }, + { + "epoch": 1.92, + "learning_rate": 8.669595440044902e-05, + "loss": 1.5154, + "step": 24351 + }, + { + "epoch": 1.92, + "learning_rate": 8.66847495033965e-05, + "loss": 1.4997, + "step": 24352 + }, + { + "epoch": 1.92, + "learning_rate": 8.667354503621965e-05, + "loss": 1.4806, + "step": 24353 + }, + { + "epoch": 1.92, + "learning_rate": 8.666234099899443e-05, + "loss": 1.4809, + "step": 24354 + }, + { + "epoch": 1.92, + "learning_rate": 8.665113739179702e-05, + "loss": 1.4653, + "step": 24355 + }, + { + "epoch": 1.92, + "learning_rate": 8.663993421470342e-05, + "loss": 1.4524, + "step": 24356 + }, + { + "epoch": 1.92, + "learning_rate": 8.662873146778963e-05, + "loss": 1.4529, + "step": 24357 + }, + { + "epoch": 1.92, + "learning_rate": 8.661752915113188e-05, + "loss": 1.4768, + "step": 24358 + }, + { + "epoch": 1.92, + "learning_rate": 8.660632726480609e-05, + "loss": 1.4512, + "step": 24359 + }, + { + "epoch": 1.92, + "learning_rate": 8.659512580888837e-05, + "loss": 1.4284, + "step": 24360 + }, + { + "epoch": 1.92, + "learning_rate": 8.65839247834547e-05, + "loss": 1.4714, + "step": 24361 + }, + { + "epoch": 1.92, + "learning_rate": 8.657272418858124e-05, + "loss": 1.4866, + "step": 24362 + }, + { + "epoch": 1.92, + "learning_rate": 8.656152402434398e-05, + "loss": 1.5329, + "step": 24363 + }, + { + "epoch": 1.92, + "learning_rate": 8.655032429081892e-05, + "loss": 1.5069, + "step": 24364 + }, + { + "epoch": 1.92, + "learning_rate": 8.653912498808219e-05, + "loss": 1.4516, + "step": 24365 + }, + { + "epoch": 1.92, + "learning_rate": 8.652792611620977e-05, + "loss": 1.445, + "step": 24366 + }, + { + "epoch": 1.92, + "learning_rate": 8.651672767527767e-05, + "loss": 1.4797, + "step": 24367 + }, + { + "epoch": 1.92, + "learning_rate": 8.650552966536193e-05, + "loss": 1.4556, + "step": 24368 + }, + { + "epoch": 1.92, + "learning_rate": 8.649433208653869e-05, + "loss": 1.4417, + "step": 24369 + }, + { + "epoch": 1.92, + "learning_rate": 8.648313493888386e-05, + "loss": 1.4703, + "step": 24370 + }, + { + "epoch": 1.92, + "learning_rate": 8.647193822247345e-05, + "loss": 1.5135, + "step": 24371 + }, + { + "epoch": 1.92, + "learning_rate": 8.64607419373836e-05, + "loss": 1.4897, + "step": 24372 + }, + { + "epoch": 1.92, + "learning_rate": 8.64495460836902e-05, + "loss": 1.4699, + "step": 24373 + }, + { + "epoch": 1.92, + "learning_rate": 8.643835066146928e-05, + "loss": 1.4763, + "step": 24374 + }, + { + "epoch": 1.92, + "learning_rate": 8.642715567079695e-05, + "loss": 1.4843, + "step": 24375 + }, + { + "epoch": 1.92, + "learning_rate": 8.641596111174915e-05, + "loss": 1.5064, + "step": 24376 + }, + { + "epoch": 1.92, + "learning_rate": 8.640476698440182e-05, + "loss": 1.5138, + "step": 24377 + }, + { + "epoch": 1.92, + "learning_rate": 8.639357328883108e-05, + "loss": 1.4565, + "step": 24378 + }, + { + "epoch": 1.92, + "learning_rate": 8.63823800251129e-05, + "loss": 1.4456, + "step": 24379 + }, + { + "epoch": 1.92, + "learning_rate": 8.637118719332322e-05, + "loss": 1.4876, + "step": 24380 + }, + { + "epoch": 1.92, + "learning_rate": 8.635999479353801e-05, + "loss": 1.4865, + "step": 24381 + }, + { + "epoch": 1.92, + "learning_rate": 8.634880282583341e-05, + "loss": 1.4697, + "step": 24382 + }, + { + "epoch": 1.92, + "learning_rate": 8.633761129028527e-05, + "loss": 1.5188, + "step": 24383 + }, + { + "epoch": 1.92, + "learning_rate": 8.632642018696958e-05, + "loss": 1.5105, + "step": 24384 + }, + { + "epoch": 1.92, + "learning_rate": 8.631522951596236e-05, + "loss": 1.4762, + "step": 24385 + }, + { + "epoch": 1.92, + "learning_rate": 8.630403927733966e-05, + "loss": 1.4361, + "step": 24386 + }, + { + "epoch": 1.92, + "learning_rate": 8.629284947117737e-05, + "loss": 1.4885, + "step": 24387 + }, + { + "epoch": 1.92, + "learning_rate": 8.62816600975514e-05, + "loss": 1.5013, + "step": 24388 + }, + { + "epoch": 1.92, + "learning_rate": 8.627047115653787e-05, + "loss": 1.52, + "step": 24389 + }, + { + "epoch": 1.92, + "learning_rate": 8.625928264821268e-05, + "loss": 1.5271, + "step": 24390 + }, + { + "epoch": 1.92, + "learning_rate": 8.624809457265172e-05, + "loss": 1.465, + "step": 24391 + }, + { + "epoch": 1.92, + "learning_rate": 8.623690692993105e-05, + "loss": 1.5275, + "step": 24392 + }, + { + "epoch": 1.92, + "learning_rate": 8.622571972012662e-05, + "loss": 1.4936, + "step": 24393 + }, + { + "epoch": 1.92, + "learning_rate": 8.62145329433143e-05, + "loss": 1.4868, + "step": 24394 + }, + { + "epoch": 1.92, + "learning_rate": 8.620334659957016e-05, + "loss": 1.4612, + "step": 24395 + }, + { + "epoch": 1.92, + "learning_rate": 8.619216068897008e-05, + "loss": 1.4762, + "step": 24396 + }, + { + "epoch": 1.92, + "learning_rate": 8.618097521159005e-05, + "loss": 1.4826, + "step": 24397 + }, + { + "epoch": 1.92, + "learning_rate": 8.616979016750588e-05, + "loss": 1.4713, + "step": 24398 + }, + { + "epoch": 1.92, + "learning_rate": 8.61586055567937e-05, + "loss": 1.5297, + "step": 24399 + }, + { + "epoch": 1.92, + "learning_rate": 8.614742137952928e-05, + "loss": 1.4539, + "step": 24400 + }, + { + "epoch": 1.92, + "learning_rate": 8.613623763578868e-05, + "loss": 1.5199, + "step": 24401 + }, + { + "epoch": 1.92, + "learning_rate": 8.612505432564775e-05, + "loss": 1.4291, + "step": 24402 + }, + { + "epoch": 1.92, + "learning_rate": 8.61138714491825e-05, + "loss": 1.5116, + "step": 24403 + }, + { + "epoch": 1.92, + "learning_rate": 8.610268900646879e-05, + "loss": 1.4627, + "step": 24404 + }, + { + "epoch": 1.92, + "learning_rate": 8.609150699758252e-05, + "loss": 1.5116, + "step": 24405 + }, + { + "epoch": 1.92, + "learning_rate": 8.608032542259972e-05, + "loss": 1.4942, + "step": 24406 + }, + { + "epoch": 1.92, + "learning_rate": 8.606914428159624e-05, + "loss": 1.508, + "step": 24407 + }, + { + "epoch": 1.92, + "learning_rate": 8.60579635746479e-05, + "loss": 1.5098, + "step": 24408 + }, + { + "epoch": 1.92, + "learning_rate": 8.604678330183078e-05, + "loss": 1.4495, + "step": 24409 + }, + { + "epoch": 1.92, + "learning_rate": 8.60356034632207e-05, + "loss": 1.5136, + "step": 24410 + }, + { + "epoch": 1.92, + "learning_rate": 8.602442405889354e-05, + "loss": 1.4576, + "step": 24411 + }, + { + "epoch": 1.92, + "learning_rate": 8.601324508892525e-05, + "loss": 1.4636, + "step": 24412 + }, + { + "epoch": 1.92, + "learning_rate": 8.600206655339175e-05, + "loss": 1.4539, + "step": 24413 + }, + { + "epoch": 1.92, + "learning_rate": 8.59908884523689e-05, + "loss": 1.4487, + "step": 24414 + }, + { + "epoch": 1.92, + "learning_rate": 8.597971078593246e-05, + "loss": 1.4628, + "step": 24415 + }, + { + "epoch": 1.92, + "learning_rate": 8.596853355415859e-05, + "loss": 1.4629, + "step": 24416 + }, + { + "epoch": 1.92, + "learning_rate": 8.595735675712302e-05, + "loss": 1.5184, + "step": 24417 + }, + { + "epoch": 1.92, + "learning_rate": 8.594618039490167e-05, + "loss": 1.4827, + "step": 24418 + }, + { + "epoch": 1.92, + "learning_rate": 8.593500446757035e-05, + "loss": 1.4581, + "step": 24419 + }, + { + "epoch": 1.92, + "learning_rate": 8.592382897520506e-05, + "loss": 1.4833, + "step": 24420 + }, + { + "epoch": 1.92, + "learning_rate": 8.59126539178816e-05, + "loss": 1.4539, + "step": 24421 + }, + { + "epoch": 1.92, + "learning_rate": 8.59014792956758e-05, + "loss": 1.477, + "step": 24422 + }, + { + "epoch": 1.92, + "learning_rate": 8.589030510866363e-05, + "loss": 1.5956, + "step": 24423 + }, + { + "epoch": 1.92, + "learning_rate": 8.587913135692093e-05, + "loss": 1.5056, + "step": 24424 + }, + { + "epoch": 1.92, + "learning_rate": 8.586795804052346e-05, + "loss": 1.4961, + "step": 24425 + }, + { + "epoch": 1.92, + "learning_rate": 8.585678515954724e-05, + "loss": 1.4755, + "step": 24426 + }, + { + "epoch": 1.92, + "learning_rate": 8.584561271406804e-05, + "loss": 1.4612, + "step": 24427 + }, + { + "epoch": 1.92, + "learning_rate": 8.583444070416169e-05, + "loss": 1.4737, + "step": 24428 + }, + { + "epoch": 1.92, + "learning_rate": 8.582326912990412e-05, + "loss": 1.4962, + "step": 24429 + }, + { + "epoch": 1.92, + "learning_rate": 8.581209799137113e-05, + "loss": 1.4896, + "step": 24430 + }, + { + "epoch": 1.92, + "learning_rate": 8.580092728863853e-05, + "loss": 1.4408, + "step": 24431 + }, + { + "epoch": 1.92, + "learning_rate": 8.578975702178219e-05, + "loss": 1.4853, + "step": 24432 + }, + { + "epoch": 1.92, + "learning_rate": 8.577858719087805e-05, + "loss": 1.5112, + "step": 24433 + }, + { + "epoch": 1.92, + "learning_rate": 8.576741779600185e-05, + "loss": 1.5085, + "step": 24434 + }, + { + "epoch": 1.92, + "learning_rate": 8.575624883722937e-05, + "loss": 1.4877, + "step": 24435 + }, + { + "epoch": 1.92, + "learning_rate": 8.574508031463655e-05, + "loss": 1.4706, + "step": 24436 + }, + { + "epoch": 1.92, + "learning_rate": 8.573391222829919e-05, + "loss": 1.4606, + "step": 24437 + }, + { + "epoch": 1.92, + "learning_rate": 8.572274457829312e-05, + "loss": 1.4738, + "step": 24438 + }, + { + "epoch": 1.92, + "learning_rate": 8.571157736469408e-05, + "loss": 1.4838, + "step": 24439 + }, + { + "epoch": 1.92, + "learning_rate": 8.5700410587578e-05, + "loss": 1.4535, + "step": 24440 + }, + { + "epoch": 1.92, + "learning_rate": 8.568924424702065e-05, + "loss": 1.529, + "step": 24441 + }, + { + "epoch": 1.92, + "learning_rate": 8.567807834309777e-05, + "loss": 1.4576, + "step": 24442 + }, + { + "epoch": 1.92, + "learning_rate": 8.566691287588535e-05, + "loss": 1.4757, + "step": 24443 + }, + { + "epoch": 1.92, + "learning_rate": 8.565574784545904e-05, + "loss": 1.4405, + "step": 24444 + }, + { + "epoch": 1.92, + "learning_rate": 8.564458325189464e-05, + "loss": 1.4963, + "step": 24445 + }, + { + "epoch": 1.92, + "learning_rate": 8.563341909526808e-05, + "loss": 1.4074, + "step": 24446 + }, + { + "epoch": 1.92, + "learning_rate": 8.562225537565502e-05, + "loss": 1.5201, + "step": 24447 + }, + { + "epoch": 1.92, + "learning_rate": 8.561109209313138e-05, + "loss": 1.4842, + "step": 24448 + }, + { + "epoch": 1.92, + "learning_rate": 8.559992924777284e-05, + "loss": 1.5003, + "step": 24449 + }, + { + "epoch": 1.92, + "learning_rate": 8.558876683965529e-05, + "loss": 1.4728, + "step": 24450 + }, + { + "epoch": 1.92, + "learning_rate": 8.557760486885446e-05, + "loss": 1.4921, + "step": 24451 + }, + { + "epoch": 1.92, + "learning_rate": 8.556644333544609e-05, + "loss": 1.5321, + "step": 24452 + }, + { + "epoch": 1.92, + "learning_rate": 8.555528223950608e-05, + "loss": 1.5264, + "step": 24453 + }, + { + "epoch": 1.92, + "learning_rate": 8.554412158111014e-05, + "loss": 1.5158, + "step": 24454 + }, + { + "epoch": 1.92, + "learning_rate": 8.553296136033404e-05, + "loss": 1.5238, + "step": 24455 + }, + { + "epoch": 1.92, + "learning_rate": 8.552180157725348e-05, + "loss": 1.4768, + "step": 24456 + }, + { + "epoch": 1.92, + "learning_rate": 8.55106422319444e-05, + "loss": 1.5274, + "step": 24457 + }, + { + "epoch": 1.92, + "learning_rate": 8.549948332448244e-05, + "loss": 1.4896, + "step": 24458 + }, + { + "epoch": 1.92, + "learning_rate": 8.548832485494334e-05, + "loss": 1.4735, + "step": 24459 + }, + { + "epoch": 1.92, + "learning_rate": 8.547716682340297e-05, + "loss": 1.4561, + "step": 24460 + }, + { + "epoch": 1.92, + "learning_rate": 8.546600922993706e-05, + "loss": 1.5455, + "step": 24461 + }, + { + "epoch": 1.92, + "learning_rate": 8.545485207462125e-05, + "loss": 1.5336, + "step": 24462 + }, + { + "epoch": 1.92, + "learning_rate": 8.544369535753138e-05, + "loss": 1.5397, + "step": 24463 + }, + { + "epoch": 1.92, + "learning_rate": 8.543253907874326e-05, + "loss": 1.5343, + "step": 24464 + }, + { + "epoch": 1.92, + "learning_rate": 8.542138323833256e-05, + "loss": 1.5033, + "step": 24465 + }, + { + "epoch": 1.93, + "learning_rate": 8.541022783637498e-05, + "loss": 1.486, + "step": 24466 + }, + { + "epoch": 1.93, + "learning_rate": 8.539907287294635e-05, + "loss": 1.4765, + "step": 24467 + }, + { + "epoch": 1.93, + "learning_rate": 8.538791834812237e-05, + "loss": 1.4641, + "step": 24468 + }, + { + "epoch": 1.93, + "learning_rate": 8.537676426197873e-05, + "loss": 1.5246, + "step": 24469 + }, + { + "epoch": 1.93, + "learning_rate": 8.536561061459125e-05, + "loss": 1.4893, + "step": 24470 + }, + { + "epoch": 1.93, + "learning_rate": 8.53544574060356e-05, + "loss": 1.5128, + "step": 24471 + }, + { + "epoch": 1.93, + "learning_rate": 8.534330463638749e-05, + "loss": 1.5002, + "step": 24472 + }, + { + "epoch": 1.93, + "learning_rate": 8.533215230572263e-05, + "loss": 1.475, + "step": 24473 + }, + { + "epoch": 1.93, + "learning_rate": 8.532100041411683e-05, + "loss": 1.4912, + "step": 24474 + }, + { + "epoch": 1.93, + "learning_rate": 8.530984896164573e-05, + "loss": 1.526, + "step": 24475 + }, + { + "epoch": 1.93, + "learning_rate": 8.5298697948385e-05, + "loss": 1.4937, + "step": 24476 + }, + { + "epoch": 1.93, + "learning_rate": 8.528754737441047e-05, + "loss": 1.5134, + "step": 24477 + }, + { + "epoch": 1.93, + "learning_rate": 8.527639723979773e-05, + "loss": 1.4982, + "step": 24478 + }, + { + "epoch": 1.93, + "learning_rate": 8.526524754462257e-05, + "loss": 1.502, + "step": 24479 + }, + { + "epoch": 1.93, + "learning_rate": 8.525409828896061e-05, + "loss": 1.5067, + "step": 24480 + }, + { + "epoch": 1.93, + "learning_rate": 8.524294947288765e-05, + "loss": 1.4666, + "step": 24481 + }, + { + "epoch": 1.93, + "learning_rate": 8.523180109647932e-05, + "loss": 1.5086, + "step": 24482 + }, + { + "epoch": 1.93, + "learning_rate": 8.522065315981127e-05, + "loss": 1.5035, + "step": 24483 + }, + { + "epoch": 1.93, + "learning_rate": 8.52095056629593e-05, + "loss": 1.4904, + "step": 24484 + }, + { + "epoch": 1.93, + "learning_rate": 8.519835860599903e-05, + "loss": 1.4743, + "step": 24485 + }, + { + "epoch": 1.93, + "learning_rate": 8.518721198900608e-05, + "loss": 1.5155, + "step": 24486 + }, + { + "epoch": 1.93, + "learning_rate": 8.517606581205624e-05, + "loss": 1.5025, + "step": 24487 + }, + { + "epoch": 1.93, + "learning_rate": 8.516492007522517e-05, + "loss": 1.5239, + "step": 24488 + }, + { + "epoch": 1.93, + "learning_rate": 8.515377477858844e-05, + "loss": 1.4433, + "step": 24489 + }, + { + "epoch": 1.93, + "learning_rate": 8.514262992222185e-05, + "loss": 1.4885, + "step": 24490 + }, + { + "epoch": 1.93, + "learning_rate": 8.513148550620102e-05, + "loss": 1.464, + "step": 24491 + }, + { + "epoch": 1.93, + "learning_rate": 8.512034153060161e-05, + "loss": 1.4675, + "step": 24492 + }, + { + "epoch": 1.93, + "learning_rate": 8.51091979954992e-05, + "loss": 1.4353, + "step": 24493 + }, + { + "epoch": 1.93, + "learning_rate": 8.509805490096953e-05, + "loss": 1.4863, + "step": 24494 + }, + { + "epoch": 1.93, + "learning_rate": 8.508691224708833e-05, + "loss": 1.4849, + "step": 24495 + }, + { + "epoch": 1.93, + "learning_rate": 8.507577003393117e-05, + "loss": 1.4707, + "step": 24496 + }, + { + "epoch": 1.93, + "learning_rate": 8.506462826157362e-05, + "loss": 1.492, + "step": 24497 + }, + { + "epoch": 1.93, + "learning_rate": 8.505348693009149e-05, + "loss": 1.4896, + "step": 24498 + }, + { + "epoch": 1.93, + "learning_rate": 8.504234603956034e-05, + "loss": 1.5383, + "step": 24499 + }, + { + "epoch": 1.93, + "learning_rate": 8.503120559005574e-05, + "loss": 1.4668, + "step": 24500 + }, + { + "epoch": 1.93, + "learning_rate": 8.502006558165347e-05, + "loss": 1.4953, + "step": 24501 + }, + { + "epoch": 1.93, + "learning_rate": 8.500892601442911e-05, + "loss": 1.5142, + "step": 24502 + }, + { + "epoch": 1.93, + "learning_rate": 8.49977868884582e-05, + "loss": 1.4841, + "step": 24503 + }, + { + "epoch": 1.93, + "learning_rate": 8.49866482038165e-05, + "loss": 1.4614, + "step": 24504 + }, + { + "epoch": 1.93, + "learning_rate": 8.497550996057959e-05, + "loss": 1.461, + "step": 24505 + }, + { + "epoch": 1.93, + "learning_rate": 8.496437215882304e-05, + "loss": 1.4719, + "step": 24506 + }, + { + "epoch": 1.93, + "learning_rate": 8.495323479862256e-05, + "loss": 1.4903, + "step": 24507 + }, + { + "epoch": 1.93, + "learning_rate": 8.49420978800537e-05, + "loss": 1.499, + "step": 24508 + }, + { + "epoch": 1.93, + "learning_rate": 8.493096140319213e-05, + "loss": 1.4909, + "step": 24509 + }, + { + "epoch": 1.93, + "learning_rate": 8.491982536811328e-05, + "loss": 1.5116, + "step": 24510 + }, + { + "epoch": 1.93, + "learning_rate": 8.490868977489303e-05, + "loss": 1.456, + "step": 24511 + }, + { + "epoch": 1.93, + "learning_rate": 8.489755462360686e-05, + "loss": 1.4749, + "step": 24512 + }, + { + "epoch": 1.93, + "learning_rate": 8.488641991433034e-05, + "loss": 1.472, + "step": 24513 + }, + { + "epoch": 1.93, + "learning_rate": 8.487528564713908e-05, + "loss": 1.4975, + "step": 24514 + }, + { + "epoch": 1.93, + "learning_rate": 8.486415182210871e-05, + "loss": 1.4654, + "step": 24515 + }, + { + "epoch": 1.93, + "learning_rate": 8.485301843931484e-05, + "loss": 1.4562, + "step": 24516 + }, + { + "epoch": 1.93, + "learning_rate": 8.484188549883295e-05, + "loss": 1.5077, + "step": 24517 + }, + { + "epoch": 1.93, + "learning_rate": 8.483075300073876e-05, + "loss": 1.412, + "step": 24518 + }, + { + "epoch": 1.93, + "learning_rate": 8.481962094510778e-05, + "loss": 1.5125, + "step": 24519 + }, + { + "epoch": 1.93, + "learning_rate": 8.480848933201557e-05, + "loss": 1.4663, + "step": 24520 + }, + { + "epoch": 1.93, + "learning_rate": 8.479735816153779e-05, + "loss": 1.5914, + "step": 24521 + }, + { + "epoch": 1.93, + "learning_rate": 8.478622743374996e-05, + "loss": 1.4844, + "step": 24522 + }, + { + "epoch": 1.93, + "learning_rate": 8.477509714872761e-05, + "loss": 1.5142, + "step": 24523 + }, + { + "epoch": 1.93, + "learning_rate": 8.47639673065464e-05, + "loss": 1.4877, + "step": 24524 + }, + { + "epoch": 1.93, + "learning_rate": 8.475283790728178e-05, + "loss": 1.4603, + "step": 24525 + }, + { + "epoch": 1.93, + "learning_rate": 8.474170895100949e-05, + "loss": 1.5629, + "step": 24526 + }, + { + "epoch": 1.93, + "learning_rate": 8.473058043780489e-05, + "loss": 1.5086, + "step": 24527 + }, + { + "epoch": 1.93, + "learning_rate": 8.47194523677437e-05, + "loss": 1.4801, + "step": 24528 + }, + { + "epoch": 1.93, + "learning_rate": 8.470832474090141e-05, + "loss": 1.4893, + "step": 24529 + }, + { + "epoch": 1.93, + "learning_rate": 8.469719755735348e-05, + "loss": 1.4938, + "step": 24530 + }, + { + "epoch": 1.93, + "learning_rate": 8.468607081717562e-05, + "loss": 1.4954, + "step": 24531 + }, + { + "epoch": 1.93, + "learning_rate": 8.46749445204433e-05, + "loss": 1.5123, + "step": 24532 + }, + { + "epoch": 1.93, + "learning_rate": 8.466381866723205e-05, + "loss": 1.52, + "step": 24533 + }, + { + "epoch": 1.93, + "learning_rate": 8.465269325761736e-05, + "loss": 1.4975, + "step": 24534 + }, + { + "epoch": 1.93, + "learning_rate": 8.464156829167487e-05, + "loss": 1.4705, + "step": 24535 + }, + { + "epoch": 1.93, + "learning_rate": 8.463044376948006e-05, + "loss": 1.4506, + "step": 24536 + }, + { + "epoch": 1.93, + "learning_rate": 8.461931969110842e-05, + "loss": 1.3977, + "step": 24537 + }, + { + "epoch": 1.93, + "learning_rate": 8.460819605663558e-05, + "loss": 1.4798, + "step": 24538 + }, + { + "epoch": 1.93, + "learning_rate": 8.459707286613701e-05, + "loss": 1.4787, + "step": 24539 + }, + { + "epoch": 1.93, + "learning_rate": 8.458595011968813e-05, + "loss": 1.4565, + "step": 24540 + }, + { + "epoch": 1.93, + "learning_rate": 8.457482781736458e-05, + "loss": 1.4901, + "step": 24541 + }, + { + "epoch": 1.93, + "learning_rate": 8.45637059592419e-05, + "loss": 1.529, + "step": 24542 + }, + { + "epoch": 1.93, + "learning_rate": 8.455258454539553e-05, + "loss": 1.4855, + "step": 24543 + }, + { + "epoch": 1.93, + "learning_rate": 8.454146357590095e-05, + "loss": 1.4821, + "step": 24544 + }, + { + "epoch": 1.93, + "learning_rate": 8.453034305083374e-05, + "loss": 1.499, + "step": 24545 + }, + { + "epoch": 1.93, + "learning_rate": 8.451922297026941e-05, + "loss": 1.4936, + "step": 24546 + }, + { + "epoch": 1.93, + "learning_rate": 8.450810333428335e-05, + "loss": 1.4394, + "step": 24547 + }, + { + "epoch": 1.93, + "learning_rate": 8.449698414295119e-05, + "loss": 1.5055, + "step": 24548 + }, + { + "epoch": 1.93, + "learning_rate": 8.448586539634833e-05, + "loss": 1.512, + "step": 24549 + }, + { + "epoch": 1.93, + "learning_rate": 8.447474709455032e-05, + "loss": 1.4699, + "step": 24550 + }, + { + "epoch": 1.93, + "learning_rate": 8.446362923763255e-05, + "loss": 1.4795, + "step": 24551 + }, + { + "epoch": 1.93, + "learning_rate": 8.445251182567063e-05, + "loss": 1.4733, + "step": 24552 + }, + { + "epoch": 1.93, + "learning_rate": 8.444139485874e-05, + "loss": 1.4559, + "step": 24553 + }, + { + "epoch": 1.93, + "learning_rate": 8.443027833691603e-05, + "loss": 1.4838, + "step": 24554 + }, + { + "epoch": 1.93, + "learning_rate": 8.441916226027437e-05, + "loss": 1.4793, + "step": 24555 + }, + { + "epoch": 1.93, + "learning_rate": 8.440804662889039e-05, + "loss": 1.4772, + "step": 24556 + }, + { + "epoch": 1.93, + "learning_rate": 8.439693144283952e-05, + "loss": 1.463, + "step": 24557 + }, + { + "epoch": 1.93, + "learning_rate": 8.43858167021973e-05, + "loss": 1.4683, + "step": 24558 + }, + { + "epoch": 1.93, + "learning_rate": 8.437470240703922e-05, + "loss": 1.4572, + "step": 24559 + }, + { + "epoch": 1.93, + "learning_rate": 8.43635885574407e-05, + "loss": 1.4492, + "step": 24560 + }, + { + "epoch": 1.93, + "learning_rate": 8.435247515347712e-05, + "loss": 1.4399, + "step": 24561 + }, + { + "epoch": 1.93, + "learning_rate": 8.434136219522409e-05, + "loss": 1.4708, + "step": 24562 + }, + { + "epoch": 1.93, + "learning_rate": 8.433024968275697e-05, + "loss": 1.4803, + "step": 24563 + }, + { + "epoch": 1.93, + "learning_rate": 8.431913761615113e-05, + "loss": 1.4835, + "step": 24564 + }, + { + "epoch": 1.93, + "learning_rate": 8.430802599548218e-05, + "loss": 1.494, + "step": 24565 + }, + { + "epoch": 1.93, + "learning_rate": 8.42969148208255e-05, + "loss": 1.4551, + "step": 24566 + }, + { + "epoch": 1.93, + "learning_rate": 8.428580409225648e-05, + "loss": 1.5268, + "step": 24567 + }, + { + "epoch": 1.93, + "learning_rate": 8.427469380985054e-05, + "loss": 1.4841, + "step": 24568 + }, + { + "epoch": 1.93, + "learning_rate": 8.426358397368322e-05, + "loss": 1.4949, + "step": 24569 + }, + { + "epoch": 1.93, + "learning_rate": 8.425247458382988e-05, + "loss": 1.5569, + "step": 24570 + }, + { + "epoch": 1.93, + "learning_rate": 8.42413656403659e-05, + "loss": 1.497, + "step": 24571 + }, + { + "epoch": 1.93, + "learning_rate": 8.423025714336677e-05, + "loss": 1.5112, + "step": 24572 + }, + { + "epoch": 1.93, + "learning_rate": 8.421914909290794e-05, + "loss": 1.4912, + "step": 24573 + }, + { + "epoch": 1.93, + "learning_rate": 8.420804148906479e-05, + "loss": 1.4912, + "step": 24574 + }, + { + "epoch": 1.93, + "learning_rate": 8.419693433191269e-05, + "loss": 1.4865, + "step": 24575 + }, + { + "epoch": 1.93, + "learning_rate": 8.418582762152712e-05, + "loss": 1.4507, + "step": 24576 + }, + { + "epoch": 1.93, + "learning_rate": 8.417472135798349e-05, + "loss": 1.467, + "step": 24577 + }, + { + "epoch": 1.93, + "learning_rate": 8.416361554135712e-05, + "loss": 1.4702, + "step": 24578 + }, + { + "epoch": 1.93, + "learning_rate": 8.41525101717235e-05, + "loss": 1.5322, + "step": 24579 + }, + { + "epoch": 1.93, + "learning_rate": 8.414140524915802e-05, + "loss": 1.4698, + "step": 24580 + }, + { + "epoch": 1.93, + "learning_rate": 8.413030077373599e-05, + "loss": 1.4756, + "step": 24581 + }, + { + "epoch": 1.93, + "learning_rate": 8.411919674553292e-05, + "loss": 1.4884, + "step": 24582 + }, + { + "epoch": 1.93, + "learning_rate": 8.410809316462416e-05, + "loss": 1.4701, + "step": 24583 + }, + { + "epoch": 1.93, + "learning_rate": 8.409699003108507e-05, + "loss": 1.5337, + "step": 24584 + }, + { + "epoch": 1.93, + "learning_rate": 8.408588734499102e-05, + "loss": 1.4231, + "step": 24585 + }, + { + "epoch": 1.93, + "learning_rate": 8.407478510641744e-05, + "loss": 1.5133, + "step": 24586 + }, + { + "epoch": 1.93, + "learning_rate": 8.406368331543971e-05, + "loss": 1.4489, + "step": 24587 + }, + { + "epoch": 1.93, + "learning_rate": 8.405258197213306e-05, + "loss": 1.4733, + "step": 24588 + }, + { + "epoch": 1.93, + "learning_rate": 8.404148107657311e-05, + "loss": 1.5271, + "step": 24589 + }, + { + "epoch": 1.93, + "learning_rate": 8.403038062883511e-05, + "loss": 1.5109, + "step": 24590 + }, + { + "epoch": 1.93, + "learning_rate": 8.401928062899442e-05, + "loss": 1.4761, + "step": 24591 + }, + { + "epoch": 1.93, + "learning_rate": 8.400818107712633e-05, + "loss": 1.4621, + "step": 24592 + }, + { + "epoch": 1.94, + "learning_rate": 8.399708197330635e-05, + "loss": 1.4828, + "step": 24593 + }, + { + "epoch": 1.94, + "learning_rate": 8.398598331760974e-05, + "loss": 1.5569, + "step": 24594 + }, + { + "epoch": 1.94, + "learning_rate": 8.397488511011184e-05, + "loss": 1.4669, + "step": 24595 + }, + { + "epoch": 1.94, + "learning_rate": 8.396378735088806e-05, + "loss": 1.4675, + "step": 24596 + }, + { + "epoch": 1.94, + "learning_rate": 8.395269004001375e-05, + "loss": 1.4428, + "step": 24597 + }, + { + "epoch": 1.94, + "learning_rate": 8.394159317756414e-05, + "loss": 1.4379, + "step": 24598 + }, + { + "epoch": 1.94, + "learning_rate": 8.393049676361476e-05, + "loss": 1.4338, + "step": 24599 + }, + { + "epoch": 1.94, + "learning_rate": 8.39194007982408e-05, + "loss": 1.4989, + "step": 24600 + }, + { + "epoch": 1.94, + "learning_rate": 8.390830528151759e-05, + "loss": 1.5298, + "step": 24601 + }, + { + "epoch": 1.94, + "learning_rate": 8.389721021352062e-05, + "loss": 1.5006, + "step": 24602 + }, + { + "epoch": 1.94, + "learning_rate": 8.388611559432506e-05, + "loss": 1.4844, + "step": 24603 + }, + { + "epoch": 1.94, + "learning_rate": 8.387502142400625e-05, + "loss": 1.4804, + "step": 24604 + }, + { + "epoch": 1.94, + "learning_rate": 8.386392770263958e-05, + "loss": 1.4562, + "step": 24605 + }, + { + "epoch": 1.94, + "learning_rate": 8.385283443030036e-05, + "loss": 1.5214, + "step": 24606 + }, + { + "epoch": 1.94, + "learning_rate": 8.384174160706391e-05, + "loss": 1.4607, + "step": 24607 + }, + { + "epoch": 1.94, + "learning_rate": 8.383064923300555e-05, + "loss": 1.5175, + "step": 24608 + }, + { + "epoch": 1.94, + "learning_rate": 8.381955730820048e-05, + "loss": 1.4732, + "step": 24609 + }, + { + "epoch": 1.94, + "learning_rate": 8.380846583272416e-05, + "loss": 1.521, + "step": 24610 + }, + { + "epoch": 1.94, + "learning_rate": 8.379737480665182e-05, + "loss": 1.4893, + "step": 24611 + }, + { + "epoch": 1.94, + "learning_rate": 8.378628423005872e-05, + "loss": 1.4692, + "step": 24612 + }, + { + "epoch": 1.94, + "learning_rate": 8.377519410302027e-05, + "loss": 1.5134, + "step": 24613 + }, + { + "epoch": 1.94, + "learning_rate": 8.37641044256117e-05, + "loss": 1.4698, + "step": 24614 + }, + { + "epoch": 1.94, + "learning_rate": 8.375301519790825e-05, + "loss": 1.4911, + "step": 24615 + }, + { + "epoch": 1.94, + "learning_rate": 8.374192641998533e-05, + "loss": 1.4516, + "step": 24616 + }, + { + "epoch": 1.94, + "learning_rate": 8.373083809191818e-05, + "loss": 1.5276, + "step": 24617 + }, + { + "epoch": 1.94, + "learning_rate": 8.371975021378198e-05, + "loss": 1.4931, + "step": 24618 + }, + { + "epoch": 1.94, + "learning_rate": 8.37086627856522e-05, + "loss": 1.431, + "step": 24619 + }, + { + "epoch": 1.94, + "learning_rate": 8.369757580760393e-05, + "loss": 1.5126, + "step": 24620 + }, + { + "epoch": 1.94, + "learning_rate": 8.368648927971258e-05, + "loss": 1.4654, + "step": 24621 + }, + { + "epoch": 1.94, + "learning_rate": 8.367540320205334e-05, + "loss": 1.5655, + "step": 24622 + }, + { + "epoch": 1.94, + "learning_rate": 8.366431757470157e-05, + "loss": 1.5196, + "step": 24623 + }, + { + "epoch": 1.94, + "learning_rate": 8.365323239773245e-05, + "loss": 1.4472, + "step": 24624 + }, + { + "epoch": 1.94, + "learning_rate": 8.36421476712213e-05, + "loss": 1.5191, + "step": 24625 + }, + { + "epoch": 1.94, + "learning_rate": 8.363106339524326e-05, + "loss": 1.4978, + "step": 24626 + }, + { + "epoch": 1.94, + "learning_rate": 8.361997956987376e-05, + "loss": 1.5089, + "step": 24627 + }, + { + "epoch": 1.94, + "learning_rate": 8.360889619518796e-05, + "loss": 1.5283, + "step": 24628 + }, + { + "epoch": 1.94, + "learning_rate": 8.359781327126104e-05, + "loss": 1.4427, + "step": 24629 + }, + { + "epoch": 1.94, + "learning_rate": 8.35867307981684e-05, + "loss": 1.5161, + "step": 24630 + }, + { + "epoch": 1.94, + "learning_rate": 8.357564877598522e-05, + "loss": 1.4508, + "step": 24631 + }, + { + "epoch": 1.94, + "learning_rate": 8.356456720478665e-05, + "loss": 1.5265, + "step": 24632 + }, + { + "epoch": 1.94, + "learning_rate": 8.355348608464807e-05, + "loss": 1.5449, + "step": 24633 + }, + { + "epoch": 1.94, + "learning_rate": 8.354240541564464e-05, + "loss": 1.4073, + "step": 24634 + }, + { + "epoch": 1.94, + "learning_rate": 8.353132519785155e-05, + "loss": 1.5154, + "step": 24635 + }, + { + "epoch": 1.94, + "learning_rate": 8.35202454313441e-05, + "loss": 1.5087, + "step": 24636 + }, + { + "epoch": 1.94, + "learning_rate": 8.350916611619753e-05, + "loss": 1.5139, + "step": 24637 + }, + { + "epoch": 1.94, + "learning_rate": 8.349808725248705e-05, + "loss": 1.43, + "step": 24638 + }, + { + "epoch": 1.94, + "learning_rate": 8.348700884028779e-05, + "loss": 1.4967, + "step": 24639 + }, + { + "epoch": 1.94, + "learning_rate": 8.34759308796751e-05, + "loss": 1.4859, + "step": 24640 + }, + { + "epoch": 1.94, + "learning_rate": 8.34648533707241e-05, + "loss": 1.4615, + "step": 24641 + }, + { + "epoch": 1.94, + "learning_rate": 8.345377631351e-05, + "loss": 1.5272, + "step": 24642 + }, + { + "epoch": 1.94, + "learning_rate": 8.34426997081081e-05, + "loss": 1.426, + "step": 24643 + }, + { + "epoch": 1.94, + "learning_rate": 8.343162355459353e-05, + "loss": 1.508, + "step": 24644 + }, + { + "epoch": 1.94, + "learning_rate": 8.34205478530415e-05, + "loss": 1.4745, + "step": 24645 + }, + { + "epoch": 1.94, + "learning_rate": 8.340947260352714e-05, + "loss": 1.501, + "step": 24646 + }, + { + "epoch": 1.94, + "learning_rate": 8.339839780612577e-05, + "loss": 1.5126, + "step": 24647 + }, + { + "epoch": 1.94, + "learning_rate": 8.338732346091253e-05, + "loss": 1.5188, + "step": 24648 + }, + { + "epoch": 1.94, + "learning_rate": 8.337624956796258e-05, + "loss": 1.4789, + "step": 24649 + }, + { + "epoch": 1.94, + "learning_rate": 8.336517612735115e-05, + "loss": 1.4718, + "step": 24650 + }, + { + "epoch": 1.94, + "learning_rate": 8.335410313915335e-05, + "loss": 1.4366, + "step": 24651 + }, + { + "epoch": 1.94, + "learning_rate": 8.334303060344447e-05, + "loss": 1.4403, + "step": 24652 + }, + { + "epoch": 1.94, + "learning_rate": 8.333195852029957e-05, + "loss": 1.4752, + "step": 24653 + }, + { + "epoch": 1.94, + "learning_rate": 8.332088688979393e-05, + "loss": 1.4804, + "step": 24654 + }, + { + "epoch": 1.94, + "learning_rate": 8.330981571200268e-05, + "loss": 1.5492, + "step": 24655 + }, + { + "epoch": 1.94, + "learning_rate": 8.329874498700092e-05, + "loss": 1.4849, + "step": 24656 + }, + { + "epoch": 1.94, + "learning_rate": 8.328767471486394e-05, + "loss": 1.4908, + "step": 24657 + }, + { + "epoch": 1.94, + "learning_rate": 8.327660489566682e-05, + "loss": 1.4579, + "step": 24658 + }, + { + "epoch": 1.94, + "learning_rate": 8.326553552948469e-05, + "loss": 1.4746, + "step": 24659 + }, + { + "epoch": 1.94, + "learning_rate": 8.32544666163928e-05, + "loss": 1.5145, + "step": 24660 + }, + { + "epoch": 1.94, + "learning_rate": 8.324339815646623e-05, + "loss": 1.4774, + "step": 24661 + }, + { + "epoch": 1.94, + "learning_rate": 8.323233014978017e-05, + "loss": 1.4864, + "step": 24662 + }, + { + "epoch": 1.94, + "learning_rate": 8.322126259640967e-05, + "loss": 1.5234, + "step": 24663 + }, + { + "epoch": 1.94, + "learning_rate": 8.321019549643001e-05, + "loss": 1.5105, + "step": 24664 + }, + { + "epoch": 1.94, + "learning_rate": 8.319912884991627e-05, + "loss": 1.4761, + "step": 24665 + }, + { + "epoch": 1.94, + "learning_rate": 8.318806265694351e-05, + "loss": 1.4973, + "step": 24666 + }, + { + "epoch": 1.94, + "learning_rate": 8.317699691758695e-05, + "loss": 1.5222, + "step": 24667 + }, + { + "epoch": 1.94, + "learning_rate": 8.316593163192175e-05, + "loss": 1.4805, + "step": 24668 + }, + { + "epoch": 1.94, + "learning_rate": 8.315486680002299e-05, + "loss": 1.4751, + "step": 24669 + }, + { + "epoch": 1.94, + "learning_rate": 8.314380242196576e-05, + "loss": 1.4896, + "step": 24670 + }, + { + "epoch": 1.94, + "learning_rate": 8.313273849782525e-05, + "loss": 1.452, + "step": 24671 + }, + { + "epoch": 1.94, + "learning_rate": 8.312167502767656e-05, + "loss": 1.4394, + "step": 24672 + }, + { + "epoch": 1.94, + "learning_rate": 8.311061201159473e-05, + "loss": 1.4811, + "step": 24673 + }, + { + "epoch": 1.94, + "learning_rate": 8.309954944965499e-05, + "loss": 1.4447, + "step": 24674 + }, + { + "epoch": 1.94, + "learning_rate": 8.308848734193238e-05, + "loss": 1.4867, + "step": 24675 + }, + { + "epoch": 1.94, + "learning_rate": 8.307742568850196e-05, + "loss": 1.4764, + "step": 24676 + }, + { + "epoch": 1.94, + "learning_rate": 8.306636448943896e-05, + "loss": 1.5224, + "step": 24677 + }, + { + "epoch": 1.94, + "learning_rate": 8.30553037448184e-05, + "loss": 1.5034, + "step": 24678 + }, + { + "epoch": 1.94, + "learning_rate": 8.304424345471539e-05, + "loss": 1.5122, + "step": 24679 + }, + { + "epoch": 1.94, + "learning_rate": 8.303318361920495e-05, + "loss": 1.4684, + "step": 24680 + }, + { + "epoch": 1.94, + "learning_rate": 8.30221242383623e-05, + "loss": 1.5178, + "step": 24681 + }, + { + "epoch": 1.94, + "learning_rate": 8.301106531226242e-05, + "loss": 1.4731, + "step": 24682 + }, + { + "epoch": 1.94, + "learning_rate": 8.300000684098047e-05, + "loss": 1.5086, + "step": 24683 + }, + { + "epoch": 1.94, + "learning_rate": 8.298894882459146e-05, + "loss": 1.4167, + "step": 24684 + }, + { + "epoch": 1.94, + "learning_rate": 8.297789126317055e-05, + "loss": 1.4997, + "step": 24685 + }, + { + "epoch": 1.94, + "learning_rate": 8.29668341567928e-05, + "loss": 1.5192, + "step": 24686 + }, + { + "epoch": 1.94, + "learning_rate": 8.295577750553318e-05, + "loss": 1.4342, + "step": 24687 + }, + { + "epoch": 1.94, + "learning_rate": 8.29447213094669e-05, + "loss": 1.4956, + "step": 24688 + }, + { + "epoch": 1.94, + "learning_rate": 8.293366556866894e-05, + "loss": 1.4549, + "step": 24689 + }, + { + "epoch": 1.94, + "learning_rate": 8.292261028321433e-05, + "loss": 1.4558, + "step": 24690 + }, + { + "epoch": 1.94, + "learning_rate": 8.291155545317825e-05, + "loss": 1.5062, + "step": 24691 + }, + { + "epoch": 1.94, + "learning_rate": 8.290050107863568e-05, + "loss": 1.4312, + "step": 24692 + }, + { + "epoch": 1.94, + "learning_rate": 8.288944715966162e-05, + "loss": 1.5185, + "step": 24693 + }, + { + "epoch": 1.94, + "learning_rate": 8.287839369633121e-05, + "loss": 1.4898, + "step": 24694 + }, + { + "epoch": 1.94, + "learning_rate": 8.286734068871951e-05, + "loss": 1.4675, + "step": 24695 + }, + { + "epoch": 1.94, + "learning_rate": 8.285628813690144e-05, + "loss": 1.5362, + "step": 24696 + }, + { + "epoch": 1.94, + "learning_rate": 8.284523604095218e-05, + "loss": 1.4953, + "step": 24697 + }, + { + "epoch": 1.94, + "learning_rate": 8.283418440094663e-05, + "loss": 1.5193, + "step": 24698 + }, + { + "epoch": 1.94, + "learning_rate": 8.282313321696e-05, + "loss": 1.5529, + "step": 24699 + }, + { + "epoch": 1.94, + "learning_rate": 8.281208248906715e-05, + "loss": 1.4971, + "step": 24700 + }, + { + "epoch": 1.94, + "learning_rate": 8.280103221734324e-05, + "loss": 1.4502, + "step": 24701 + }, + { + "epoch": 1.94, + "learning_rate": 8.278998240186322e-05, + "loss": 1.4745, + "step": 24702 + }, + { + "epoch": 1.94, + "learning_rate": 8.277893304270215e-05, + "loss": 1.4998, + "step": 24703 + }, + { + "epoch": 1.94, + "learning_rate": 8.276788413993499e-05, + "loss": 1.4461, + "step": 24704 + }, + { + "epoch": 1.94, + "learning_rate": 8.27568356936368e-05, + "loss": 1.5116, + "step": 24705 + }, + { + "epoch": 1.94, + "learning_rate": 8.274578770388263e-05, + "loss": 1.4892, + "step": 24706 + }, + { + "epoch": 1.94, + "learning_rate": 8.273474017074738e-05, + "loss": 1.5141, + "step": 24707 + }, + { + "epoch": 1.94, + "learning_rate": 8.272369309430618e-05, + "loss": 1.4426, + "step": 24708 + }, + { + "epoch": 1.94, + "learning_rate": 8.271264647463399e-05, + "loss": 1.459, + "step": 24709 + }, + { + "epoch": 1.94, + "learning_rate": 8.270160031180571e-05, + "loss": 1.4993, + "step": 24710 + }, + { + "epoch": 1.94, + "learning_rate": 8.269055460589652e-05, + "loss": 1.456, + "step": 24711 + }, + { + "epoch": 1.94, + "learning_rate": 8.26795093569813e-05, + "loss": 1.4784, + "step": 24712 + }, + { + "epoch": 1.94, + "learning_rate": 8.266846456513499e-05, + "loss": 1.4794, + "step": 24713 + }, + { + "epoch": 1.94, + "learning_rate": 8.265742023043266e-05, + "loss": 1.4085, + "step": 24714 + }, + { + "epoch": 1.94, + "learning_rate": 8.264637635294936e-05, + "loss": 1.4605, + "step": 24715 + }, + { + "epoch": 1.94, + "learning_rate": 8.263533293275999e-05, + "loss": 1.4929, + "step": 24716 + }, + { + "epoch": 1.94, + "learning_rate": 8.262428996993944e-05, + "loss": 1.5038, + "step": 24717 + }, + { + "epoch": 1.94, + "learning_rate": 8.261324746456288e-05, + "loss": 1.5064, + "step": 24718 + }, + { + "epoch": 1.94, + "learning_rate": 8.260220541670516e-05, + "loss": 1.5084, + "step": 24719 + }, + { + "epoch": 1.95, + "learning_rate": 8.259116382644127e-05, + "loss": 1.5164, + "step": 24720 + }, + { + "epoch": 1.95, + "learning_rate": 8.258012269384614e-05, + "loss": 1.4367, + "step": 24721 + }, + { + "epoch": 1.95, + "learning_rate": 8.256908201899481e-05, + "loss": 1.4902, + "step": 24722 + }, + { + "epoch": 1.95, + "learning_rate": 8.255804180196222e-05, + "loss": 1.516, + "step": 24723 + }, + { + "epoch": 1.95, + "learning_rate": 8.254700204282325e-05, + "loss": 1.4842, + "step": 24724 + }, + { + "epoch": 1.95, + "learning_rate": 8.253596274165295e-05, + "loss": 1.4824, + "step": 24725 + }, + { + "epoch": 1.95, + "learning_rate": 8.252492389852626e-05, + "loss": 1.4827, + "step": 24726 + }, + { + "epoch": 1.95, + "learning_rate": 8.251388551351804e-05, + "loss": 1.4663, + "step": 24727 + }, + { + "epoch": 1.95, + "learning_rate": 8.250284758670334e-05, + "loss": 1.5492, + "step": 24728 + }, + { + "epoch": 1.95, + "learning_rate": 8.249181011815705e-05, + "loss": 1.4963, + "step": 24729 + }, + { + "epoch": 1.95, + "learning_rate": 8.248077310795406e-05, + "loss": 1.503, + "step": 24730 + }, + { + "epoch": 1.95, + "learning_rate": 8.246973655616937e-05, + "loss": 1.4848, + "step": 24731 + }, + { + "epoch": 1.95, + "learning_rate": 8.245870046287796e-05, + "loss": 1.4653, + "step": 24732 + }, + { + "epoch": 1.95, + "learning_rate": 8.244766482815469e-05, + "loss": 1.4725, + "step": 24733 + }, + { + "epoch": 1.95, + "learning_rate": 8.243662965207447e-05, + "loss": 1.5281, + "step": 24734 + }, + { + "epoch": 1.95, + "learning_rate": 8.242559493471226e-05, + "loss": 1.5073, + "step": 24735 + }, + { + "epoch": 1.95, + "learning_rate": 8.241456067614302e-05, + "loss": 1.4896, + "step": 24736 + }, + { + "epoch": 1.95, + "learning_rate": 8.240352687644157e-05, + "loss": 1.4791, + "step": 24737 + }, + { + "epoch": 1.95, + "learning_rate": 8.239249353568284e-05, + "loss": 1.5123, + "step": 24738 + }, + { + "epoch": 1.95, + "learning_rate": 8.238146065394181e-05, + "loss": 1.5267, + "step": 24739 + }, + { + "epoch": 1.95, + "learning_rate": 8.237042823129337e-05, + "loss": 1.4647, + "step": 24740 + }, + { + "epoch": 1.95, + "learning_rate": 8.235939626781233e-05, + "loss": 1.5042, + "step": 24741 + }, + { + "epoch": 1.95, + "learning_rate": 8.234836476357372e-05, + "loss": 1.4953, + "step": 24742 + }, + { + "epoch": 1.95, + "learning_rate": 8.23373337186524e-05, + "loss": 1.5021, + "step": 24743 + }, + { + "epoch": 1.95, + "learning_rate": 8.232630313312316e-05, + "loss": 1.4386, + "step": 24744 + }, + { + "epoch": 1.95, + "learning_rate": 8.231527300706098e-05, + "loss": 1.4448, + "step": 24745 + }, + { + "epoch": 1.95, + "learning_rate": 8.23042433405408e-05, + "loss": 1.5312, + "step": 24746 + }, + { + "epoch": 1.95, + "learning_rate": 8.229321413363746e-05, + "loss": 1.4863, + "step": 24747 + }, + { + "epoch": 1.95, + "learning_rate": 8.228218538642578e-05, + "loss": 1.4751, + "step": 24748 + }, + { + "epoch": 1.95, + "learning_rate": 8.227115709898076e-05, + "loss": 1.4852, + "step": 24749 + }, + { + "epoch": 1.95, + "learning_rate": 8.226012927137716e-05, + "loss": 1.4725, + "step": 24750 + }, + { + "epoch": 1.95, + "learning_rate": 8.224910190368988e-05, + "loss": 1.4664, + "step": 24751 + }, + { + "epoch": 1.95, + "learning_rate": 8.223807499599387e-05, + "loss": 1.5074, + "step": 24752 + }, + { + "epoch": 1.95, + "learning_rate": 8.222704854836392e-05, + "loss": 1.462, + "step": 24753 + }, + { + "epoch": 1.95, + "learning_rate": 8.221602256087487e-05, + "loss": 1.509, + "step": 24754 + }, + { + "epoch": 1.95, + "learning_rate": 8.220499703360165e-05, + "loss": 1.4378, + "step": 24755 + }, + { + "epoch": 1.95, + "learning_rate": 8.21939719666191e-05, + "loss": 1.506, + "step": 24756 + }, + { + "epoch": 1.95, + "learning_rate": 8.218294736000207e-05, + "loss": 1.5219, + "step": 24757 + }, + { + "epoch": 1.95, + "learning_rate": 8.217192321382536e-05, + "loss": 1.4759, + "step": 24758 + }, + { + "epoch": 1.95, + "learning_rate": 8.21608995281639e-05, + "loss": 1.5087, + "step": 24759 + }, + { + "epoch": 1.95, + "learning_rate": 8.214987630309248e-05, + "loss": 1.4552, + "step": 24760 + }, + { + "epoch": 1.95, + "learning_rate": 8.213885353868592e-05, + "loss": 1.4799, + "step": 24761 + }, + { + "epoch": 1.95, + "learning_rate": 8.21278312350191e-05, + "loss": 1.4389, + "step": 24762 + }, + { + "epoch": 1.95, + "learning_rate": 8.211680939216691e-05, + "loss": 1.4592, + "step": 24763 + }, + { + "epoch": 1.95, + "learning_rate": 8.21057880102041e-05, + "loss": 1.4935, + "step": 24764 + }, + { + "epoch": 1.95, + "learning_rate": 8.209476708920547e-05, + "loss": 1.4832, + "step": 24765 + }, + { + "epoch": 1.95, + "learning_rate": 8.208374662924596e-05, + "loss": 1.5011, + "step": 24766 + }, + { + "epoch": 1.95, + "learning_rate": 8.207272663040034e-05, + "loss": 1.4857, + "step": 24767 + }, + { + "epoch": 1.95, + "learning_rate": 8.206170709274337e-05, + "loss": 1.4961, + "step": 24768 + }, + { + "epoch": 1.95, + "learning_rate": 8.205068801634994e-05, + "loss": 1.474, + "step": 24769 + }, + { + "epoch": 1.95, + "learning_rate": 8.203966940129487e-05, + "loss": 1.4309, + "step": 24770 + }, + { + "epoch": 1.95, + "learning_rate": 8.202865124765287e-05, + "loss": 1.5028, + "step": 24771 + }, + { + "epoch": 1.95, + "learning_rate": 8.20176335554989e-05, + "loss": 1.498, + "step": 24772 + }, + { + "epoch": 1.95, + "learning_rate": 8.200661632490767e-05, + "loss": 1.5187, + "step": 24773 + }, + { + "epoch": 1.95, + "learning_rate": 8.199559955595397e-05, + "loss": 1.4755, + "step": 24774 + }, + { + "epoch": 1.95, + "learning_rate": 8.19845832487126e-05, + "loss": 1.495, + "step": 24775 + }, + { + "epoch": 1.95, + "learning_rate": 8.197356740325841e-05, + "loss": 1.4728, + "step": 24776 + }, + { + "epoch": 1.95, + "learning_rate": 8.19625520196661e-05, + "loss": 1.5097, + "step": 24777 + }, + { + "epoch": 1.95, + "learning_rate": 8.195153709801059e-05, + "loss": 1.4798, + "step": 24778 + }, + { + "epoch": 1.95, + "learning_rate": 8.194052263836651e-05, + "loss": 1.4704, + "step": 24779 + }, + { + "epoch": 1.95, + "learning_rate": 8.19295086408088e-05, + "loss": 1.4801, + "step": 24780 + }, + { + "epoch": 1.95, + "learning_rate": 8.191849510541215e-05, + "loss": 1.4422, + "step": 24781 + }, + { + "epoch": 1.95, + "learning_rate": 8.190748203225129e-05, + "loss": 1.468, + "step": 24782 + }, + { + "epoch": 1.95, + "learning_rate": 8.189646942140113e-05, + "loss": 1.4987, + "step": 24783 + }, + { + "epoch": 1.95, + "learning_rate": 8.188545727293632e-05, + "loss": 1.4856, + "step": 24784 + }, + { + "epoch": 1.95, + "learning_rate": 8.187444558693165e-05, + "loss": 1.4465, + "step": 24785 + }, + { + "epoch": 1.95, + "learning_rate": 8.186343436346192e-05, + "loss": 1.4383, + "step": 24786 + }, + { + "epoch": 1.95, + "learning_rate": 8.185242360260189e-05, + "loss": 1.4398, + "step": 24787 + }, + { + "epoch": 1.95, + "learning_rate": 8.184141330442622e-05, + "loss": 1.4521, + "step": 24788 + }, + { + "epoch": 1.95, + "learning_rate": 8.183040346900984e-05, + "loss": 1.4778, + "step": 24789 + }, + { + "epoch": 1.95, + "learning_rate": 8.181939409642738e-05, + "loss": 1.4978, + "step": 24790 + }, + { + "epoch": 1.95, + "learning_rate": 8.180838518675359e-05, + "loss": 1.5029, + "step": 24791 + }, + { + "epoch": 1.95, + "learning_rate": 8.179737674006314e-05, + "loss": 1.5342, + "step": 24792 + }, + { + "epoch": 1.95, + "learning_rate": 8.178636875643098e-05, + "loss": 1.499, + "step": 24793 + }, + { + "epoch": 1.95, + "learning_rate": 8.177536123593172e-05, + "loss": 1.5218, + "step": 24794 + }, + { + "epoch": 1.95, + "learning_rate": 8.176435417864012e-05, + "loss": 1.4489, + "step": 24795 + }, + { + "epoch": 1.95, + "learning_rate": 8.175334758463082e-05, + "loss": 1.4946, + "step": 24796 + }, + { + "epoch": 1.95, + "learning_rate": 8.174234145397872e-05, + "loss": 1.501, + "step": 24797 + }, + { + "epoch": 1.95, + "learning_rate": 8.173133578675842e-05, + "loss": 1.5398, + "step": 24798 + }, + { + "epoch": 1.95, + "learning_rate": 8.172033058304465e-05, + "loss": 1.5122, + "step": 24799 + }, + { + "epoch": 1.95, + "learning_rate": 8.17093258429122e-05, + "loss": 1.4852, + "step": 24800 + }, + { + "epoch": 1.95, + "learning_rate": 8.169832156643573e-05, + "loss": 1.4959, + "step": 24801 + }, + { + "epoch": 1.95, + "learning_rate": 8.168731775368993e-05, + "loss": 1.499, + "step": 24802 + }, + { + "epoch": 1.95, + "learning_rate": 8.167631440474957e-05, + "loss": 1.4888, + "step": 24803 + }, + { + "epoch": 1.95, + "learning_rate": 8.166531151968936e-05, + "loss": 1.4914, + "step": 24804 + }, + { + "epoch": 1.95, + "learning_rate": 8.16543090985839e-05, + "loss": 1.4974, + "step": 24805 + }, + { + "epoch": 1.95, + "learning_rate": 8.164330714150805e-05, + "loss": 1.4868, + "step": 24806 + }, + { + "epoch": 1.95, + "learning_rate": 8.16323056485364e-05, + "loss": 1.5187, + "step": 24807 + }, + { + "epoch": 1.95, + "learning_rate": 8.16213046197436e-05, + "loss": 1.5439, + "step": 24808 + }, + { + "epoch": 1.95, + "learning_rate": 8.161030405520441e-05, + "loss": 1.4919, + "step": 24809 + }, + { + "epoch": 1.95, + "learning_rate": 8.159930395499357e-05, + "loss": 1.5032, + "step": 24810 + }, + { + "epoch": 1.95, + "learning_rate": 8.158830431918574e-05, + "loss": 1.4903, + "step": 24811 + }, + { + "epoch": 1.95, + "learning_rate": 8.157730514785547e-05, + "loss": 1.5184, + "step": 24812 + }, + { + "epoch": 1.95, + "learning_rate": 8.156630644107762e-05, + "loss": 1.4459, + "step": 24813 + }, + { + "epoch": 1.95, + "learning_rate": 8.155530819892679e-05, + "loss": 1.4975, + "step": 24814 + }, + { + "epoch": 1.95, + "learning_rate": 8.154431042147764e-05, + "loss": 1.4657, + "step": 24815 + }, + { + "epoch": 1.95, + "learning_rate": 8.153331310880477e-05, + "loss": 1.5288, + "step": 24816 + }, + { + "epoch": 1.95, + "learning_rate": 8.152231626098303e-05, + "loss": 1.5515, + "step": 24817 + }, + { + "epoch": 1.95, + "learning_rate": 8.151131987808694e-05, + "loss": 1.4937, + "step": 24818 + }, + { + "epoch": 1.95, + "learning_rate": 8.150032396019111e-05, + "loss": 1.4541, + "step": 24819 + }, + { + "epoch": 1.95, + "learning_rate": 8.148932850737037e-05, + "loss": 1.4667, + "step": 24820 + }, + { + "epoch": 1.95, + "learning_rate": 8.147833351969928e-05, + "loss": 1.5124, + "step": 24821 + }, + { + "epoch": 1.95, + "learning_rate": 8.146733899725243e-05, + "loss": 1.4315, + "step": 24822 + }, + { + "epoch": 1.95, + "learning_rate": 8.145634494010457e-05, + "loss": 1.4396, + "step": 24823 + }, + { + "epoch": 1.95, + "learning_rate": 8.144535134833026e-05, + "loss": 1.481, + "step": 24824 + }, + { + "epoch": 1.95, + "learning_rate": 8.143435822200423e-05, + "loss": 1.463, + "step": 24825 + }, + { + "epoch": 1.95, + "learning_rate": 8.142336556120104e-05, + "loss": 1.4774, + "step": 24826 + }, + { + "epoch": 1.95, + "learning_rate": 8.141237336599539e-05, + "loss": 1.506, + "step": 24827 + }, + { + "epoch": 1.95, + "learning_rate": 8.140138163646188e-05, + "loss": 1.4168, + "step": 24828 + }, + { + "epoch": 1.95, + "learning_rate": 8.139039037267507e-05, + "loss": 1.4765, + "step": 24829 + }, + { + "epoch": 1.95, + "learning_rate": 8.13793995747097e-05, + "loss": 1.4955, + "step": 24830 + }, + { + "epoch": 1.95, + "learning_rate": 8.136840924264036e-05, + "loss": 1.49, + "step": 24831 + }, + { + "epoch": 1.95, + "learning_rate": 8.135741937654163e-05, + "loss": 1.5049, + "step": 24832 + }, + { + "epoch": 1.95, + "learning_rate": 8.134642997648809e-05, + "loss": 1.5028, + "step": 24833 + }, + { + "epoch": 1.95, + "learning_rate": 8.133544104255447e-05, + "loss": 1.504, + "step": 24834 + }, + { + "epoch": 1.95, + "learning_rate": 8.132445257481531e-05, + "loss": 1.4524, + "step": 24835 + }, + { + "epoch": 1.95, + "learning_rate": 8.131346457334514e-05, + "loss": 1.4728, + "step": 24836 + }, + { + "epoch": 1.95, + "learning_rate": 8.130247703821872e-05, + "loss": 1.4982, + "step": 24837 + }, + { + "epoch": 1.95, + "learning_rate": 8.129148996951057e-05, + "loss": 1.4377, + "step": 24838 + }, + { + "epoch": 1.95, + "learning_rate": 8.128050336729521e-05, + "loss": 1.4682, + "step": 24839 + }, + { + "epoch": 1.95, + "learning_rate": 8.126951723164733e-05, + "loss": 1.4707, + "step": 24840 + }, + { + "epoch": 1.95, + "learning_rate": 8.125853156264156e-05, + "loss": 1.4586, + "step": 24841 + }, + { + "epoch": 1.95, + "learning_rate": 8.124754636035242e-05, + "loss": 1.444, + "step": 24842 + }, + { + "epoch": 1.95, + "learning_rate": 8.123656162485443e-05, + "loss": 1.4993, + "step": 24843 + }, + { + "epoch": 1.95, + "learning_rate": 8.12255773562223e-05, + "loss": 1.4362, + "step": 24844 + }, + { + "epoch": 1.95, + "learning_rate": 8.121459355453056e-05, + "loss": 1.4526, + "step": 24845 + }, + { + "epoch": 1.95, + "learning_rate": 8.120361021985371e-05, + "loss": 1.4666, + "step": 24846 + }, + { + "epoch": 1.95, + "learning_rate": 8.119262735226643e-05, + "loss": 1.5049, + "step": 24847 + }, + { + "epoch": 1.96, + "learning_rate": 8.118164495184325e-05, + "loss": 1.4569, + "step": 24848 + }, + { + "epoch": 1.96, + "learning_rate": 8.117066301865872e-05, + "loss": 1.466, + "step": 24849 + }, + { + "epoch": 1.96, + "learning_rate": 8.115968155278735e-05, + "loss": 1.458, + "step": 24850 + }, + { + "epoch": 1.96, + "learning_rate": 8.11487005543038e-05, + "loss": 1.4699, + "step": 24851 + }, + { + "epoch": 1.96, + "learning_rate": 8.11377200232826e-05, + "loss": 1.4838, + "step": 24852 + }, + { + "epoch": 1.96, + "learning_rate": 8.11267399597982e-05, + "loss": 1.5357, + "step": 24853 + }, + { + "epoch": 1.96, + "learning_rate": 8.111576036392528e-05, + "loss": 1.4824, + "step": 24854 + }, + { + "epoch": 1.96, + "learning_rate": 8.110478123573828e-05, + "loss": 1.4863, + "step": 24855 + }, + { + "epoch": 1.96, + "learning_rate": 8.109380257531186e-05, + "loss": 1.4894, + "step": 24856 + }, + { + "epoch": 1.96, + "learning_rate": 8.108282438272046e-05, + "loss": 1.4678, + "step": 24857 + }, + { + "epoch": 1.96, + "learning_rate": 8.107184665803868e-05, + "loss": 1.5087, + "step": 24858 + }, + { + "epoch": 1.96, + "learning_rate": 8.106086940134103e-05, + "loss": 1.5185, + "step": 24859 + }, + { + "epoch": 1.96, + "learning_rate": 8.104989261270198e-05, + "loss": 1.4499, + "step": 24860 + }, + { + "epoch": 1.96, + "learning_rate": 8.103891629219616e-05, + "loss": 1.4939, + "step": 24861 + }, + { + "epoch": 1.96, + "learning_rate": 8.102794043989804e-05, + "loss": 1.4894, + "step": 24862 + }, + { + "epoch": 1.96, + "learning_rate": 8.101696505588209e-05, + "loss": 1.4834, + "step": 24863 + }, + { + "epoch": 1.96, + "learning_rate": 8.100599014022295e-05, + "loss": 1.5038, + "step": 24864 + }, + { + "epoch": 1.96, + "learning_rate": 8.099501569299503e-05, + "loss": 1.523, + "step": 24865 + }, + { + "epoch": 1.96, + "learning_rate": 8.098404171427285e-05, + "loss": 1.4926, + "step": 24866 + }, + { + "epoch": 1.96, + "learning_rate": 8.097306820413098e-05, + "loss": 1.4669, + "step": 24867 + }, + { + "epoch": 1.96, + "learning_rate": 8.096209516264388e-05, + "loss": 1.5244, + "step": 24868 + }, + { + "epoch": 1.96, + "learning_rate": 8.095112258988608e-05, + "loss": 1.515, + "step": 24869 + }, + { + "epoch": 1.96, + "learning_rate": 8.094015048593199e-05, + "loss": 1.4859, + "step": 24870 + }, + { + "epoch": 1.96, + "learning_rate": 8.092917885085615e-05, + "loss": 1.5003, + "step": 24871 + }, + { + "epoch": 1.96, + "learning_rate": 8.091820768473314e-05, + "loss": 1.4707, + "step": 24872 + }, + { + "epoch": 1.96, + "learning_rate": 8.090723698763738e-05, + "loss": 1.4805, + "step": 24873 + }, + { + "epoch": 1.96, + "learning_rate": 8.089626675964326e-05, + "loss": 1.4601, + "step": 24874 + }, + { + "epoch": 1.96, + "learning_rate": 8.088529700082545e-05, + "loss": 1.4812, + "step": 24875 + }, + { + "epoch": 1.96, + "learning_rate": 8.087432771125832e-05, + "loss": 1.4545, + "step": 24876 + }, + { + "epoch": 1.96, + "learning_rate": 8.08633588910163e-05, + "loss": 1.5027, + "step": 24877 + }, + { + "epoch": 1.96, + "learning_rate": 8.085239054017398e-05, + "loss": 1.5181, + "step": 24878 + }, + { + "epoch": 1.96, + "learning_rate": 8.084142265880578e-05, + "loss": 1.5154, + "step": 24879 + }, + { + "epoch": 1.96, + "learning_rate": 8.083045524698607e-05, + "loss": 1.4605, + "step": 24880 + }, + { + "epoch": 1.96, + "learning_rate": 8.081948830478948e-05, + "loss": 1.4951, + "step": 24881 + }, + { + "epoch": 1.96, + "learning_rate": 8.080852183229038e-05, + "loss": 1.5145, + "step": 24882 + }, + { + "epoch": 1.96, + "learning_rate": 8.079755582956318e-05, + "loss": 1.5038, + "step": 24883 + }, + { + "epoch": 1.96, + "learning_rate": 8.078659029668243e-05, + "loss": 1.5011, + "step": 24884 + }, + { + "epoch": 1.96, + "learning_rate": 8.077562523372255e-05, + "loss": 1.434, + "step": 24885 + }, + { + "epoch": 1.96, + "learning_rate": 8.076466064075799e-05, + "loss": 1.4669, + "step": 24886 + }, + { + "epoch": 1.96, + "learning_rate": 8.075369651786303e-05, + "loss": 1.4929, + "step": 24887 + }, + { + "epoch": 1.96, + "learning_rate": 8.074273286511238e-05, + "loss": 1.4241, + "step": 24888 + }, + { + "epoch": 1.96, + "learning_rate": 8.073176968258038e-05, + "loss": 1.5414, + "step": 24889 + }, + { + "epoch": 1.96, + "learning_rate": 8.07208069703414e-05, + "loss": 1.4899, + "step": 24890 + }, + { + "epoch": 1.96, + "learning_rate": 8.070984472846986e-05, + "loss": 1.4402, + "step": 24891 + }, + { + "epoch": 1.96, + "learning_rate": 8.069888295704032e-05, + "loss": 1.5003, + "step": 24892 + }, + { + "epoch": 1.96, + "learning_rate": 8.068792165612709e-05, + "loss": 1.4341, + "step": 24893 + }, + { + "epoch": 1.96, + "learning_rate": 8.067696082580459e-05, + "loss": 1.5233, + "step": 24894 + }, + { + "epoch": 1.96, + "learning_rate": 8.066600046614733e-05, + "loss": 1.4825, + "step": 24895 + }, + { + "epoch": 1.96, + "learning_rate": 8.065504057722965e-05, + "loss": 1.4365, + "step": 24896 + }, + { + "epoch": 1.96, + "learning_rate": 8.064408115912591e-05, + "loss": 1.5282, + "step": 24897 + }, + { + "epoch": 1.96, + "learning_rate": 8.063312221191066e-05, + "loss": 1.4551, + "step": 24898 + }, + { + "epoch": 1.96, + "learning_rate": 8.062216373565821e-05, + "loss": 1.4453, + "step": 24899 + }, + { + "epoch": 1.96, + "learning_rate": 8.061120573044297e-05, + "loss": 1.4783, + "step": 24900 + }, + { + "epoch": 1.96, + "learning_rate": 8.060024819633937e-05, + "loss": 1.5411, + "step": 24901 + }, + { + "epoch": 1.96, + "learning_rate": 8.058929113342174e-05, + "loss": 1.4527, + "step": 24902 + }, + { + "epoch": 1.96, + "learning_rate": 8.057833454176457e-05, + "loss": 1.4717, + "step": 24903 + }, + { + "epoch": 1.96, + "learning_rate": 8.056737842144215e-05, + "loss": 1.4616, + "step": 24904 + }, + { + "epoch": 1.96, + "learning_rate": 8.055642277252897e-05, + "loss": 1.4379, + "step": 24905 + }, + { + "epoch": 1.96, + "learning_rate": 8.054546759509935e-05, + "loss": 1.465, + "step": 24906 + }, + { + "epoch": 1.96, + "learning_rate": 8.053451288922763e-05, + "loss": 1.443, + "step": 24907 + }, + { + "epoch": 1.96, + "learning_rate": 8.052355865498828e-05, + "loss": 1.5032, + "step": 24908 + }, + { + "epoch": 1.96, + "learning_rate": 8.051260489245564e-05, + "loss": 1.5013, + "step": 24909 + }, + { + "epoch": 1.96, + "learning_rate": 8.050165160170405e-05, + "loss": 1.511, + "step": 24910 + }, + { + "epoch": 1.96, + "learning_rate": 8.049069878280783e-05, + "loss": 1.4917, + "step": 24911 + }, + { + "epoch": 1.96, + "learning_rate": 8.047974643584148e-05, + "loss": 1.5094, + "step": 24912 + }, + { + "epoch": 1.96, + "learning_rate": 8.04687945608793e-05, + "loss": 1.5044, + "step": 24913 + }, + { + "epoch": 1.96, + "learning_rate": 8.045784315799556e-05, + "loss": 1.5312, + "step": 24914 + }, + { + "epoch": 1.96, + "learning_rate": 8.044689222726475e-05, + "loss": 1.4927, + "step": 24915 + }, + { + "epoch": 1.96, + "learning_rate": 8.043594176876117e-05, + "loss": 1.5044, + "step": 24916 + }, + { + "epoch": 1.96, + "learning_rate": 8.042499178255909e-05, + "loss": 1.4747, + "step": 24917 + }, + { + "epoch": 1.96, + "learning_rate": 8.04140422687329e-05, + "loss": 1.5439, + "step": 24918 + }, + { + "epoch": 1.96, + "learning_rate": 8.040309322735705e-05, + "loss": 1.4821, + "step": 24919 + }, + { + "epoch": 1.96, + "learning_rate": 8.039214465850578e-05, + "loss": 1.474, + "step": 24920 + }, + { + "epoch": 1.96, + "learning_rate": 8.038119656225339e-05, + "loss": 1.4552, + "step": 24921 + }, + { + "epoch": 1.96, + "learning_rate": 8.037024893867427e-05, + "loss": 1.451, + "step": 24922 + }, + { + "epoch": 1.96, + "learning_rate": 8.035930178784278e-05, + "loss": 1.4318, + "step": 24923 + }, + { + "epoch": 1.96, + "learning_rate": 8.034835510983312e-05, + "loss": 1.484, + "step": 24924 + }, + { + "epoch": 1.96, + "learning_rate": 8.033740890471976e-05, + "loss": 1.4711, + "step": 24925 + }, + { + "epoch": 1.96, + "learning_rate": 8.032646317257694e-05, + "loss": 1.496, + "step": 24926 + }, + { + "epoch": 1.96, + "learning_rate": 8.031551791347901e-05, + "loss": 1.4872, + "step": 24927 + }, + { + "epoch": 1.96, + "learning_rate": 8.030457312750018e-05, + "loss": 1.468, + "step": 24928 + }, + { + "epoch": 1.96, + "learning_rate": 8.02936288147149e-05, + "loss": 1.5012, + "step": 24929 + }, + { + "epoch": 1.96, + "learning_rate": 8.02826849751974e-05, + "loss": 1.4654, + "step": 24930 + }, + { + "epoch": 1.96, + "learning_rate": 8.027174160902195e-05, + "loss": 1.4274, + "step": 24931 + }, + { + "epoch": 1.96, + "learning_rate": 8.026079871626296e-05, + "loss": 1.4545, + "step": 24932 + }, + { + "epoch": 1.96, + "learning_rate": 8.024985629699465e-05, + "loss": 1.4421, + "step": 24933 + }, + { + "epoch": 1.96, + "learning_rate": 8.023891435129128e-05, + "loss": 1.4662, + "step": 24934 + }, + { + "epoch": 1.96, + "learning_rate": 8.022797287922717e-05, + "loss": 1.4223, + "step": 24935 + }, + { + "epoch": 1.96, + "learning_rate": 8.021703188087668e-05, + "loss": 1.4426, + "step": 24936 + }, + { + "epoch": 1.96, + "learning_rate": 8.020609135631404e-05, + "loss": 1.4912, + "step": 24937 + }, + { + "epoch": 1.96, + "learning_rate": 8.019515130561347e-05, + "loss": 1.4966, + "step": 24938 + }, + { + "epoch": 1.96, + "learning_rate": 8.018421172884935e-05, + "loss": 1.4538, + "step": 24939 + }, + { + "epoch": 1.96, + "learning_rate": 8.017327262609591e-05, + "loss": 1.4903, + "step": 24940 + }, + { + "epoch": 1.96, + "learning_rate": 8.016233399742735e-05, + "loss": 1.4715, + "step": 24941 + }, + { + "epoch": 1.96, + "learning_rate": 8.015139584291808e-05, + "loss": 1.4538, + "step": 24942 + }, + { + "epoch": 1.96, + "learning_rate": 8.014045816264225e-05, + "loss": 1.4344, + "step": 24943 + }, + { + "epoch": 1.96, + "learning_rate": 8.01295209566742e-05, + "loss": 1.4437, + "step": 24944 + }, + { + "epoch": 1.96, + "learning_rate": 8.011858422508806e-05, + "loss": 1.4897, + "step": 24945 + }, + { + "epoch": 1.96, + "learning_rate": 8.010764796795823e-05, + "loss": 1.4458, + "step": 24946 + }, + { + "epoch": 1.96, + "learning_rate": 8.00967121853589e-05, + "loss": 1.4712, + "step": 24947 + }, + { + "epoch": 1.96, + "learning_rate": 8.008577687736427e-05, + "loss": 1.4729, + "step": 24948 + }, + { + "epoch": 1.96, + "learning_rate": 8.007484204404868e-05, + "loss": 1.4657, + "step": 24949 + }, + { + "epoch": 1.96, + "learning_rate": 8.006390768548628e-05, + "loss": 1.4942, + "step": 24950 + }, + { + "epoch": 1.96, + "learning_rate": 8.00529738017514e-05, + "loss": 1.4284, + "step": 24951 + }, + { + "epoch": 1.96, + "learning_rate": 8.004204039291818e-05, + "loss": 1.44, + "step": 24952 + }, + { + "epoch": 1.96, + "learning_rate": 8.003110745906096e-05, + "loss": 1.4763, + "step": 24953 + }, + { + "epoch": 1.96, + "learning_rate": 8.00201750002539e-05, + "loss": 1.5157, + "step": 24954 + }, + { + "epoch": 1.96, + "learning_rate": 8.000924301657117e-05, + "loss": 1.4433, + "step": 24955 + }, + { + "epoch": 1.96, + "learning_rate": 7.999831150808712e-05, + "loss": 1.4663, + "step": 24956 + }, + { + "epoch": 1.96, + "learning_rate": 7.99873804748759e-05, + "loss": 1.4931, + "step": 24957 + }, + { + "epoch": 1.96, + "learning_rate": 7.997644991701168e-05, + "loss": 1.4993, + "step": 24958 + }, + { + "epoch": 1.96, + "learning_rate": 7.996551983456877e-05, + "loss": 1.4665, + "step": 24959 + }, + { + "epoch": 1.96, + "learning_rate": 7.995459022762135e-05, + "loss": 1.4746, + "step": 24960 + }, + { + "epoch": 1.96, + "learning_rate": 7.994366109624359e-05, + "loss": 1.504, + "step": 24961 + }, + { + "epoch": 1.96, + "learning_rate": 7.993273244050967e-05, + "loss": 1.4871, + "step": 24962 + }, + { + "epoch": 1.96, + "learning_rate": 7.992180426049388e-05, + "loss": 1.434, + "step": 24963 + }, + { + "epoch": 1.96, + "learning_rate": 7.991087655627036e-05, + "loss": 1.4342, + "step": 24964 + }, + { + "epoch": 1.96, + "learning_rate": 7.98999493279132e-05, + "loss": 1.4622, + "step": 24965 + }, + { + "epoch": 1.96, + "learning_rate": 7.988902257549682e-05, + "loss": 1.4675, + "step": 24966 + }, + { + "epoch": 1.96, + "learning_rate": 7.987809629909527e-05, + "loss": 1.4345, + "step": 24967 + }, + { + "epoch": 1.96, + "learning_rate": 7.986717049878276e-05, + "loss": 1.4862, + "step": 24968 + }, + { + "epoch": 1.96, + "learning_rate": 7.98562451746334e-05, + "loss": 1.5122, + "step": 24969 + }, + { + "epoch": 1.96, + "learning_rate": 7.98453203267215e-05, + "loss": 1.4841, + "step": 24970 + }, + { + "epoch": 1.96, + "learning_rate": 7.983439595512114e-05, + "loss": 1.4973, + "step": 24971 + }, + { + "epoch": 1.96, + "learning_rate": 7.982347205990646e-05, + "loss": 1.4665, + "step": 24972 + }, + { + "epoch": 1.96, + "learning_rate": 7.981254864115176e-05, + "loss": 1.4969, + "step": 24973 + }, + { + "epoch": 1.96, + "learning_rate": 7.980162569893107e-05, + "loss": 1.4697, + "step": 24974 + }, + { + "epoch": 1.97, + "learning_rate": 7.979070323331858e-05, + "loss": 1.4711, + "step": 24975 + }, + { + "epoch": 1.97, + "learning_rate": 7.977978124438854e-05, + "loss": 1.4903, + "step": 24976 + }, + { + "epoch": 1.97, + "learning_rate": 7.976885973221501e-05, + "loss": 1.5597, + "step": 24977 + }, + { + "epoch": 1.97, + "learning_rate": 7.975793869687212e-05, + "loss": 1.554, + "step": 24978 + }, + { + "epoch": 1.97, + "learning_rate": 7.974701813843411e-05, + "loss": 1.49, + "step": 24979 + }, + { + "epoch": 1.97, + "learning_rate": 7.973609805697508e-05, + "loss": 1.5278, + "step": 24980 + }, + { + "epoch": 1.97, + "learning_rate": 7.972517845256913e-05, + "loss": 1.5028, + "step": 24981 + }, + { + "epoch": 1.97, + "learning_rate": 7.971425932529041e-05, + "loss": 1.4653, + "step": 24982 + }, + { + "epoch": 1.97, + "learning_rate": 7.970334067521316e-05, + "loss": 1.4727, + "step": 24983 + }, + { + "epoch": 1.97, + "learning_rate": 7.969242250241142e-05, + "loss": 1.536, + "step": 24984 + }, + { + "epoch": 1.97, + "learning_rate": 7.968150480695935e-05, + "loss": 1.4957, + "step": 24985 + }, + { + "epoch": 1.97, + "learning_rate": 7.967058758893099e-05, + "loss": 1.5061, + "step": 24986 + }, + { + "epoch": 1.97, + "learning_rate": 7.965967084840057e-05, + "loss": 1.4968, + "step": 24987 + }, + { + "epoch": 1.97, + "learning_rate": 7.964875458544219e-05, + "loss": 1.5345, + "step": 24988 + }, + { + "epoch": 1.97, + "learning_rate": 7.963783880012988e-05, + "loss": 1.4997, + "step": 24989 + }, + { + "epoch": 1.97, + "learning_rate": 7.962692349253787e-05, + "loss": 1.4967, + "step": 24990 + }, + { + "epoch": 1.97, + "learning_rate": 7.961600866274022e-05, + "loss": 1.4537, + "step": 24991 + }, + { + "epoch": 1.97, + "learning_rate": 7.960509431081099e-05, + "loss": 1.4477, + "step": 24992 + }, + { + "epoch": 1.97, + "learning_rate": 7.959418043682433e-05, + "loss": 1.4486, + "step": 24993 + }, + { + "epoch": 1.97, + "learning_rate": 7.958326704085437e-05, + "loss": 1.497, + "step": 24994 + }, + { + "epoch": 1.97, + "learning_rate": 7.957235412297511e-05, + "loss": 1.4635, + "step": 24995 + }, + { + "epoch": 1.97, + "learning_rate": 7.956144168326073e-05, + "loss": 1.4733, + "step": 24996 + }, + { + "epoch": 1.97, + "learning_rate": 7.955052972178526e-05, + "loss": 1.494, + "step": 24997 + }, + { + "epoch": 1.97, + "learning_rate": 7.953961823862287e-05, + "loss": 1.415, + "step": 24998 + }, + { + "epoch": 1.97, + "learning_rate": 7.952870723384754e-05, + "loss": 1.5518, + "step": 24999 + }, + { + "epoch": 1.97, + "learning_rate": 7.951779670753342e-05, + "loss": 1.4617, + "step": 25000 + }, + { + "epoch": 1.97, + "learning_rate": 7.950688665975459e-05, + "loss": 1.5204, + "step": 25001 + }, + { + "epoch": 1.97, + "learning_rate": 7.94959770905851e-05, + "loss": 1.4948, + "step": 25002 + }, + { + "epoch": 1.97, + "learning_rate": 7.948506800009895e-05, + "loss": 1.5018, + "step": 25003 + }, + { + "epoch": 1.97, + "learning_rate": 7.947415938837035e-05, + "loss": 1.576, + "step": 25004 + }, + { + "epoch": 1.97, + "learning_rate": 7.946325125547328e-05, + "loss": 1.5086, + "step": 25005 + }, + { + "epoch": 1.97, + "learning_rate": 7.945234360148175e-05, + "loss": 1.455, + "step": 25006 + }, + { + "epoch": 1.97, + "learning_rate": 7.944143642646993e-05, + "loss": 1.5447, + "step": 25007 + }, + { + "epoch": 1.97, + "learning_rate": 7.943052973051183e-05, + "loss": 1.4051, + "step": 25008 + }, + { + "epoch": 1.97, + "learning_rate": 7.941962351368142e-05, + "loss": 1.4728, + "step": 25009 + }, + { + "epoch": 1.97, + "learning_rate": 7.940871777605285e-05, + "loss": 1.4996, + "step": 25010 + }, + { + "epoch": 1.97, + "learning_rate": 7.939781251770017e-05, + "loss": 1.4473, + "step": 25011 + }, + { + "epoch": 1.97, + "learning_rate": 7.938690773869732e-05, + "loss": 1.4776, + "step": 25012 + }, + { + "epoch": 1.97, + "learning_rate": 7.93760034391184e-05, + "loss": 1.4887, + "step": 25013 + }, + { + "epoch": 1.97, + "learning_rate": 7.936509961903748e-05, + "loss": 1.5109, + "step": 25014 + }, + { + "epoch": 1.97, + "learning_rate": 7.935419627852857e-05, + "loss": 1.5318, + "step": 25015 + }, + { + "epoch": 1.97, + "learning_rate": 7.934329341766561e-05, + "loss": 1.499, + "step": 25016 + }, + { + "epoch": 1.97, + "learning_rate": 7.933239103652276e-05, + "loss": 1.4553, + "step": 25017 + }, + { + "epoch": 1.97, + "learning_rate": 7.932148913517398e-05, + "loss": 1.5047, + "step": 25018 + }, + { + "epoch": 1.97, + "learning_rate": 7.931058771369323e-05, + "loss": 1.5009, + "step": 25019 + }, + { + "epoch": 1.97, + "learning_rate": 7.929968677215464e-05, + "loss": 1.4822, + "step": 25020 + }, + { + "epoch": 1.97, + "learning_rate": 7.928878631063217e-05, + "loss": 1.4867, + "step": 25021 + }, + { + "epoch": 1.97, + "learning_rate": 7.92778863291998e-05, + "loss": 1.4973, + "step": 25022 + }, + { + "epoch": 1.97, + "learning_rate": 7.92669868279315e-05, + "loss": 1.4553, + "step": 25023 + }, + { + "epoch": 1.97, + "learning_rate": 7.925608780690139e-05, + "loss": 1.4719, + "step": 25024 + }, + { + "epoch": 1.97, + "learning_rate": 7.92451892661834e-05, + "loss": 1.4339, + "step": 25025 + }, + { + "epoch": 1.97, + "learning_rate": 7.923429120585147e-05, + "loss": 1.4384, + "step": 25026 + }, + { + "epoch": 1.97, + "learning_rate": 7.922339362597971e-05, + "loss": 1.4817, + "step": 25027 + }, + { + "epoch": 1.97, + "learning_rate": 7.921249652664197e-05, + "loss": 1.4585, + "step": 25028 + }, + { + "epoch": 1.97, + "learning_rate": 7.920159990791241e-05, + "loss": 1.5015, + "step": 25029 + }, + { + "epoch": 1.97, + "learning_rate": 7.919070376986485e-05, + "loss": 1.5304, + "step": 25030 + }, + { + "epoch": 1.97, + "learning_rate": 7.917980811257338e-05, + "loss": 1.5347, + "step": 25031 + }, + { + "epoch": 1.97, + "learning_rate": 7.916891293611195e-05, + "loss": 1.4879, + "step": 25032 + }, + { + "epoch": 1.97, + "learning_rate": 7.915801824055444e-05, + "loss": 1.4903, + "step": 25033 + }, + { + "epoch": 1.97, + "learning_rate": 7.914712402597493e-05, + "loss": 1.5098, + "step": 25034 + }, + { + "epoch": 1.97, + "learning_rate": 7.91362302924474e-05, + "loss": 1.444, + "step": 25035 + }, + { + "epoch": 1.97, + "learning_rate": 7.912533704004568e-05, + "loss": 1.5125, + "step": 25036 + }, + { + "epoch": 1.97, + "learning_rate": 7.911444426884384e-05, + "loss": 1.4706, + "step": 25037 + }, + { + "epoch": 1.97, + "learning_rate": 7.910355197891584e-05, + "loss": 1.4917, + "step": 25038 + }, + { + "epoch": 1.97, + "learning_rate": 7.909266017033559e-05, + "loss": 1.4719, + "step": 25039 + }, + { + "epoch": 1.97, + "learning_rate": 7.908176884317697e-05, + "loss": 1.4603, + "step": 25040 + }, + { + "epoch": 1.97, + "learning_rate": 7.907087799751409e-05, + "loss": 1.4608, + "step": 25041 + }, + { + "epoch": 1.97, + "learning_rate": 7.905998763342078e-05, + "loss": 1.4743, + "step": 25042 + }, + { + "epoch": 1.97, + "learning_rate": 7.904909775097097e-05, + "loss": 1.4596, + "step": 25043 + }, + { + "epoch": 1.97, + "learning_rate": 7.903820835023863e-05, + "loss": 1.453, + "step": 25044 + }, + { + "epoch": 1.97, + "learning_rate": 7.902731943129774e-05, + "loss": 1.4713, + "step": 25045 + }, + { + "epoch": 1.97, + "learning_rate": 7.901643099422221e-05, + "loss": 1.4846, + "step": 25046 + }, + { + "epoch": 1.97, + "learning_rate": 7.900554303908585e-05, + "loss": 1.4436, + "step": 25047 + }, + { + "epoch": 1.97, + "learning_rate": 7.899465556596274e-05, + "loss": 1.5001, + "step": 25048 + }, + { + "epoch": 1.97, + "learning_rate": 7.898376857492674e-05, + "loss": 1.4753, + "step": 25049 + }, + { + "epoch": 1.97, + "learning_rate": 7.897288206605171e-05, + "loss": 1.4864, + "step": 25050 + }, + { + "epoch": 1.97, + "learning_rate": 7.896199603941168e-05, + "loss": 1.5096, + "step": 25051 + }, + { + "epoch": 1.97, + "learning_rate": 7.895111049508049e-05, + "loss": 1.4879, + "step": 25052 + }, + { + "epoch": 1.97, + "learning_rate": 7.894022543313199e-05, + "loss": 1.5133, + "step": 25053 + }, + { + "epoch": 1.97, + "learning_rate": 7.89293408536402e-05, + "loss": 1.4839, + "step": 25054 + }, + { + "epoch": 1.97, + "learning_rate": 7.891845675667897e-05, + "loss": 1.5014, + "step": 25055 + }, + { + "epoch": 1.97, + "learning_rate": 7.890757314232217e-05, + "loss": 1.4807, + "step": 25056 + }, + { + "epoch": 1.97, + "learning_rate": 7.889669001064369e-05, + "loss": 1.479, + "step": 25057 + }, + { + "epoch": 1.97, + "learning_rate": 7.888580736171748e-05, + "loss": 1.5129, + "step": 25058 + }, + { + "epoch": 1.97, + "learning_rate": 7.887492519561742e-05, + "loss": 1.495, + "step": 25059 + }, + { + "epoch": 1.97, + "learning_rate": 7.88640435124173e-05, + "loss": 1.52, + "step": 25060 + }, + { + "epoch": 1.97, + "learning_rate": 7.885316231219104e-05, + "loss": 1.4975, + "step": 25061 + }, + { + "epoch": 1.97, + "learning_rate": 7.884228159501264e-05, + "loss": 1.4118, + "step": 25062 + }, + { + "epoch": 1.97, + "learning_rate": 7.883140136095588e-05, + "loss": 1.4446, + "step": 25063 + }, + { + "epoch": 1.97, + "learning_rate": 7.882052161009456e-05, + "loss": 1.451, + "step": 25064 + }, + { + "epoch": 1.97, + "learning_rate": 7.880964234250267e-05, + "loss": 1.4647, + "step": 25065 + }, + { + "epoch": 1.97, + "learning_rate": 7.879876355825402e-05, + "loss": 1.4757, + "step": 25066 + }, + { + "epoch": 1.97, + "learning_rate": 7.878788525742244e-05, + "loss": 1.4794, + "step": 25067 + }, + { + "epoch": 1.97, + "learning_rate": 7.877700744008186e-05, + "loss": 1.4373, + "step": 25068 + }, + { + "epoch": 1.97, + "learning_rate": 7.87661301063061e-05, + "loss": 1.4839, + "step": 25069 + }, + { + "epoch": 1.97, + "learning_rate": 7.875525325616895e-05, + "loss": 1.4959, + "step": 25070 + }, + { + "epoch": 1.97, + "learning_rate": 7.874437688974437e-05, + "loss": 1.5081, + "step": 25071 + }, + { + "epoch": 1.97, + "learning_rate": 7.873350100710614e-05, + "loss": 1.4821, + "step": 25072 + }, + { + "epoch": 1.97, + "learning_rate": 7.872262560832808e-05, + "loss": 1.457, + "step": 25073 + }, + { + "epoch": 1.97, + "learning_rate": 7.871175069348409e-05, + "loss": 1.405, + "step": 25074 + }, + { + "epoch": 1.97, + "learning_rate": 7.870087626264793e-05, + "loss": 1.4248, + "step": 25075 + }, + { + "epoch": 1.97, + "learning_rate": 7.869000231589351e-05, + "loss": 1.4594, + "step": 25076 + }, + { + "epoch": 1.97, + "learning_rate": 7.867912885329458e-05, + "loss": 1.4895, + "step": 25077 + }, + { + "epoch": 1.97, + "learning_rate": 7.866825587492506e-05, + "loss": 1.5107, + "step": 25078 + }, + { + "epoch": 1.97, + "learning_rate": 7.865738338085873e-05, + "loss": 1.4781, + "step": 25079 + }, + { + "epoch": 1.97, + "learning_rate": 7.864651137116937e-05, + "loss": 1.4916, + "step": 25080 + }, + { + "epoch": 1.97, + "learning_rate": 7.863563984593079e-05, + "loss": 1.4333, + "step": 25081 + }, + { + "epoch": 1.97, + "learning_rate": 7.862476880521687e-05, + "loss": 1.4691, + "step": 25082 + }, + { + "epoch": 1.97, + "learning_rate": 7.861389824910142e-05, + "loss": 1.4587, + "step": 25083 + }, + { + "epoch": 1.97, + "learning_rate": 7.860302817765812e-05, + "loss": 1.5424, + "step": 25084 + }, + { + "epoch": 1.97, + "learning_rate": 7.85921585909609e-05, + "loss": 1.4613, + "step": 25085 + }, + { + "epoch": 1.97, + "learning_rate": 7.858128948908354e-05, + "loss": 1.4871, + "step": 25086 + }, + { + "epoch": 1.97, + "learning_rate": 7.857042087209977e-05, + "loss": 1.4898, + "step": 25087 + }, + { + "epoch": 1.97, + "learning_rate": 7.855955274008346e-05, + "loss": 1.4853, + "step": 25088 + }, + { + "epoch": 1.97, + "learning_rate": 7.854868509310836e-05, + "loss": 1.4447, + "step": 25089 + }, + { + "epoch": 1.97, + "learning_rate": 7.853781793124821e-05, + "loss": 1.4637, + "step": 25090 + }, + { + "epoch": 1.97, + "learning_rate": 7.852695125457683e-05, + "loss": 1.5162, + "step": 25091 + }, + { + "epoch": 1.97, + "learning_rate": 7.851608506316809e-05, + "loss": 1.4581, + "step": 25092 + }, + { + "epoch": 1.97, + "learning_rate": 7.850521935709566e-05, + "loss": 1.4937, + "step": 25093 + }, + { + "epoch": 1.97, + "learning_rate": 7.849435413643328e-05, + "loss": 1.4906, + "step": 25094 + }, + { + "epoch": 1.97, + "learning_rate": 7.848348940125485e-05, + "loss": 1.4908, + "step": 25095 + }, + { + "epoch": 1.97, + "learning_rate": 7.847262515163405e-05, + "loss": 1.4943, + "step": 25096 + }, + { + "epoch": 1.97, + "learning_rate": 7.846176138764466e-05, + "loss": 1.4467, + "step": 25097 + }, + { + "epoch": 1.97, + "learning_rate": 7.845089810936036e-05, + "loss": 1.4734, + "step": 25098 + }, + { + "epoch": 1.97, + "learning_rate": 7.844003531685506e-05, + "loss": 1.4948, + "step": 25099 + }, + { + "epoch": 1.97, + "learning_rate": 7.84291730102024e-05, + "loss": 1.5258, + "step": 25100 + }, + { + "epoch": 1.97, + "learning_rate": 7.841831118947612e-05, + "loss": 1.4547, + "step": 25101 + }, + { + "epoch": 1.98, + "learning_rate": 7.840744985475005e-05, + "loss": 1.5625, + "step": 25102 + }, + { + "epoch": 1.98, + "learning_rate": 7.839658900609791e-05, + "loss": 1.4507, + "step": 25103 + }, + { + "epoch": 1.98, + "learning_rate": 7.838572864359333e-05, + "loss": 1.4444, + "step": 25104 + }, + { + "epoch": 1.98, + "learning_rate": 7.83748687673102e-05, + "loss": 1.5009, + "step": 25105 + }, + { + "epoch": 1.98, + "learning_rate": 7.83640093773222e-05, + "loss": 1.4546, + "step": 25106 + }, + { + "epoch": 1.98, + "learning_rate": 7.835315047370297e-05, + "loss": 1.5167, + "step": 25107 + }, + { + "epoch": 1.98, + "learning_rate": 7.834229205652632e-05, + "loss": 1.4891, + "step": 25108 + }, + { + "epoch": 1.98, + "learning_rate": 7.833143412586603e-05, + "loss": 1.4903, + "step": 25109 + }, + { + "epoch": 1.98, + "learning_rate": 7.832057668179572e-05, + "loss": 1.4552, + "step": 25110 + }, + { + "epoch": 1.98, + "learning_rate": 7.830971972438911e-05, + "loss": 1.4879, + "step": 25111 + }, + { + "epoch": 1.98, + "learning_rate": 7.829886325371999e-05, + "loss": 1.4963, + "step": 25112 + }, + { + "epoch": 1.98, + "learning_rate": 7.828800726986203e-05, + "loss": 1.5218, + "step": 25113 + }, + { + "epoch": 1.98, + "learning_rate": 7.82771517728889e-05, + "loss": 1.4182, + "step": 25114 + }, + { + "epoch": 1.98, + "learning_rate": 7.826629676287428e-05, + "loss": 1.4855, + "step": 25115 + }, + { + "epoch": 1.98, + "learning_rate": 7.825544223989201e-05, + "loss": 1.4761, + "step": 25116 + }, + { + "epoch": 1.98, + "learning_rate": 7.824458820401565e-05, + "loss": 1.4586, + "step": 25117 + }, + { + "epoch": 1.98, + "learning_rate": 7.82337346553189e-05, + "loss": 1.519, + "step": 25118 + }, + { + "epoch": 1.98, + "learning_rate": 7.822288159387555e-05, + "loss": 1.5131, + "step": 25119 + }, + { + "epoch": 1.98, + "learning_rate": 7.821202901975921e-05, + "loss": 1.5283, + "step": 25120 + }, + { + "epoch": 1.98, + "learning_rate": 7.820117693304355e-05, + "loss": 1.5091, + "step": 25121 + }, + { + "epoch": 1.98, + "learning_rate": 7.81903253338023e-05, + "loss": 1.4657, + "step": 25122 + }, + { + "epoch": 1.98, + "learning_rate": 7.817947422210909e-05, + "loss": 1.516, + "step": 25123 + }, + { + "epoch": 1.98, + "learning_rate": 7.816862359803764e-05, + "loss": 1.5357, + "step": 25124 + }, + { + "epoch": 1.98, + "learning_rate": 7.815777346166154e-05, + "loss": 1.4981, + "step": 25125 + }, + { + "epoch": 1.98, + "learning_rate": 7.814692381305461e-05, + "loss": 1.5009, + "step": 25126 + }, + { + "epoch": 1.98, + "learning_rate": 7.813607465229037e-05, + "loss": 1.4655, + "step": 25127 + }, + { + "epoch": 1.98, + "learning_rate": 7.812522597944249e-05, + "loss": 1.4645, + "step": 25128 + }, + { + "epoch": 1.98, + "learning_rate": 7.811437779458471e-05, + "loss": 1.4632, + "step": 25129 + }, + { + "epoch": 1.98, + "learning_rate": 7.810353009779064e-05, + "loss": 1.4929, + "step": 25130 + }, + { + "epoch": 1.98, + "learning_rate": 7.809268288913387e-05, + "loss": 1.4943, + "step": 25131 + }, + { + "epoch": 1.98, + "learning_rate": 7.808183616868815e-05, + "loss": 1.4765, + "step": 25132 + }, + { + "epoch": 1.98, + "learning_rate": 7.807098993652707e-05, + "loss": 1.4472, + "step": 25133 + }, + { + "epoch": 1.98, + "learning_rate": 7.80601441927243e-05, + "loss": 1.4586, + "step": 25134 + }, + { + "epoch": 1.98, + "learning_rate": 7.804929893735338e-05, + "loss": 1.4697, + "step": 25135 + }, + { + "epoch": 1.98, + "learning_rate": 7.803845417048806e-05, + "loss": 1.4842, + "step": 25136 + }, + { + "epoch": 1.98, + "learning_rate": 7.802760989220194e-05, + "loss": 1.4554, + "step": 25137 + }, + { + "epoch": 1.98, + "learning_rate": 7.801676610256858e-05, + "loss": 1.5311, + "step": 25138 + }, + { + "epoch": 1.98, + "learning_rate": 7.800592280166165e-05, + "loss": 1.5016, + "step": 25139 + }, + { + "epoch": 1.98, + "learning_rate": 7.79950799895548e-05, + "loss": 1.4656, + "step": 25140 + }, + { + "epoch": 1.98, + "learning_rate": 7.798423766632165e-05, + "loss": 1.4857, + "step": 25141 + }, + { + "epoch": 1.98, + "learning_rate": 7.797339583203574e-05, + "loss": 1.4896, + "step": 25142 + }, + { + "epoch": 1.98, + "learning_rate": 7.796255448677076e-05, + "loss": 1.509, + "step": 25143 + }, + { + "epoch": 1.98, + "learning_rate": 7.795171363060029e-05, + "loss": 1.4526, + "step": 25144 + }, + { + "epoch": 1.98, + "learning_rate": 7.794087326359787e-05, + "loss": 1.4752, + "step": 25145 + }, + { + "epoch": 1.98, + "learning_rate": 7.79300333858372e-05, + "loss": 1.4536, + "step": 25146 + }, + { + "epoch": 1.98, + "learning_rate": 7.791919399739185e-05, + "loss": 1.5175, + "step": 25147 + }, + { + "epoch": 1.98, + "learning_rate": 7.790835509833531e-05, + "loss": 1.524, + "step": 25148 + }, + { + "epoch": 1.98, + "learning_rate": 7.789751668874134e-05, + "loss": 1.5371, + "step": 25149 + }, + { + "epoch": 1.98, + "learning_rate": 7.788667876868342e-05, + "loss": 1.4484, + "step": 25150 + }, + { + "epoch": 1.98, + "learning_rate": 7.787584133823517e-05, + "loss": 1.4567, + "step": 25151 + }, + { + "epoch": 1.98, + "learning_rate": 7.78650043974701e-05, + "loss": 1.5116, + "step": 25152 + }, + { + "epoch": 1.98, + "learning_rate": 7.78541679464619e-05, + "loss": 1.5152, + "step": 25153 + }, + { + "epoch": 1.98, + "learning_rate": 7.784333198528402e-05, + "loss": 1.4682, + "step": 25154 + }, + { + "epoch": 1.98, + "learning_rate": 7.783249651401017e-05, + "loss": 1.4881, + "step": 25155 + }, + { + "epoch": 1.98, + "learning_rate": 7.782166153271377e-05, + "loss": 1.4666, + "step": 25156 + }, + { + "epoch": 1.98, + "learning_rate": 7.781082704146853e-05, + "loss": 1.5137, + "step": 25157 + }, + { + "epoch": 1.98, + "learning_rate": 7.779999304034791e-05, + "loss": 1.506, + "step": 25158 + }, + { + "epoch": 1.98, + "learning_rate": 7.778915952942545e-05, + "loss": 1.4769, + "step": 25159 + }, + { + "epoch": 1.98, + "learning_rate": 7.777832650877482e-05, + "loss": 1.4989, + "step": 25160 + }, + { + "epoch": 1.98, + "learning_rate": 7.776749397846949e-05, + "loss": 1.4513, + "step": 25161 + }, + { + "epoch": 1.98, + "learning_rate": 7.775666193858295e-05, + "loss": 1.4672, + "step": 25162 + }, + { + "epoch": 1.98, + "learning_rate": 7.774583038918887e-05, + "loss": 1.4929, + "step": 25163 + }, + { + "epoch": 1.98, + "learning_rate": 7.773499933036072e-05, + "loss": 1.4486, + "step": 25164 + }, + { + "epoch": 1.98, + "learning_rate": 7.772416876217199e-05, + "loss": 1.419, + "step": 25165 + }, + { + "epoch": 1.98, + "learning_rate": 7.771333868469633e-05, + "loss": 1.457, + "step": 25166 + }, + { + "epoch": 1.98, + "learning_rate": 7.770250909800722e-05, + "loss": 1.488, + "step": 25167 + }, + { + "epoch": 1.98, + "learning_rate": 7.769168000217817e-05, + "loss": 1.4768, + "step": 25168 + }, + { + "epoch": 1.98, + "learning_rate": 7.768085139728263e-05, + "loss": 1.4259, + "step": 25169 + }, + { + "epoch": 1.98, + "learning_rate": 7.767002328339425e-05, + "loss": 1.4983, + "step": 25170 + }, + { + "epoch": 1.98, + "learning_rate": 7.765919566058652e-05, + "loss": 1.4699, + "step": 25171 + }, + { + "epoch": 1.98, + "learning_rate": 7.764836852893293e-05, + "loss": 1.5045, + "step": 25172 + }, + { + "epoch": 1.98, + "learning_rate": 7.763754188850696e-05, + "loss": 1.4686, + "step": 25173 + }, + { + "epoch": 1.98, + "learning_rate": 7.762671573938217e-05, + "loss": 1.4847, + "step": 25174 + }, + { + "epoch": 1.98, + "learning_rate": 7.761589008163204e-05, + "loss": 1.4633, + "step": 25175 + }, + { + "epoch": 1.98, + "learning_rate": 7.760506491533003e-05, + "loss": 1.461, + "step": 25176 + }, + { + "epoch": 1.98, + "learning_rate": 7.759424024054973e-05, + "loss": 1.5068, + "step": 25177 + }, + { + "epoch": 1.98, + "learning_rate": 7.758341605736459e-05, + "loss": 1.4997, + "step": 25178 + }, + { + "epoch": 1.98, + "learning_rate": 7.757259236584803e-05, + "loss": 1.4476, + "step": 25179 + }, + { + "epoch": 1.98, + "learning_rate": 7.756176916607365e-05, + "loss": 1.531, + "step": 25180 + }, + { + "epoch": 1.98, + "learning_rate": 7.75509464581149e-05, + "loss": 1.4764, + "step": 25181 + }, + { + "epoch": 1.98, + "learning_rate": 7.754012424204518e-05, + "loss": 1.4561, + "step": 25182 + }, + { + "epoch": 1.98, + "learning_rate": 7.752930251793808e-05, + "loss": 1.4754, + "step": 25183 + }, + { + "epoch": 1.98, + "learning_rate": 7.751848128586703e-05, + "loss": 1.4961, + "step": 25184 + }, + { + "epoch": 1.98, + "learning_rate": 7.750766054590544e-05, + "loss": 1.4701, + "step": 25185 + }, + { + "epoch": 1.98, + "learning_rate": 7.749684029812681e-05, + "loss": 1.4425, + "step": 25186 + }, + { + "epoch": 1.98, + "learning_rate": 7.74860205426047e-05, + "loss": 1.4797, + "step": 25187 + }, + { + "epoch": 1.98, + "learning_rate": 7.747520127941249e-05, + "loss": 1.4909, + "step": 25188 + }, + { + "epoch": 1.98, + "learning_rate": 7.746438250862357e-05, + "loss": 1.4964, + "step": 25189 + }, + { + "epoch": 1.98, + "learning_rate": 7.745356423031153e-05, + "loss": 1.5383, + "step": 25190 + }, + { + "epoch": 1.98, + "learning_rate": 7.744274644454977e-05, + "loss": 1.4683, + "step": 25191 + }, + { + "epoch": 1.98, + "learning_rate": 7.74319291514117e-05, + "loss": 1.4974, + "step": 25192 + }, + { + "epoch": 1.98, + "learning_rate": 7.742111235097072e-05, + "loss": 1.4823, + "step": 25193 + }, + { + "epoch": 1.98, + "learning_rate": 7.741029604330043e-05, + "loss": 1.4918, + "step": 25194 + }, + { + "epoch": 1.98, + "learning_rate": 7.739948022847414e-05, + "loss": 1.4528, + "step": 25195 + }, + { + "epoch": 1.98, + "learning_rate": 7.738866490656527e-05, + "loss": 1.4413, + "step": 25196 + }, + { + "epoch": 1.98, + "learning_rate": 7.737785007764735e-05, + "loss": 1.5039, + "step": 25197 + }, + { + "epoch": 1.98, + "learning_rate": 7.736703574179375e-05, + "loss": 1.4558, + "step": 25198 + }, + { + "epoch": 1.98, + "learning_rate": 7.735622189907786e-05, + "loss": 1.4677, + "step": 25199 + }, + { + "epoch": 1.98, + "learning_rate": 7.734540854957316e-05, + "loss": 1.5574, + "step": 25200 + }, + { + "epoch": 1.98, + "learning_rate": 7.733459569335299e-05, + "loss": 1.4782, + "step": 25201 + }, + { + "epoch": 1.98, + "learning_rate": 7.732378333049088e-05, + "loss": 1.4317, + "step": 25202 + }, + { + "epoch": 1.98, + "learning_rate": 7.731297146106011e-05, + "loss": 1.4661, + "step": 25203 + }, + { + "epoch": 1.98, + "learning_rate": 7.730216008513422e-05, + "loss": 1.5075, + "step": 25204 + }, + { + "epoch": 1.98, + "learning_rate": 7.729134920278654e-05, + "loss": 1.4705, + "step": 25205 + }, + { + "epoch": 1.98, + "learning_rate": 7.728053881409042e-05, + "loss": 1.4719, + "step": 25206 + }, + { + "epoch": 1.98, + "learning_rate": 7.726972891911937e-05, + "loss": 1.432, + "step": 25207 + }, + { + "epoch": 1.98, + "learning_rate": 7.725891951794671e-05, + "loss": 1.5253, + "step": 25208 + }, + { + "epoch": 1.98, + "learning_rate": 7.724811061064586e-05, + "loss": 1.5127, + "step": 25209 + }, + { + "epoch": 1.98, + "learning_rate": 7.723730219729013e-05, + "loss": 1.491, + "step": 25210 + }, + { + "epoch": 1.98, + "learning_rate": 7.722649427795302e-05, + "loss": 1.47, + "step": 25211 + }, + { + "epoch": 1.98, + "learning_rate": 7.721568685270786e-05, + "loss": 1.4503, + "step": 25212 + }, + { + "epoch": 1.98, + "learning_rate": 7.720487992162795e-05, + "loss": 1.4797, + "step": 25213 + }, + { + "epoch": 1.98, + "learning_rate": 7.71940734847868e-05, + "loss": 1.4921, + "step": 25214 + }, + { + "epoch": 1.98, + "learning_rate": 7.718326754225773e-05, + "loss": 1.4928, + "step": 25215 + }, + { + "epoch": 1.98, + "learning_rate": 7.7172462094114e-05, + "loss": 1.5168, + "step": 25216 + }, + { + "epoch": 1.98, + "learning_rate": 7.716165714042908e-05, + "loss": 1.4833, + "step": 25217 + }, + { + "epoch": 1.98, + "learning_rate": 7.715085268127638e-05, + "loss": 1.4932, + "step": 25218 + }, + { + "epoch": 1.98, + "learning_rate": 7.714004871672917e-05, + "loss": 1.434, + "step": 25219 + }, + { + "epoch": 1.98, + "learning_rate": 7.712924524686077e-05, + "loss": 1.4779, + "step": 25220 + }, + { + "epoch": 1.98, + "learning_rate": 7.711844227174463e-05, + "loss": 1.4955, + "step": 25221 + }, + { + "epoch": 1.98, + "learning_rate": 7.710763979145407e-05, + "loss": 1.4896, + "step": 25222 + }, + { + "epoch": 1.98, + "learning_rate": 7.709683780606234e-05, + "loss": 1.4792, + "step": 25223 + }, + { + "epoch": 1.98, + "learning_rate": 7.708603631564292e-05, + "loss": 1.4406, + "step": 25224 + }, + { + "epoch": 1.98, + "learning_rate": 7.707523532026907e-05, + "loss": 1.528, + "step": 25225 + }, + { + "epoch": 1.98, + "learning_rate": 7.706443482001412e-05, + "loss": 1.4696, + "step": 25226 + }, + { + "epoch": 1.98, + "learning_rate": 7.705363481495135e-05, + "loss": 1.5323, + "step": 25227 + }, + { + "epoch": 1.98, + "learning_rate": 7.70428353051542e-05, + "loss": 1.4984, + "step": 25228 + }, + { + "epoch": 1.99, + "learning_rate": 7.703203629069594e-05, + "loss": 1.4819, + "step": 25229 + }, + { + "epoch": 1.99, + "learning_rate": 7.702123777164984e-05, + "loss": 1.5227, + "step": 25230 + }, + { + "epoch": 1.99, + "learning_rate": 7.701043974808931e-05, + "loss": 1.4708, + "step": 25231 + }, + { + "epoch": 1.99, + "learning_rate": 7.699964222008762e-05, + "loss": 1.4783, + "step": 25232 + }, + { + "epoch": 1.99, + "learning_rate": 7.6988845187718e-05, + "loss": 1.4189, + "step": 25233 + }, + { + "epoch": 1.99, + "learning_rate": 7.697804865105384e-05, + "loss": 1.5195, + "step": 25234 + }, + { + "epoch": 1.99, + "learning_rate": 7.696725261016851e-05, + "loss": 1.4891, + "step": 25235 + }, + { + "epoch": 1.99, + "learning_rate": 7.695645706513522e-05, + "loss": 1.4975, + "step": 25236 + }, + { + "epoch": 1.99, + "learning_rate": 7.69456620160272e-05, + "loss": 1.5652, + "step": 25237 + }, + { + "epoch": 1.99, + "learning_rate": 7.693486746291791e-05, + "loss": 1.5403, + "step": 25238 + }, + { + "epoch": 1.99, + "learning_rate": 7.692407340588055e-05, + "loss": 1.4889, + "step": 25239 + }, + { + "epoch": 1.99, + "learning_rate": 7.691327984498831e-05, + "loss": 1.4567, + "step": 25240 + }, + { + "epoch": 1.99, + "learning_rate": 7.690248678031466e-05, + "loss": 1.4342, + "step": 25241 + }, + { + "epoch": 1.99, + "learning_rate": 7.689169421193276e-05, + "loss": 1.4459, + "step": 25242 + }, + { + "epoch": 1.99, + "learning_rate": 7.68809021399159e-05, + "loss": 1.4673, + "step": 25243 + }, + { + "epoch": 1.99, + "learning_rate": 7.687011056433738e-05, + "loss": 1.4811, + "step": 25244 + }, + { + "epoch": 1.99, + "learning_rate": 7.685931948527045e-05, + "loss": 1.4633, + "step": 25245 + }, + { + "epoch": 1.99, + "learning_rate": 7.68485289027884e-05, + "loss": 1.476, + "step": 25246 + }, + { + "epoch": 1.99, + "learning_rate": 7.683773881696439e-05, + "loss": 1.4704, + "step": 25247 + }, + { + "epoch": 1.99, + "learning_rate": 7.682694922787177e-05, + "loss": 1.4711, + "step": 25248 + }, + { + "epoch": 1.99, + "learning_rate": 7.681616013558386e-05, + "loss": 1.4594, + "step": 25249 + }, + { + "epoch": 1.99, + "learning_rate": 7.680537154017382e-05, + "loss": 1.5027, + "step": 25250 + }, + { + "epoch": 1.99, + "learning_rate": 7.679458344171485e-05, + "loss": 1.4405, + "step": 25251 + }, + { + "epoch": 1.99, + "learning_rate": 7.678379584028033e-05, + "loss": 1.4908, + "step": 25252 + }, + { + "epoch": 1.99, + "learning_rate": 7.677300873594342e-05, + "loss": 1.4903, + "step": 25253 + }, + { + "epoch": 1.99, + "learning_rate": 7.676222212877732e-05, + "loss": 1.4573, + "step": 25254 + }, + { + "epoch": 1.99, + "learning_rate": 7.675143601885538e-05, + "loss": 1.4124, + "step": 25255 + }, + { + "epoch": 1.99, + "learning_rate": 7.674065040625076e-05, + "loss": 1.4727, + "step": 25256 + }, + { + "epoch": 1.99, + "learning_rate": 7.672986529103665e-05, + "loss": 1.5006, + "step": 25257 + }, + { + "epoch": 1.99, + "learning_rate": 7.671908067328636e-05, + "loss": 1.4864, + "step": 25258 + }, + { + "epoch": 1.99, + "learning_rate": 7.670829655307308e-05, + "loss": 1.483, + "step": 25259 + }, + { + "epoch": 1.99, + "learning_rate": 7.669751293046996e-05, + "loss": 1.4344, + "step": 25260 + }, + { + "epoch": 1.99, + "learning_rate": 7.668672980555033e-05, + "loss": 1.4854, + "step": 25261 + }, + { + "epoch": 1.99, + "learning_rate": 7.667594717838737e-05, + "loss": 1.4861, + "step": 25262 + }, + { + "epoch": 1.99, + "learning_rate": 7.666516504905426e-05, + "loss": 1.5601, + "step": 25263 + }, + { + "epoch": 1.99, + "learning_rate": 7.665438341762408e-05, + "loss": 1.4948, + "step": 25264 + }, + { + "epoch": 1.99, + "learning_rate": 7.664360228417027e-05, + "loss": 1.4551, + "step": 25265 + }, + { + "epoch": 1.99, + "learning_rate": 7.663282164876593e-05, + "loss": 1.5351, + "step": 25266 + }, + { + "epoch": 1.99, + "learning_rate": 7.662204151148424e-05, + "loss": 1.4679, + "step": 25267 + }, + { + "epoch": 1.99, + "learning_rate": 7.661126187239836e-05, + "loss": 1.4718, + "step": 25268 + }, + { + "epoch": 1.99, + "learning_rate": 7.660048273158155e-05, + "loss": 1.5264, + "step": 25269 + }, + { + "epoch": 1.99, + "learning_rate": 7.658970408910696e-05, + "loss": 1.4802, + "step": 25270 + }, + { + "epoch": 1.99, + "learning_rate": 7.657892594504771e-05, + "loss": 1.4474, + "step": 25271 + }, + { + "epoch": 1.99, + "learning_rate": 7.656814829947707e-05, + "loss": 1.476, + "step": 25272 + }, + { + "epoch": 1.99, + "learning_rate": 7.655737115246822e-05, + "loss": 1.5106, + "step": 25273 + }, + { + "epoch": 1.99, + "learning_rate": 7.654659450409421e-05, + "loss": 1.4868, + "step": 25274 + }, + { + "epoch": 1.99, + "learning_rate": 7.653581835442834e-05, + "loss": 1.4914, + "step": 25275 + }, + { + "epoch": 1.99, + "learning_rate": 7.652504270354375e-05, + "loss": 1.4402, + "step": 25276 + }, + { + "epoch": 1.99, + "learning_rate": 7.65142675515135e-05, + "loss": 1.4882, + "step": 25277 + }, + { + "epoch": 1.99, + "learning_rate": 7.650349289841087e-05, + "loss": 1.4531, + "step": 25278 + }, + { + "epoch": 1.99, + "learning_rate": 7.649271874430898e-05, + "loss": 1.5186, + "step": 25279 + }, + { + "epoch": 1.99, + "learning_rate": 7.648194508928091e-05, + "loss": 1.4983, + "step": 25280 + }, + { + "epoch": 1.99, + "learning_rate": 7.647117193339984e-05, + "loss": 1.4389, + "step": 25281 + }, + { + "epoch": 1.99, + "learning_rate": 7.6460399276739e-05, + "loss": 1.4981, + "step": 25282 + }, + { + "epoch": 1.99, + "learning_rate": 7.644962711937147e-05, + "loss": 1.4729, + "step": 25283 + }, + { + "epoch": 1.99, + "learning_rate": 7.643885546137032e-05, + "loss": 1.4666, + "step": 25284 + }, + { + "epoch": 1.99, + "learning_rate": 7.642808430280883e-05, + "loss": 1.5055, + "step": 25285 + }, + { + "epoch": 1.99, + "learning_rate": 7.641731364376001e-05, + "loss": 1.5396, + "step": 25286 + }, + { + "epoch": 1.99, + "learning_rate": 7.640654348429705e-05, + "loss": 1.5375, + "step": 25287 + }, + { + "epoch": 1.99, + "learning_rate": 7.639577382449298e-05, + "loss": 1.5267, + "step": 25288 + }, + { + "epoch": 1.99, + "learning_rate": 7.638500466442105e-05, + "loss": 1.4763, + "step": 25289 + }, + { + "epoch": 1.99, + "learning_rate": 7.637423600415433e-05, + "loss": 1.4718, + "step": 25290 + }, + { + "epoch": 1.99, + "learning_rate": 7.636346784376583e-05, + "loss": 1.4899, + "step": 25291 + }, + { + "epoch": 1.99, + "learning_rate": 7.635270018332883e-05, + "loss": 1.494, + "step": 25292 + }, + { + "epoch": 1.99, + "learning_rate": 7.634193302291633e-05, + "loss": 1.5126, + "step": 25293 + }, + { + "epoch": 1.99, + "learning_rate": 7.633116636260141e-05, + "loss": 1.533, + "step": 25294 + }, + { + "epoch": 1.99, + "learning_rate": 7.632040020245722e-05, + "loss": 1.4756, + "step": 25295 + }, + { + "epoch": 1.99, + "learning_rate": 7.63096345425569e-05, + "loss": 1.5112, + "step": 25296 + }, + { + "epoch": 1.99, + "learning_rate": 7.629886938297351e-05, + "loss": 1.4836, + "step": 25297 + }, + { + "epoch": 1.99, + "learning_rate": 7.628810472378005e-05, + "loss": 1.4841, + "step": 25298 + }, + { + "epoch": 1.99, + "learning_rate": 7.627734056504976e-05, + "loss": 1.4758, + "step": 25299 + }, + { + "epoch": 1.99, + "learning_rate": 7.626657690685565e-05, + "loss": 1.4317, + "step": 25300 + }, + { + "epoch": 1.99, + "learning_rate": 7.62558137492707e-05, + "loss": 1.417, + "step": 25301 + }, + { + "epoch": 1.99, + "learning_rate": 7.624505109236816e-05, + "loss": 1.473, + "step": 25302 + }, + { + "epoch": 1.99, + "learning_rate": 7.623428893622103e-05, + "loss": 1.5357, + "step": 25303 + }, + { + "epoch": 1.99, + "learning_rate": 7.622352728090235e-05, + "loss": 1.5497, + "step": 25304 + }, + { + "epoch": 1.99, + "learning_rate": 7.621276612648516e-05, + "loss": 1.5127, + "step": 25305 + }, + { + "epoch": 1.99, + "learning_rate": 7.620200547304263e-05, + "loss": 1.531, + "step": 25306 + }, + { + "epoch": 1.99, + "learning_rate": 7.619124532064775e-05, + "loss": 1.4997, + "step": 25307 + }, + { + "epoch": 1.99, + "learning_rate": 7.618048566937351e-05, + "loss": 1.4252, + "step": 25308 + }, + { + "epoch": 1.99, + "learning_rate": 7.616972651929311e-05, + "loss": 1.4869, + "step": 25309 + }, + { + "epoch": 1.99, + "learning_rate": 7.615896787047955e-05, + "loss": 1.48, + "step": 25310 + }, + { + "epoch": 1.99, + "learning_rate": 7.614820972300574e-05, + "loss": 1.4416, + "step": 25311 + }, + { + "epoch": 1.99, + "learning_rate": 7.613745207694488e-05, + "loss": 1.5106, + "step": 25312 + }, + { + "epoch": 1.99, + "learning_rate": 7.612669493236999e-05, + "loss": 1.4593, + "step": 25313 + }, + { + "epoch": 1.99, + "learning_rate": 7.611593828935409e-05, + "loss": 1.4944, + "step": 25314 + }, + { + "epoch": 1.99, + "learning_rate": 7.61051821479701e-05, + "loss": 1.5605, + "step": 25315 + }, + { + "epoch": 1.99, + "learning_rate": 7.609442650829126e-05, + "loss": 1.4944, + "step": 25316 + }, + { + "epoch": 1.99, + "learning_rate": 7.608367137039044e-05, + "loss": 1.4829, + "step": 25317 + }, + { + "epoch": 1.99, + "learning_rate": 7.607291673434066e-05, + "loss": 1.4577, + "step": 25318 + }, + { + "epoch": 1.99, + "learning_rate": 7.606216260021502e-05, + "loss": 1.4931, + "step": 25319 + }, + { + "epoch": 1.99, + "learning_rate": 7.605140896808651e-05, + "loss": 1.4941, + "step": 25320 + }, + { + "epoch": 1.99, + "learning_rate": 7.604065583802812e-05, + "loss": 1.4737, + "step": 25321 + }, + { + "epoch": 1.99, + "learning_rate": 7.602990321011281e-05, + "loss": 1.4343, + "step": 25322 + }, + { + "epoch": 1.99, + "learning_rate": 7.601915108441369e-05, + "loss": 1.4614, + "step": 25323 + }, + { + "epoch": 1.99, + "learning_rate": 7.60083994610037e-05, + "loss": 1.482, + "step": 25324 + }, + { + "epoch": 1.99, + "learning_rate": 7.599764833995579e-05, + "loss": 1.4988, + "step": 25325 + }, + { + "epoch": 1.99, + "learning_rate": 7.598689772134309e-05, + "loss": 1.4314, + "step": 25326 + }, + { + "epoch": 1.99, + "learning_rate": 7.597614760523842e-05, + "loss": 1.5217, + "step": 25327 + }, + { + "epoch": 1.99, + "learning_rate": 7.596539799171494e-05, + "loss": 1.4392, + "step": 25328 + }, + { + "epoch": 1.99, + "learning_rate": 7.595464888084547e-05, + "loss": 1.4859, + "step": 25329 + }, + { + "epoch": 1.99, + "learning_rate": 7.594390027270316e-05, + "loss": 1.5125, + "step": 25330 + }, + { + "epoch": 1.99, + "learning_rate": 7.593315216736088e-05, + "loss": 1.4937, + "step": 25331 + }, + { + "epoch": 1.99, + "learning_rate": 7.592240456489157e-05, + "loss": 1.4727, + "step": 25332 + }, + { + "epoch": 1.99, + "learning_rate": 7.591165746536832e-05, + "loss": 1.4502, + "step": 25333 + }, + { + "epoch": 1.99, + "learning_rate": 7.5900910868864e-05, + "loss": 1.5005, + "step": 25334 + }, + { + "epoch": 1.99, + "learning_rate": 7.589016477545158e-05, + "loss": 1.4758, + "step": 25335 + }, + { + "epoch": 1.99, + "learning_rate": 7.587941918520411e-05, + "loss": 1.4586, + "step": 25336 + }, + { + "epoch": 1.99, + "learning_rate": 7.586867409819445e-05, + "loss": 1.4434, + "step": 25337 + }, + { + "epoch": 1.99, + "learning_rate": 7.585792951449558e-05, + "loss": 1.5349, + "step": 25338 + }, + { + "epoch": 1.99, + "learning_rate": 7.584718543418043e-05, + "loss": 1.4463, + "step": 25339 + }, + { + "epoch": 1.99, + "learning_rate": 7.583644185732201e-05, + "loss": 1.5021, + "step": 25340 + }, + { + "epoch": 1.99, + "learning_rate": 7.582569878399321e-05, + "loss": 1.5014, + "step": 25341 + }, + { + "epoch": 1.99, + "learning_rate": 7.581495621426694e-05, + "loss": 1.4699, + "step": 25342 + }, + { + "epoch": 1.99, + "learning_rate": 7.580421414821618e-05, + "loss": 1.491, + "step": 25343 + }, + { + "epoch": 1.99, + "learning_rate": 7.579347258591391e-05, + "loss": 1.5199, + "step": 25344 + }, + { + "epoch": 1.99, + "learning_rate": 7.578273152743302e-05, + "loss": 1.4161, + "step": 25345 + }, + { + "epoch": 1.99, + "learning_rate": 7.577199097284636e-05, + "loss": 1.4492, + "step": 25346 + }, + { + "epoch": 1.99, + "learning_rate": 7.576125092222697e-05, + "loss": 1.4535, + "step": 25347 + }, + { + "epoch": 1.99, + "learning_rate": 7.575051137564774e-05, + "loss": 1.5033, + "step": 25348 + }, + { + "epoch": 1.99, + "learning_rate": 7.573977233318149e-05, + "loss": 1.449, + "step": 25349 + }, + { + "epoch": 1.99, + "learning_rate": 7.572903379490126e-05, + "loss": 1.5124, + "step": 25350 + }, + { + "epoch": 1.99, + "learning_rate": 7.571829576087992e-05, + "loss": 1.4637, + "step": 25351 + }, + { + "epoch": 1.99, + "learning_rate": 7.57075582311903e-05, + "loss": 1.5026, + "step": 25352 + }, + { + "epoch": 1.99, + "learning_rate": 7.56968212059054e-05, + "loss": 1.4991, + "step": 25353 + }, + { + "epoch": 1.99, + "learning_rate": 7.568608468509809e-05, + "loss": 1.4946, + "step": 25354 + }, + { + "epoch": 1.99, + "learning_rate": 7.567534866884122e-05, + "loss": 1.5085, + "step": 25355 + }, + { + "epoch": 2.0, + "learning_rate": 7.566461315720776e-05, + "loss": 1.4212, + "step": 25356 + }, + { + "epoch": 2.0, + "learning_rate": 7.565387815027055e-05, + "loss": 1.4722, + "step": 25357 + }, + { + "epoch": 2.0, + "learning_rate": 7.56431436481024e-05, + "loss": 1.4951, + "step": 25358 + }, + { + "epoch": 2.0, + "learning_rate": 7.563240965077631e-05, + "loss": 1.4738, + "step": 25359 + }, + { + "epoch": 2.0, + "learning_rate": 7.562167615836517e-05, + "loss": 1.4781, + "step": 25360 + }, + { + "epoch": 2.0, + "learning_rate": 7.561094317094177e-05, + "loss": 1.5354, + "step": 25361 + }, + { + "epoch": 2.0, + "learning_rate": 7.560021068857905e-05, + "loss": 1.5004, + "step": 25362 + }, + { + "epoch": 2.0, + "learning_rate": 7.558947871134976e-05, + "loss": 1.5234, + "step": 25363 + }, + { + "epoch": 2.0, + "learning_rate": 7.557874723932693e-05, + "loss": 1.4401, + "step": 25364 + }, + { + "epoch": 2.0, + "learning_rate": 7.556801627258332e-05, + "loss": 1.4448, + "step": 25365 + }, + { + "epoch": 2.0, + "learning_rate": 7.555728581119175e-05, + "loss": 1.4828, + "step": 25366 + }, + { + "epoch": 2.0, + "learning_rate": 7.554655585522518e-05, + "loss": 1.4493, + "step": 25367 + }, + { + "epoch": 2.0, + "learning_rate": 7.553582640475642e-05, + "loss": 1.4499, + "step": 25368 + }, + { + "epoch": 2.0, + "learning_rate": 7.552509745985825e-05, + "loss": 1.4675, + "step": 25369 + }, + { + "epoch": 2.0, + "learning_rate": 7.551436902060362e-05, + "loss": 1.463, + "step": 25370 + }, + { + "epoch": 2.0, + "learning_rate": 7.550364108706532e-05, + "loss": 1.4647, + "step": 25371 + }, + { + "epoch": 2.0, + "learning_rate": 7.549291365931612e-05, + "loss": 1.4297, + "step": 25372 + }, + { + "epoch": 2.0, + "learning_rate": 7.548218673742901e-05, + "loss": 1.4531, + "step": 25373 + }, + { + "epoch": 2.0, + "learning_rate": 7.547146032147664e-05, + "loss": 1.4719, + "step": 25374 + }, + { + "epoch": 2.0, + "learning_rate": 7.5460734411532e-05, + "loss": 1.5098, + "step": 25375 + }, + { + "epoch": 2.0, + "learning_rate": 7.545000900766776e-05, + "loss": 1.4535, + "step": 25376 + }, + { + "epoch": 2.0, + "learning_rate": 7.54392841099569e-05, + "loss": 1.5275, + "step": 25377 + }, + { + "epoch": 2.0, + "learning_rate": 7.542855971847214e-05, + "loss": 1.5099, + "step": 25378 + }, + { + "epoch": 2.0, + "learning_rate": 7.54178358332863e-05, + "loss": 1.4374, + "step": 25379 + }, + { + "epoch": 2.0, + "learning_rate": 7.540711245447216e-05, + "loss": 1.466, + "step": 25380 + }, + { + "epoch": 2.0, + "learning_rate": 7.539638958210263e-05, + "loss": 1.5151, + "step": 25381 + }, + { + "epoch": 2.0, + "learning_rate": 7.538566721625043e-05, + "loss": 1.4558, + "step": 25382 + }, + { + "epoch": 2.0, + "learning_rate": 7.53749453569883e-05, + "loss": 1.4859, + "step": 25383 + }, + { + "epoch": 2.0, + "learning_rate": 7.536422400438918e-05, + "loss": 1.5211, + "step": 25384 + }, + { + "epoch": 2.0, + "learning_rate": 7.53535031585258e-05, + "loss": 1.4729, + "step": 25385 + }, + { + "epoch": 2.0, + "learning_rate": 7.534278281947088e-05, + "loss": 1.4581, + "step": 25386 + }, + { + "epoch": 2.0, + "learning_rate": 7.533206298729732e-05, + "loss": 1.509, + "step": 25387 + }, + { + "epoch": 2.0, + "learning_rate": 7.532134366207786e-05, + "loss": 1.5061, + "step": 25388 + }, + { + "epoch": 2.0, + "learning_rate": 7.531062484388519e-05, + "loss": 1.4433, + "step": 25389 + }, + { + "epoch": 2.0, + "learning_rate": 7.529990653279215e-05, + "loss": 1.4436, + "step": 25390 + }, + { + "epoch": 2.0, + "learning_rate": 7.52891887288716e-05, + "loss": 1.5279, + "step": 25391 + }, + { + "epoch": 2.0, + "learning_rate": 7.527847143219623e-05, + "loss": 1.5053, + "step": 25392 + }, + { + "epoch": 2.0, + "learning_rate": 7.526775464283873e-05, + "loss": 1.455, + "step": 25393 + }, + { + "epoch": 2.0, + "learning_rate": 7.5257038360872e-05, + "loss": 1.4662, + "step": 25394 + }, + { + "epoch": 2.0, + "learning_rate": 7.524632258636874e-05, + "loss": 1.4996, + "step": 25395 + }, + { + "epoch": 2.0, + "learning_rate": 7.523560731940163e-05, + "loss": 1.502, + "step": 25396 + }, + { + "epoch": 2.0, + "learning_rate": 7.522489256004357e-05, + "loss": 1.4563, + "step": 25397 + }, + { + "epoch": 2.0, + "learning_rate": 7.52141783083672e-05, + "loss": 1.4695, + "step": 25398 + }, + { + "epoch": 2.0, + "learning_rate": 7.520346456444531e-05, + "loss": 1.4768, + "step": 25399 + }, + { + "epoch": 2.0, + "learning_rate": 7.519275132835052e-05, + "loss": 1.4876, + "step": 25400 + }, + { + "epoch": 2.0, + "learning_rate": 7.518203860015576e-05, + "loss": 1.5487, + "step": 25401 + }, + { + "epoch": 2.0, + "learning_rate": 7.517132637993366e-05, + "loss": 1.5039, + "step": 25402 + }, + { + "epoch": 2.0, + "learning_rate": 7.51606146677569e-05, + "loss": 1.4435, + "step": 25403 + }, + { + "epoch": 2.0, + "learning_rate": 7.514990346369833e-05, + "loss": 1.4866, + "step": 25404 + }, + { + "epoch": 2.0, + "learning_rate": 7.513919276783055e-05, + "loss": 1.4878, + "step": 25405 + }, + { + "epoch": 2.0, + "learning_rate": 7.51284825802264e-05, + "loss": 1.5251, + "step": 25406 + }, + { + "epoch": 2.0, + "learning_rate": 7.511777290095848e-05, + "loss": 1.4809, + "step": 25407 + }, + { + "epoch": 2.0, + "learning_rate": 7.51070637300996e-05, + "loss": 1.4381, + "step": 25408 + }, + { + "epoch": 2.0, + "learning_rate": 7.509635506772244e-05, + "loss": 1.5179, + "step": 25409 + }, + { + "epoch": 2.0, + "learning_rate": 7.508564691389964e-05, + "loss": 1.4522, + "step": 25410 + }, + { + "epoch": 2.0, + "learning_rate": 7.507493926870403e-05, + "loss": 1.4848, + "step": 25411 + }, + { + "epoch": 2.0, + "learning_rate": 7.50642321322082e-05, + "loss": 1.5028, + "step": 25412 + }, + { + "epoch": 2.0, + "learning_rate": 7.505352550448483e-05, + "loss": 1.5235, + "step": 25413 + }, + { + "epoch": 2.0, + "learning_rate": 7.504281938560673e-05, + "loss": 1.5265, + "step": 25414 + }, + { + "epoch": 2.0, + "learning_rate": 7.503211377564652e-05, + "loss": 1.425, + "step": 25415 + }, + { + "epoch": 2.0, + "learning_rate": 7.50214086746769e-05, + "loss": 1.4788, + "step": 25416 + }, + { + "epoch": 2.0, + "learning_rate": 7.501070408277047e-05, + "loss": 1.5071, + "step": 25417 + }, + { + "epoch": 2.0, + "learning_rate": 7.500000000000002e-05, + "loss": 1.4764, + "step": 25418 + }, + { + "epoch": 2.0, + "learning_rate": 7.49892964264382e-05, + "loss": 1.4458, + "step": 25419 + }, + { + "epoch": 2.0, + "learning_rate": 7.497859336215758e-05, + "loss": 1.4265, + "step": 25420 + }, + { + "epoch": 2.0, + "learning_rate": 7.496789080723093e-05, + "loss": 1.4619, + "step": 25421 + }, + { + "epoch": 2.0, + "learning_rate": 7.495718876173097e-05, + "loss": 1.4466, + "step": 25422 + }, + { + "epoch": 2.0, + "learning_rate": 7.494648722573027e-05, + "loss": 1.4412, + "step": 25423 + }, + { + "epoch": 2.0, + "learning_rate": 7.493578619930145e-05, + "loss": 1.4859, + "step": 25424 + }, + { + "epoch": 2.0, + "learning_rate": 7.492508568251727e-05, + "loss": 1.4936, + "step": 25425 + }, + { + "epoch": 2.0, + "learning_rate": 7.491438567545032e-05, + "loss": 1.4631, + "step": 25426 + }, + { + "epoch": 2.0, + "learning_rate": 7.490368617817321e-05, + "loss": 1.4498, + "step": 25427 + }, + { + "epoch": 2.0, + "learning_rate": 7.489298719075869e-05, + "loss": 1.4615, + "step": 25428 + }, + { + "epoch": 2.0, + "learning_rate": 7.488228871327934e-05, + "loss": 1.4935, + "step": 25429 + }, + { + "epoch": 2.0, + "learning_rate": 7.487159074580772e-05, + "loss": 1.4953, + "step": 25430 + }, + { + "epoch": 2.0, + "learning_rate": 7.486089328841661e-05, + "loss": 1.5141, + "step": 25431 + }, + { + "epoch": 2.0, + "learning_rate": 7.485019634117858e-05, + "loss": 1.4864, + "step": 25432 + }, + { + "epoch": 2.0, + "learning_rate": 7.483949990416622e-05, + "loss": 1.4298, + "step": 25433 + }, + { + "epoch": 2.0, + "learning_rate": 7.482880397745214e-05, + "loss": 1.4744, + "step": 25434 + }, + { + "epoch": 2.0, + "learning_rate": 7.481810856110905e-05, + "loss": 1.4144, + "step": 25435 + }, + { + "epoch": 2.0, + "learning_rate": 7.480741365520951e-05, + "loss": 1.4703, + "step": 25436 + }, + { + "epoch": 2.0, + "learning_rate": 7.479671925982609e-05, + "loss": 1.4394, + "step": 25437 + }, + { + "epoch": 2.0, + "learning_rate": 7.478602537503143e-05, + "loss": 1.4375, + "step": 25438 + }, + { + "epoch": 2.0, + "learning_rate": 7.477533200089822e-05, + "loss": 1.438, + "step": 25439 + }, + { + "epoch": 2.0, + "learning_rate": 7.4764639137499e-05, + "loss": 1.457, + "step": 25440 + }, + { + "epoch": 2.0, + "learning_rate": 7.47539467849063e-05, + "loss": 1.4576, + "step": 25441 + }, + { + "epoch": 2.0, + "learning_rate": 7.474325494319283e-05, + "loss": 1.3786, + "step": 25442 + }, + { + "epoch": 2.0, + "learning_rate": 7.473256361243113e-05, + "loss": 1.4951, + "step": 25443 + }, + { + "epoch": 2.0, + "learning_rate": 7.472187279269373e-05, + "loss": 1.4086, + "step": 25444 + }, + { + "epoch": 2.0, + "learning_rate": 7.471118248405334e-05, + "loss": 1.4588, + "step": 25445 + }, + { + "epoch": 2.0, + "learning_rate": 7.470049268658246e-05, + "loss": 1.4566, + "step": 25446 + }, + { + "epoch": 2.0, + "learning_rate": 7.468980340035361e-05, + "loss": 1.5186, + "step": 25447 + }, + { + "epoch": 2.0, + "learning_rate": 7.46791146254395e-05, + "loss": 1.486, + "step": 25448 + }, + { + "epoch": 2.0, + "learning_rate": 7.466842636191266e-05, + "loss": 1.4317, + "step": 25449 + }, + { + "epoch": 2.0, + "learning_rate": 7.465773860984557e-05, + "loss": 1.5232, + "step": 25450 + }, + { + "epoch": 2.0, + "learning_rate": 7.46470513693109e-05, + "loss": 1.4619, + "step": 25451 + }, + { + "epoch": 2.0, + "learning_rate": 7.463636464038116e-05, + "loss": 1.4651, + "step": 25452 + }, + { + "epoch": 2.0, + "learning_rate": 7.462567842312887e-05, + "loss": 1.4532, + "step": 25453 + }, + { + "epoch": 2.0, + "learning_rate": 7.461499271762664e-05, + "loss": 1.4271, + "step": 25454 + }, + { + "epoch": 2.0, + "learning_rate": 7.460430752394706e-05, + "loss": 1.4377, + "step": 25455 + }, + { + "epoch": 2.0, + "learning_rate": 7.459362284216262e-05, + "loss": 1.4718, + "step": 25456 + }, + { + "epoch": 2.0, + "learning_rate": 7.458293867234588e-05, + "loss": 1.5016, + "step": 25457 + }, + { + "epoch": 2.0, + "learning_rate": 7.457225501456928e-05, + "loss": 1.4499, + "step": 25458 + }, + { + "epoch": 2.0, + "learning_rate": 7.456157186890554e-05, + "loss": 1.4567, + "step": 25459 + }, + { + "epoch": 2.0, + "learning_rate": 7.455088923542707e-05, + "loss": 1.4928, + "step": 25460 + }, + { + "epoch": 2.0, + "learning_rate": 7.454020711420636e-05, + "loss": 1.503, + "step": 25461 + }, + { + "epoch": 2.0, + "learning_rate": 7.452952550531608e-05, + "loss": 1.4927, + "step": 25462 + }, + { + "epoch": 2.0, + "learning_rate": 7.451884440882867e-05, + "loss": 1.4439, + "step": 25463 + }, + { + "epoch": 2.0, + "learning_rate": 7.45081638248166e-05, + "loss": 1.4673, + "step": 25464 + }, + { + "epoch": 2.0, + "learning_rate": 7.449748375335248e-05, + "loss": 1.426, + "step": 25465 + }, + { + "epoch": 2.0, + "learning_rate": 7.448680419450879e-05, + "loss": 1.4719, + "step": 25466 + }, + { + "epoch": 2.0, + "learning_rate": 7.447612514835797e-05, + "loss": 1.4429, + "step": 25467 + }, + { + "epoch": 2.0, + "learning_rate": 7.446544661497258e-05, + "loss": 1.4619, + "step": 25468 + }, + { + "epoch": 2.0, + "learning_rate": 7.445476859442518e-05, + "loss": 1.4708, + "step": 25469 + }, + { + "epoch": 2.0, + "learning_rate": 7.444409108678823e-05, + "loss": 1.433, + "step": 25470 + }, + { + "epoch": 2.0, + "learning_rate": 7.443341409213413e-05, + "loss": 1.4392, + "step": 25471 + }, + { + "epoch": 2.0, + "learning_rate": 7.44227376105355e-05, + "loss": 1.4889, + "step": 25472 + }, + { + "epoch": 2.0, + "learning_rate": 7.441206164206479e-05, + "loss": 1.4777, + "step": 25473 + }, + { + "epoch": 2.0, + "learning_rate": 7.440138618679447e-05, + "loss": 1.5297, + "step": 25474 + }, + { + "epoch": 2.0, + "learning_rate": 7.439071124479693e-05, + "loss": 1.4538, + "step": 25475 + }, + { + "epoch": 2.0, + "learning_rate": 7.438003681614482e-05, + "loss": 1.4196, + "step": 25476 + }, + { + "epoch": 2.0, + "learning_rate": 7.436936290091053e-05, + "loss": 1.4915, + "step": 25477 + }, + { + "epoch": 2.0, + "learning_rate": 7.435868949916648e-05, + "loss": 1.3885, + "step": 25478 + }, + { + "epoch": 2.0, + "learning_rate": 7.434801661098522e-05, + "loss": 1.4428, + "step": 25479 + }, + { + "epoch": 2.0, + "learning_rate": 7.43373442364392e-05, + "loss": 1.4019, + "step": 25480 + }, + { + "epoch": 2.0, + "learning_rate": 7.432667237560079e-05, + "loss": 1.46, + "step": 25481 + }, + { + "epoch": 2.0, + "learning_rate": 7.431600102854258e-05, + "loss": 1.4531, + "step": 25482 + }, + { + "epoch": 2.01, + "learning_rate": 7.430533019533695e-05, + "loss": 1.4691, + "step": 25483 + }, + { + "epoch": 2.01, + "learning_rate": 7.42946598760563e-05, + "loss": 1.4919, + "step": 25484 + }, + { + "epoch": 2.01, + "learning_rate": 7.428399007077312e-05, + "loss": 1.4711, + "step": 25485 + }, + { + "epoch": 2.01, + "learning_rate": 7.427332077955994e-05, + "loss": 1.4623, + "step": 25486 + }, + { + "epoch": 2.01, + "learning_rate": 7.426265200248912e-05, + "loss": 1.467, + "step": 25487 + }, + { + "epoch": 2.01, + "learning_rate": 7.425198373963304e-05, + "loss": 1.4705, + "step": 25488 + }, + { + "epoch": 2.01, + "learning_rate": 7.424131599106423e-05, + "loss": 1.4447, + "step": 25489 + }, + { + "epoch": 2.01, + "learning_rate": 7.42306487568551e-05, + "loss": 1.443, + "step": 25490 + }, + { + "epoch": 2.01, + "learning_rate": 7.421998203707803e-05, + "loss": 1.4364, + "step": 25491 + }, + { + "epoch": 2.01, + "learning_rate": 7.420931583180542e-05, + "loss": 1.4071, + "step": 25492 + }, + { + "epoch": 2.01, + "learning_rate": 7.419865014110978e-05, + "loss": 1.4394, + "step": 25493 + }, + { + "epoch": 2.01, + "learning_rate": 7.418798496506349e-05, + "loss": 1.4694, + "step": 25494 + }, + { + "epoch": 2.01, + "learning_rate": 7.417732030373889e-05, + "loss": 1.4471, + "step": 25495 + }, + { + "epoch": 2.01, + "learning_rate": 7.416665615720848e-05, + "loss": 1.4432, + "step": 25496 + }, + { + "epoch": 2.01, + "learning_rate": 7.415599252554462e-05, + "loss": 1.4213, + "step": 25497 + }, + { + "epoch": 2.01, + "learning_rate": 7.414532940881968e-05, + "loss": 1.3855, + "step": 25498 + }, + { + "epoch": 2.01, + "learning_rate": 7.413466680710615e-05, + "loss": 1.4836, + "step": 25499 + }, + { + "epoch": 2.01, + "learning_rate": 7.41240047204763e-05, + "loss": 1.4737, + "step": 25500 + }, + { + "epoch": 2.01, + "learning_rate": 7.411334314900263e-05, + "loss": 1.4467, + "step": 25501 + }, + { + "epoch": 2.01, + "learning_rate": 7.410268209275747e-05, + "loss": 1.515, + "step": 25502 + }, + { + "epoch": 2.01, + "learning_rate": 7.409202155181324e-05, + "loss": 1.4501, + "step": 25503 + }, + { + "epoch": 2.01, + "learning_rate": 7.408136152624229e-05, + "loss": 1.4327, + "step": 25504 + }, + { + "epoch": 2.01, + "learning_rate": 7.407070201611695e-05, + "loss": 1.4359, + "step": 25505 + }, + { + "epoch": 2.01, + "learning_rate": 7.40600430215097e-05, + "loss": 1.4623, + "step": 25506 + }, + { + "epoch": 2.01, + "learning_rate": 7.404938454249285e-05, + "loss": 1.4047, + "step": 25507 + }, + { + "epoch": 2.01, + "learning_rate": 7.40387265791387e-05, + "loss": 1.454, + "step": 25508 + }, + { + "epoch": 2.01, + "learning_rate": 7.402806913151977e-05, + "loss": 1.4623, + "step": 25509 + }, + { + "epoch": 2.01, + "learning_rate": 7.401741219970829e-05, + "loss": 1.4582, + "step": 25510 + }, + { + "epoch": 2.01, + "learning_rate": 7.400675578377665e-05, + "loss": 1.544, + "step": 25511 + }, + { + "epoch": 2.01, + "learning_rate": 7.399609988379716e-05, + "loss": 1.3921, + "step": 25512 + }, + { + "epoch": 2.01, + "learning_rate": 7.398544449984228e-05, + "loss": 1.4797, + "step": 25513 + }, + { + "epoch": 2.01, + "learning_rate": 7.397478963198425e-05, + "loss": 1.4547, + "step": 25514 + }, + { + "epoch": 2.01, + "learning_rate": 7.39641352802954e-05, + "loss": 1.4739, + "step": 25515 + }, + { + "epoch": 2.01, + "learning_rate": 7.395348144484811e-05, + "loss": 1.4869, + "step": 25516 + }, + { + "epoch": 2.01, + "learning_rate": 7.394282812571479e-05, + "loss": 1.469, + "step": 25517 + }, + { + "epoch": 2.01, + "learning_rate": 7.393217532296769e-05, + "loss": 1.447, + "step": 25518 + }, + { + "epoch": 2.01, + "learning_rate": 7.392152303667907e-05, + "loss": 1.478, + "step": 25519 + }, + { + "epoch": 2.01, + "learning_rate": 7.391087126692139e-05, + "loss": 1.4297, + "step": 25520 + }, + { + "epoch": 2.01, + "learning_rate": 7.39002200137669e-05, + "loss": 1.4587, + "step": 25521 + }, + { + "epoch": 2.01, + "learning_rate": 7.388956927728786e-05, + "loss": 1.4586, + "step": 25522 + }, + { + "epoch": 2.01, + "learning_rate": 7.387891905755672e-05, + "loss": 1.4655, + "step": 25523 + }, + { + "epoch": 2.01, + "learning_rate": 7.386826935464569e-05, + "loss": 1.5097, + "step": 25524 + }, + { + "epoch": 2.01, + "learning_rate": 7.385762016862705e-05, + "loss": 1.4864, + "step": 25525 + }, + { + "epoch": 2.01, + "learning_rate": 7.384697149957321e-05, + "loss": 1.4541, + "step": 25526 + }, + { + "epoch": 2.01, + "learning_rate": 7.383632334755642e-05, + "loss": 1.4268, + "step": 25527 + }, + { + "epoch": 2.01, + "learning_rate": 7.382567571264894e-05, + "loss": 1.4596, + "step": 25528 + }, + { + "epoch": 2.01, + "learning_rate": 7.381502859492303e-05, + "loss": 1.4632, + "step": 25529 + }, + { + "epoch": 2.01, + "learning_rate": 7.380438199445111e-05, + "loss": 1.4786, + "step": 25530 + }, + { + "epoch": 2.01, + "learning_rate": 7.379373591130533e-05, + "loss": 1.3976, + "step": 25531 + }, + { + "epoch": 2.01, + "learning_rate": 7.378309034555807e-05, + "loss": 1.4404, + "step": 25532 + }, + { + "epoch": 2.01, + "learning_rate": 7.377244529728151e-05, + "loss": 1.4617, + "step": 25533 + }, + { + "epoch": 2.01, + "learning_rate": 7.376180076654804e-05, + "loss": 1.484, + "step": 25534 + }, + { + "epoch": 2.01, + "learning_rate": 7.375115675342988e-05, + "loss": 1.4699, + "step": 25535 + }, + { + "epoch": 2.01, + "learning_rate": 7.374051325799923e-05, + "loss": 1.4598, + "step": 25536 + }, + { + "epoch": 2.01, + "learning_rate": 7.372987028032846e-05, + "loss": 1.4687, + "step": 25537 + }, + { + "epoch": 2.01, + "learning_rate": 7.371922782048979e-05, + "loss": 1.4898, + "step": 25538 + }, + { + "epoch": 2.01, + "learning_rate": 7.370858587855541e-05, + "loss": 1.446, + "step": 25539 + }, + { + "epoch": 2.01, + "learning_rate": 7.369794445459768e-05, + "loss": 1.4283, + "step": 25540 + }, + { + "epoch": 2.01, + "learning_rate": 7.36873035486888e-05, + "loss": 1.4489, + "step": 25541 + }, + { + "epoch": 2.01, + "learning_rate": 7.367666316090097e-05, + "loss": 1.5041, + "step": 25542 + }, + { + "epoch": 2.01, + "learning_rate": 7.366602329130653e-05, + "loss": 1.4633, + "step": 25543 + }, + { + "epoch": 2.01, + "learning_rate": 7.365538393997767e-05, + "loss": 1.4591, + "step": 25544 + }, + { + "epoch": 2.01, + "learning_rate": 7.364474510698661e-05, + "loss": 1.4809, + "step": 25545 + }, + { + "epoch": 2.01, + "learning_rate": 7.363410679240556e-05, + "loss": 1.4371, + "step": 25546 + }, + { + "epoch": 2.01, + "learning_rate": 7.362346899630675e-05, + "loss": 1.4839, + "step": 25547 + }, + { + "epoch": 2.01, + "learning_rate": 7.361283171876252e-05, + "loss": 1.457, + "step": 25548 + }, + { + "epoch": 2.01, + "learning_rate": 7.360219495984494e-05, + "loss": 1.471, + "step": 25549 + }, + { + "epoch": 2.01, + "learning_rate": 7.359155871962637e-05, + "loss": 1.4229, + "step": 25550 + }, + { + "epoch": 2.01, + "learning_rate": 7.358092299817894e-05, + "loss": 1.449, + "step": 25551 + }, + { + "epoch": 2.01, + "learning_rate": 7.357028779557488e-05, + "loss": 1.4792, + "step": 25552 + }, + { + "epoch": 2.01, + "learning_rate": 7.355965311188631e-05, + "loss": 1.5017, + "step": 25553 + }, + { + "epoch": 2.01, + "learning_rate": 7.354901894718559e-05, + "loss": 1.4585, + "step": 25554 + }, + { + "epoch": 2.01, + "learning_rate": 7.353838530154483e-05, + "loss": 1.4424, + "step": 25555 + }, + { + "epoch": 2.01, + "learning_rate": 7.352775217503618e-05, + "loss": 1.5119, + "step": 25556 + }, + { + "epoch": 2.01, + "learning_rate": 7.351711956773196e-05, + "loss": 1.4173, + "step": 25557 + }, + { + "epoch": 2.01, + "learning_rate": 7.350648747970428e-05, + "loss": 1.5272, + "step": 25558 + }, + { + "epoch": 2.01, + "learning_rate": 7.349585591102528e-05, + "loss": 1.4983, + "step": 25559 + }, + { + "epoch": 2.01, + "learning_rate": 7.348522486176727e-05, + "loss": 1.4607, + "step": 25560 + }, + { + "epoch": 2.01, + "learning_rate": 7.347459433200235e-05, + "loss": 1.4413, + "step": 25561 + }, + { + "epoch": 2.01, + "learning_rate": 7.346396432180267e-05, + "loss": 1.4333, + "step": 25562 + }, + { + "epoch": 2.01, + "learning_rate": 7.34533348312404e-05, + "loss": 1.4416, + "step": 25563 + }, + { + "epoch": 2.01, + "learning_rate": 7.344270586038782e-05, + "loss": 1.4779, + "step": 25564 + }, + { + "epoch": 2.01, + "learning_rate": 7.343207740931702e-05, + "loss": 1.4792, + "step": 25565 + }, + { + "epoch": 2.01, + "learning_rate": 7.34214494781001e-05, + "loss": 1.4726, + "step": 25566 + }, + { + "epoch": 2.01, + "learning_rate": 7.341082206680932e-05, + "loss": 1.4527, + "step": 25567 + }, + { + "epoch": 2.01, + "learning_rate": 7.340019517551682e-05, + "loss": 1.4756, + "step": 25568 + }, + { + "epoch": 2.01, + "learning_rate": 7.338956880429472e-05, + "loss": 1.4614, + "step": 25569 + }, + { + "epoch": 2.01, + "learning_rate": 7.337894295321509e-05, + "loss": 1.4881, + "step": 25570 + }, + { + "epoch": 2.01, + "learning_rate": 7.336831762235023e-05, + "loss": 1.4561, + "step": 25571 + }, + { + "epoch": 2.01, + "learning_rate": 7.335769281177221e-05, + "loss": 1.4298, + "step": 25572 + }, + { + "epoch": 2.01, + "learning_rate": 7.334706852155308e-05, + "loss": 1.4599, + "step": 25573 + }, + { + "epoch": 2.01, + "learning_rate": 7.333644475176514e-05, + "loss": 1.4919, + "step": 25574 + }, + { + "epoch": 2.01, + "learning_rate": 7.332582150248041e-05, + "loss": 1.3991, + "step": 25575 + }, + { + "epoch": 2.01, + "learning_rate": 7.331519877377099e-05, + "loss": 1.4343, + "step": 25576 + }, + { + "epoch": 2.01, + "learning_rate": 7.330457656570912e-05, + "loss": 1.4527, + "step": 25577 + }, + { + "epoch": 2.01, + "learning_rate": 7.329395487836678e-05, + "loss": 1.465, + "step": 25578 + }, + { + "epoch": 2.01, + "learning_rate": 7.328333371181623e-05, + "loss": 1.4584, + "step": 25579 + }, + { + "epoch": 2.01, + "learning_rate": 7.327271306612944e-05, + "loss": 1.4699, + "step": 25580 + }, + { + "epoch": 2.01, + "learning_rate": 7.326209294137864e-05, + "loss": 1.5, + "step": 25581 + }, + { + "epoch": 2.01, + "learning_rate": 7.325147333763589e-05, + "loss": 1.4528, + "step": 25582 + }, + { + "epoch": 2.01, + "learning_rate": 7.324085425497321e-05, + "loss": 1.4377, + "step": 25583 + }, + { + "epoch": 2.01, + "learning_rate": 7.323023569346285e-05, + "loss": 1.4389, + "step": 25584 + }, + { + "epoch": 2.01, + "learning_rate": 7.32196176531768e-05, + "loss": 1.4083, + "step": 25585 + }, + { + "epoch": 2.01, + "learning_rate": 7.32090001341872e-05, + "loss": 1.4255, + "step": 25586 + }, + { + "epoch": 2.01, + "learning_rate": 7.319838313656605e-05, + "loss": 1.462, + "step": 25587 + }, + { + "epoch": 2.01, + "learning_rate": 7.318776666038556e-05, + "loss": 1.4521, + "step": 25588 + }, + { + "epoch": 2.01, + "learning_rate": 7.317715070571772e-05, + "loss": 1.4287, + "step": 25589 + }, + { + "epoch": 2.01, + "learning_rate": 7.316653527263459e-05, + "loss": 1.4599, + "step": 25590 + }, + { + "epoch": 2.01, + "learning_rate": 7.315592036120835e-05, + "loss": 1.4481, + "step": 25591 + }, + { + "epoch": 2.01, + "learning_rate": 7.314530597151098e-05, + "loss": 1.4732, + "step": 25592 + }, + { + "epoch": 2.01, + "learning_rate": 7.313469210361453e-05, + "loss": 1.4625, + "step": 25593 + }, + { + "epoch": 2.01, + "learning_rate": 7.31240787575911e-05, + "loss": 1.4449, + "step": 25594 + }, + { + "epoch": 2.01, + "learning_rate": 7.31134659335128e-05, + "loss": 1.3664, + "step": 25595 + }, + { + "epoch": 2.01, + "learning_rate": 7.310285363145166e-05, + "loss": 1.4845, + "step": 25596 + }, + { + "epoch": 2.01, + "learning_rate": 7.309224185147965e-05, + "loss": 1.4782, + "step": 25597 + }, + { + "epoch": 2.01, + "learning_rate": 7.308163059366892e-05, + "loss": 1.4752, + "step": 25598 + }, + { + "epoch": 2.01, + "learning_rate": 7.307101985809147e-05, + "loss": 1.4511, + "step": 25599 + }, + { + "epoch": 2.01, + "learning_rate": 7.30604096448193e-05, + "loss": 1.4439, + "step": 25600 + }, + { + "epoch": 2.01, + "learning_rate": 7.304979995392452e-05, + "loss": 1.4516, + "step": 25601 + }, + { + "epoch": 2.01, + "learning_rate": 7.303919078547915e-05, + "loss": 1.4269, + "step": 25602 + }, + { + "epoch": 2.01, + "learning_rate": 7.30285821395552e-05, + "loss": 1.4856, + "step": 25603 + }, + { + "epoch": 2.01, + "learning_rate": 7.301797401622465e-05, + "loss": 1.4494, + "step": 25604 + }, + { + "epoch": 2.01, + "learning_rate": 7.300736641555962e-05, + "loss": 1.4761, + "step": 25605 + }, + { + "epoch": 2.01, + "learning_rate": 7.29967593376321e-05, + "loss": 1.4595, + "step": 25606 + }, + { + "epoch": 2.01, + "learning_rate": 7.298615278251403e-05, + "loss": 1.4629, + "step": 25607 + }, + { + "epoch": 2.01, + "learning_rate": 7.297554675027754e-05, + "loss": 1.4501, + "step": 25608 + }, + { + "epoch": 2.01, + "learning_rate": 7.296494124099457e-05, + "loss": 1.4599, + "step": 25609 + }, + { + "epoch": 2.02, + "learning_rate": 7.295433625473709e-05, + "loss": 1.4238, + "step": 25610 + }, + { + "epoch": 2.02, + "learning_rate": 7.294373179157715e-05, + "loss": 1.4652, + "step": 25611 + }, + { + "epoch": 2.02, + "learning_rate": 7.29331278515868e-05, + "loss": 1.4106, + "step": 25612 + }, + { + "epoch": 2.02, + "learning_rate": 7.292252443483798e-05, + "loss": 1.528, + "step": 25613 + }, + { + "epoch": 2.02, + "learning_rate": 7.291192154140263e-05, + "loss": 1.4875, + "step": 25614 + }, + { + "epoch": 2.02, + "learning_rate": 7.290131917135284e-05, + "loss": 1.4733, + "step": 25615 + }, + { + "epoch": 2.02, + "learning_rate": 7.289071732476057e-05, + "loss": 1.4194, + "step": 25616 + }, + { + "epoch": 2.02, + "learning_rate": 7.28801160016977e-05, + "loss": 1.3963, + "step": 25617 + }, + { + "epoch": 2.02, + "learning_rate": 7.286951520223637e-05, + "loss": 1.5206, + "step": 25618 + }, + { + "epoch": 2.02, + "learning_rate": 7.285891492644843e-05, + "loss": 1.4805, + "step": 25619 + }, + { + "epoch": 2.02, + "learning_rate": 7.284831517440585e-05, + "loss": 1.4337, + "step": 25620 + }, + { + "epoch": 2.02, + "learning_rate": 7.283771594618068e-05, + "loss": 1.4366, + "step": 25621 + }, + { + "epoch": 2.02, + "learning_rate": 7.282711724184487e-05, + "loss": 1.4972, + "step": 25622 + }, + { + "epoch": 2.02, + "learning_rate": 7.281651906147031e-05, + "loss": 1.4362, + "step": 25623 + }, + { + "epoch": 2.02, + "learning_rate": 7.280592140512894e-05, + "loss": 1.4789, + "step": 25624 + }, + { + "epoch": 2.02, + "learning_rate": 7.279532427289277e-05, + "loss": 1.497, + "step": 25625 + }, + { + "epoch": 2.02, + "learning_rate": 7.27847276648338e-05, + "loss": 1.481, + "step": 25626 + }, + { + "epoch": 2.02, + "learning_rate": 7.277413158102393e-05, + "loss": 1.4234, + "step": 25627 + }, + { + "epoch": 2.02, + "learning_rate": 7.276353602153501e-05, + "loss": 1.4565, + "step": 25628 + }, + { + "epoch": 2.02, + "learning_rate": 7.275294098643914e-05, + "loss": 1.4568, + "step": 25629 + }, + { + "epoch": 2.02, + "learning_rate": 7.274234647580814e-05, + "loss": 1.4679, + "step": 25630 + }, + { + "epoch": 2.02, + "learning_rate": 7.273175248971395e-05, + "loss": 1.3814, + "step": 25631 + }, + { + "epoch": 2.02, + "learning_rate": 7.272115902822857e-05, + "loss": 1.4777, + "step": 25632 + }, + { + "epoch": 2.02, + "learning_rate": 7.271056609142387e-05, + "loss": 1.4699, + "step": 25633 + }, + { + "epoch": 2.02, + "learning_rate": 7.26999736793717e-05, + "loss": 1.4173, + "step": 25634 + }, + { + "epoch": 2.02, + "learning_rate": 7.268938179214412e-05, + "loss": 1.4689, + "step": 25635 + }, + { + "epoch": 2.02, + "learning_rate": 7.267879042981299e-05, + "loss": 1.4427, + "step": 25636 + }, + { + "epoch": 2.02, + "learning_rate": 7.266819959245014e-05, + "loss": 1.4895, + "step": 25637 + }, + { + "epoch": 2.02, + "learning_rate": 7.265760928012758e-05, + "loss": 1.425, + "step": 25638 + }, + { + "epoch": 2.02, + "learning_rate": 7.264701949291718e-05, + "loss": 1.4569, + "step": 25639 + }, + { + "epoch": 2.02, + "learning_rate": 7.263643023089084e-05, + "loss": 1.4585, + "step": 25640 + }, + { + "epoch": 2.02, + "learning_rate": 7.262584149412032e-05, + "loss": 1.4744, + "step": 25641 + }, + { + "epoch": 2.02, + "learning_rate": 7.261525328267776e-05, + "loss": 1.4576, + "step": 25642 + }, + { + "epoch": 2.02, + "learning_rate": 7.260466559663492e-05, + "loss": 1.4322, + "step": 25643 + }, + { + "epoch": 2.02, + "learning_rate": 7.259407843606369e-05, + "loss": 1.4269, + "step": 25644 + }, + { + "epoch": 2.02, + "learning_rate": 7.25834918010359e-05, + "loss": 1.4392, + "step": 25645 + }, + { + "epoch": 2.02, + "learning_rate": 7.257290569162353e-05, + "loss": 1.4742, + "step": 25646 + }, + { + "epoch": 2.02, + "learning_rate": 7.256232010789841e-05, + "loss": 1.4805, + "step": 25647 + }, + { + "epoch": 2.02, + "learning_rate": 7.255173504993234e-05, + "loss": 1.4428, + "step": 25648 + }, + { + "epoch": 2.02, + "learning_rate": 7.254115051779729e-05, + "loss": 1.4694, + "step": 25649 + }, + { + "epoch": 2.02, + "learning_rate": 7.25305665115651e-05, + "loss": 1.5048, + "step": 25650 + }, + { + "epoch": 2.02, + "learning_rate": 7.251998303130756e-05, + "loss": 1.4405, + "step": 25651 + }, + { + "epoch": 2.02, + "learning_rate": 7.250940007709665e-05, + "loss": 1.4915, + "step": 25652 + }, + { + "epoch": 2.02, + "learning_rate": 7.249881764900412e-05, + "loss": 1.4996, + "step": 25653 + }, + { + "epoch": 2.02, + "learning_rate": 7.24882357471018e-05, + "loss": 1.496, + "step": 25654 + }, + { + "epoch": 2.02, + "learning_rate": 7.247765437146166e-05, + "loss": 1.4777, + "step": 25655 + }, + { + "epoch": 2.02, + "learning_rate": 7.246707352215545e-05, + "loss": 1.5003, + "step": 25656 + }, + { + "epoch": 2.02, + "learning_rate": 7.245649319925497e-05, + "loss": 1.4728, + "step": 25657 + }, + { + "epoch": 2.02, + "learning_rate": 7.244591340283209e-05, + "loss": 1.4705, + "step": 25658 + }, + { + "epoch": 2.02, + "learning_rate": 7.243533413295875e-05, + "loss": 1.472, + "step": 25659 + }, + { + "epoch": 2.02, + "learning_rate": 7.242475538970667e-05, + "loss": 1.4402, + "step": 25660 + }, + { + "epoch": 2.02, + "learning_rate": 7.241417717314764e-05, + "loss": 1.4634, + "step": 25661 + }, + { + "epoch": 2.02, + "learning_rate": 7.240359948335357e-05, + "loss": 1.4586, + "step": 25662 + }, + { + "epoch": 2.02, + "learning_rate": 7.239302232039626e-05, + "loss": 1.4711, + "step": 25663 + }, + { + "epoch": 2.02, + "learning_rate": 7.238244568434751e-05, + "loss": 1.4888, + "step": 25664 + }, + { + "epoch": 2.02, + "learning_rate": 7.237186957527904e-05, + "loss": 1.4524, + "step": 25665 + }, + { + "epoch": 2.02, + "learning_rate": 7.23612939932628e-05, + "loss": 1.4386, + "step": 25666 + }, + { + "epoch": 2.02, + "learning_rate": 7.235071893837054e-05, + "loss": 1.4343, + "step": 25667 + }, + { + "epoch": 2.02, + "learning_rate": 7.234014441067399e-05, + "loss": 1.4803, + "step": 25668 + }, + { + "epoch": 2.02, + "learning_rate": 7.232957041024506e-05, + "loss": 1.4943, + "step": 25669 + }, + { + "epoch": 2.02, + "learning_rate": 7.231899693715548e-05, + "loss": 1.4393, + "step": 25670 + }, + { + "epoch": 2.02, + "learning_rate": 7.230842399147698e-05, + "loss": 1.4388, + "step": 25671 + }, + { + "epoch": 2.02, + "learning_rate": 7.229785157328146e-05, + "loss": 1.4418, + "step": 25672 + }, + { + "epoch": 2.02, + "learning_rate": 7.228727968264061e-05, + "loss": 1.4973, + "step": 25673 + }, + { + "epoch": 2.02, + "learning_rate": 7.227670831962628e-05, + "loss": 1.4557, + "step": 25674 + }, + { + "epoch": 2.02, + "learning_rate": 7.226613748431017e-05, + "loss": 1.4187, + "step": 25675 + }, + { + "epoch": 2.02, + "learning_rate": 7.225556717676414e-05, + "loss": 1.4516, + "step": 25676 + }, + { + "epoch": 2.02, + "learning_rate": 7.22449973970599e-05, + "loss": 1.4773, + "step": 25677 + }, + { + "epoch": 2.02, + "learning_rate": 7.223442814526918e-05, + "loss": 1.4249, + "step": 25678 + }, + { + "epoch": 2.02, + "learning_rate": 7.222385942146382e-05, + "loss": 1.4939, + "step": 25679 + }, + { + "epoch": 2.02, + "learning_rate": 7.221329122571553e-05, + "loss": 1.4377, + "step": 25680 + }, + { + "epoch": 2.02, + "learning_rate": 7.220272355809609e-05, + "loss": 1.394, + "step": 25681 + }, + { + "epoch": 2.02, + "learning_rate": 7.219215641867714e-05, + "loss": 1.4579, + "step": 25682 + }, + { + "epoch": 2.02, + "learning_rate": 7.218158980753058e-05, + "loss": 1.4871, + "step": 25683 + }, + { + "epoch": 2.02, + "learning_rate": 7.217102372472807e-05, + "loss": 1.4623, + "step": 25684 + }, + { + "epoch": 2.02, + "learning_rate": 7.216045817034132e-05, + "loss": 1.5234, + "step": 25685 + }, + { + "epoch": 2.02, + "learning_rate": 7.214989314444216e-05, + "loss": 1.4961, + "step": 25686 + }, + { + "epoch": 2.02, + "learning_rate": 7.213932864710227e-05, + "loss": 1.4325, + "step": 25687 + }, + { + "epoch": 2.02, + "learning_rate": 7.21287646783933e-05, + "loss": 1.4412, + "step": 25688 + }, + { + "epoch": 2.02, + "learning_rate": 7.211820123838704e-05, + "loss": 1.4579, + "step": 25689 + }, + { + "epoch": 2.02, + "learning_rate": 7.210763832715527e-05, + "loss": 1.425, + "step": 25690 + }, + { + "epoch": 2.02, + "learning_rate": 7.209707594476966e-05, + "loss": 1.4707, + "step": 25691 + }, + { + "epoch": 2.02, + "learning_rate": 7.208651409130186e-05, + "loss": 1.5373, + "step": 25692 + }, + { + "epoch": 2.02, + "learning_rate": 7.20759527668237e-05, + "loss": 1.4229, + "step": 25693 + }, + { + "epoch": 2.02, + "learning_rate": 7.20653919714068e-05, + "loss": 1.4435, + "step": 25694 + }, + { + "epoch": 2.02, + "learning_rate": 7.205483170512283e-05, + "loss": 1.4316, + "step": 25695 + }, + { + "epoch": 2.02, + "learning_rate": 7.20442719680436e-05, + "loss": 1.4458, + "step": 25696 + }, + { + "epoch": 2.02, + "learning_rate": 7.203371276024074e-05, + "loss": 1.4264, + "step": 25697 + }, + { + "epoch": 2.02, + "learning_rate": 7.202315408178596e-05, + "loss": 1.4054, + "step": 25698 + }, + { + "epoch": 2.02, + "learning_rate": 7.201259593275085e-05, + "loss": 1.4303, + "step": 25699 + }, + { + "epoch": 2.02, + "learning_rate": 7.200203831320724e-05, + "loss": 1.5127, + "step": 25700 + }, + { + "epoch": 2.02, + "learning_rate": 7.199148122322675e-05, + "loss": 1.4888, + "step": 25701 + }, + { + "epoch": 2.02, + "learning_rate": 7.198092466288101e-05, + "loss": 1.4918, + "step": 25702 + }, + { + "epoch": 2.02, + "learning_rate": 7.197036863224177e-05, + "loss": 1.5063, + "step": 25703 + }, + { + "epoch": 2.02, + "learning_rate": 7.195981313138063e-05, + "loss": 1.4966, + "step": 25704 + }, + { + "epoch": 2.02, + "learning_rate": 7.194925816036934e-05, + "loss": 1.4378, + "step": 25705 + }, + { + "epoch": 2.02, + "learning_rate": 7.193870371927946e-05, + "loss": 1.4988, + "step": 25706 + }, + { + "epoch": 2.02, + "learning_rate": 7.192814980818277e-05, + "loss": 1.4091, + "step": 25707 + }, + { + "epoch": 2.02, + "learning_rate": 7.191759642715084e-05, + "loss": 1.496, + "step": 25708 + }, + { + "epoch": 2.02, + "learning_rate": 7.190704357625529e-05, + "loss": 1.4721, + "step": 25709 + }, + { + "epoch": 2.02, + "learning_rate": 7.189649125556789e-05, + "loss": 1.389, + "step": 25710 + }, + { + "epoch": 2.02, + "learning_rate": 7.18859394651602e-05, + "loss": 1.5081, + "step": 25711 + }, + { + "epoch": 2.02, + "learning_rate": 7.187538820510382e-05, + "loss": 1.4736, + "step": 25712 + }, + { + "epoch": 2.02, + "learning_rate": 7.186483747547048e-05, + "loss": 1.4592, + "step": 25713 + }, + { + "epoch": 2.02, + "learning_rate": 7.185428727633181e-05, + "loss": 1.5167, + "step": 25714 + }, + { + "epoch": 2.02, + "learning_rate": 7.184373760775939e-05, + "loss": 1.4446, + "step": 25715 + }, + { + "epoch": 2.02, + "learning_rate": 7.183318846982479e-05, + "loss": 1.4521, + "step": 25716 + }, + { + "epoch": 2.02, + "learning_rate": 7.182263986259979e-05, + "loss": 1.4538, + "step": 25717 + }, + { + "epoch": 2.02, + "learning_rate": 7.18120917861559e-05, + "loss": 1.487, + "step": 25718 + }, + { + "epoch": 2.02, + "learning_rate": 7.180154424056472e-05, + "loss": 1.4281, + "step": 25719 + }, + { + "epoch": 2.02, + "learning_rate": 7.179099722589789e-05, + "loss": 1.4646, + "step": 25720 + }, + { + "epoch": 2.02, + "learning_rate": 7.178045074222708e-05, + "loss": 1.419, + "step": 25721 + }, + { + "epoch": 2.02, + "learning_rate": 7.176990478962385e-05, + "loss": 1.4527, + "step": 25722 + }, + { + "epoch": 2.02, + "learning_rate": 7.175935936815974e-05, + "loss": 1.4221, + "step": 25723 + }, + { + "epoch": 2.02, + "learning_rate": 7.174881447790646e-05, + "loss": 1.4528, + "step": 25724 + }, + { + "epoch": 2.02, + "learning_rate": 7.173827011893554e-05, + "loss": 1.4695, + "step": 25725 + }, + { + "epoch": 2.02, + "learning_rate": 7.172772629131854e-05, + "loss": 1.4898, + "step": 25726 + }, + { + "epoch": 2.02, + "learning_rate": 7.171718299512713e-05, + "loss": 1.4519, + "step": 25727 + }, + { + "epoch": 2.02, + "learning_rate": 7.170664023043284e-05, + "loss": 1.4707, + "step": 25728 + }, + { + "epoch": 2.02, + "learning_rate": 7.169609799730722e-05, + "loss": 1.4918, + "step": 25729 + }, + { + "epoch": 2.02, + "learning_rate": 7.168555629582192e-05, + "loss": 1.4569, + "step": 25730 + }, + { + "epoch": 2.02, + "learning_rate": 7.167501512604848e-05, + "loss": 1.4614, + "step": 25731 + }, + { + "epoch": 2.02, + "learning_rate": 7.166447448805842e-05, + "loss": 1.4231, + "step": 25732 + }, + { + "epoch": 2.02, + "learning_rate": 7.165393438192338e-05, + "loss": 1.4738, + "step": 25733 + }, + { + "epoch": 2.02, + "learning_rate": 7.16433948077149e-05, + "loss": 1.4488, + "step": 25734 + }, + { + "epoch": 2.02, + "learning_rate": 7.163285576550449e-05, + "loss": 1.4623, + "step": 25735 + }, + { + "epoch": 2.02, + "learning_rate": 7.162231725536373e-05, + "loss": 1.4966, + "step": 25736 + }, + { + "epoch": 2.03, + "learning_rate": 7.161177927736423e-05, + "loss": 1.4131, + "step": 25737 + }, + { + "epoch": 2.03, + "learning_rate": 7.16012418315775e-05, + "loss": 1.454, + "step": 25738 + }, + { + "epoch": 2.03, + "learning_rate": 7.159070491807508e-05, + "loss": 1.4466, + "step": 25739 + }, + { + "epoch": 2.03, + "learning_rate": 7.158016853692845e-05, + "loss": 1.4596, + "step": 25740 + }, + { + "epoch": 2.03, + "learning_rate": 7.156963268820924e-05, + "loss": 1.4617, + "step": 25741 + }, + { + "epoch": 2.03, + "learning_rate": 7.155909737198895e-05, + "loss": 1.4635, + "step": 25742 + }, + { + "epoch": 2.03, + "learning_rate": 7.154856258833905e-05, + "loss": 1.4729, + "step": 25743 + }, + { + "epoch": 2.03, + "learning_rate": 7.153802833733117e-05, + "loss": 1.4537, + "step": 25744 + }, + { + "epoch": 2.03, + "learning_rate": 7.152749461903679e-05, + "loss": 1.4835, + "step": 25745 + }, + { + "epoch": 2.03, + "learning_rate": 7.151696143352734e-05, + "loss": 1.5135, + "step": 25746 + }, + { + "epoch": 2.03, + "learning_rate": 7.150642878087447e-05, + "loss": 1.3621, + "step": 25747 + }, + { + "epoch": 2.03, + "learning_rate": 7.149589666114965e-05, + "loss": 1.4953, + "step": 25748 + }, + { + "epoch": 2.03, + "learning_rate": 7.148536507442429e-05, + "loss": 1.4256, + "step": 25749 + }, + { + "epoch": 2.03, + "learning_rate": 7.147483402077004e-05, + "loss": 1.4808, + "step": 25750 + }, + { + "epoch": 2.03, + "learning_rate": 7.146430350025828e-05, + "loss": 1.4824, + "step": 25751 + }, + { + "epoch": 2.03, + "learning_rate": 7.145377351296061e-05, + "loss": 1.5191, + "step": 25752 + }, + { + "epoch": 2.03, + "learning_rate": 7.144324405894843e-05, + "loss": 1.4634, + "step": 25753 + }, + { + "epoch": 2.03, + "learning_rate": 7.143271513829331e-05, + "loss": 1.4244, + "step": 25754 + }, + { + "epoch": 2.03, + "learning_rate": 7.142218675106671e-05, + "loss": 1.4745, + "step": 25755 + }, + { + "epoch": 2.03, + "learning_rate": 7.14116588973401e-05, + "loss": 1.446, + "step": 25756 + }, + { + "epoch": 2.03, + "learning_rate": 7.14011315771849e-05, + "loss": 1.423, + "step": 25757 + }, + { + "epoch": 2.03, + "learning_rate": 7.139060479067268e-05, + "loss": 1.4625, + "step": 25758 + }, + { + "epoch": 2.03, + "learning_rate": 7.138007853787489e-05, + "loss": 1.4974, + "step": 25759 + }, + { + "epoch": 2.03, + "learning_rate": 7.136955281886293e-05, + "loss": 1.4551, + "step": 25760 + }, + { + "epoch": 2.03, + "learning_rate": 7.135902763370836e-05, + "loss": 1.432, + "step": 25761 + }, + { + "epoch": 2.03, + "learning_rate": 7.134850298248259e-05, + "loss": 1.5176, + "step": 25762 + }, + { + "epoch": 2.03, + "learning_rate": 7.133797886525705e-05, + "loss": 1.4797, + "step": 25763 + }, + { + "epoch": 2.03, + "learning_rate": 7.132745528210324e-05, + "loss": 1.4493, + "step": 25764 + }, + { + "epoch": 2.03, + "learning_rate": 7.131693223309262e-05, + "loss": 1.4894, + "step": 25765 + }, + { + "epoch": 2.03, + "learning_rate": 7.130640971829655e-05, + "loss": 1.447, + "step": 25766 + }, + { + "epoch": 2.03, + "learning_rate": 7.129588773778653e-05, + "loss": 1.4648, + "step": 25767 + }, + { + "epoch": 2.03, + "learning_rate": 7.128536629163406e-05, + "loss": 1.5388, + "step": 25768 + }, + { + "epoch": 2.03, + "learning_rate": 7.127484537991052e-05, + "loss": 1.444, + "step": 25769 + }, + { + "epoch": 2.03, + "learning_rate": 7.126432500268727e-05, + "loss": 1.4356, + "step": 25770 + }, + { + "epoch": 2.03, + "learning_rate": 7.125380516003586e-05, + "loss": 1.4558, + "step": 25771 + }, + { + "epoch": 2.03, + "learning_rate": 7.124328585202766e-05, + "loss": 1.5186, + "step": 25772 + }, + { + "epoch": 2.03, + "learning_rate": 7.123276707873403e-05, + "loss": 1.4155, + "step": 25773 + }, + { + "epoch": 2.03, + "learning_rate": 7.12222488402265e-05, + "loss": 1.411, + "step": 25774 + }, + { + "epoch": 2.03, + "learning_rate": 7.121173113657642e-05, + "loss": 1.4707, + "step": 25775 + }, + { + "epoch": 2.03, + "learning_rate": 7.12012139678552e-05, + "loss": 1.4687, + "step": 25776 + }, + { + "epoch": 2.03, + "learning_rate": 7.119069733413422e-05, + "loss": 1.451, + "step": 25777 + }, + { + "epoch": 2.03, + "learning_rate": 7.118018123548495e-05, + "loss": 1.4244, + "step": 25778 + }, + { + "epoch": 2.03, + "learning_rate": 7.116966567197877e-05, + "loss": 1.5051, + "step": 25779 + }, + { + "epoch": 2.03, + "learning_rate": 7.1159150643687e-05, + "loss": 1.5087, + "step": 25780 + }, + { + "epoch": 2.03, + "learning_rate": 7.114863615068114e-05, + "loss": 1.4448, + "step": 25781 + }, + { + "epoch": 2.03, + "learning_rate": 7.113812219303252e-05, + "loss": 1.4472, + "step": 25782 + }, + { + "epoch": 2.03, + "learning_rate": 7.112760877081247e-05, + "loss": 1.4368, + "step": 25783 + }, + { + "epoch": 2.03, + "learning_rate": 7.111709588409244e-05, + "loss": 1.4193, + "step": 25784 + }, + { + "epoch": 2.03, + "learning_rate": 7.110658353294388e-05, + "loss": 1.4459, + "step": 25785 + }, + { + "epoch": 2.03, + "learning_rate": 7.109607171743806e-05, + "loss": 1.4799, + "step": 25786 + }, + { + "epoch": 2.03, + "learning_rate": 7.10855604376463e-05, + "loss": 1.4149, + "step": 25787 + }, + { + "epoch": 2.03, + "learning_rate": 7.107504969364009e-05, + "loss": 1.4941, + "step": 25788 + }, + { + "epoch": 2.03, + "learning_rate": 7.106453948549077e-05, + "loss": 1.4078, + "step": 25789 + }, + { + "epoch": 2.03, + "learning_rate": 7.10540298132696e-05, + "loss": 1.4309, + "step": 25790 + }, + { + "epoch": 2.03, + "learning_rate": 7.104352067704804e-05, + "loss": 1.4502, + "step": 25791 + }, + { + "epoch": 2.03, + "learning_rate": 7.103301207689742e-05, + "loss": 1.4461, + "step": 25792 + }, + { + "epoch": 2.03, + "learning_rate": 7.102250401288905e-05, + "loss": 1.4533, + "step": 25793 + }, + { + "epoch": 2.03, + "learning_rate": 7.101199648509424e-05, + "loss": 1.4454, + "step": 25794 + }, + { + "epoch": 2.03, + "learning_rate": 7.100148949358448e-05, + "loss": 1.4757, + "step": 25795 + }, + { + "epoch": 2.03, + "learning_rate": 7.099098303843098e-05, + "loss": 1.4924, + "step": 25796 + }, + { + "epoch": 2.03, + "learning_rate": 7.098047711970505e-05, + "loss": 1.4486, + "step": 25797 + }, + { + "epoch": 2.03, + "learning_rate": 7.096997173747806e-05, + "loss": 1.4792, + "step": 25798 + }, + { + "epoch": 2.03, + "learning_rate": 7.095946689182142e-05, + "loss": 1.4257, + "step": 25799 + }, + { + "epoch": 2.03, + "learning_rate": 7.094896258280639e-05, + "loss": 1.4877, + "step": 25800 + }, + { + "epoch": 2.03, + "learning_rate": 7.093845881050421e-05, + "loss": 1.4687, + "step": 25801 + }, + { + "epoch": 2.03, + "learning_rate": 7.092795557498633e-05, + "loss": 1.4544, + "step": 25802 + }, + { + "epoch": 2.03, + "learning_rate": 7.0917452876324e-05, + "loss": 1.4807, + "step": 25803 + }, + { + "epoch": 2.03, + "learning_rate": 7.090695071458845e-05, + "loss": 1.4266, + "step": 25804 + }, + { + "epoch": 2.03, + "learning_rate": 7.089644908985114e-05, + "loss": 1.4569, + "step": 25805 + }, + { + "epoch": 2.03, + "learning_rate": 7.088594800218327e-05, + "loss": 1.462, + "step": 25806 + }, + { + "epoch": 2.03, + "learning_rate": 7.087544745165609e-05, + "loss": 1.4559, + "step": 25807 + }, + { + "epoch": 2.03, + "learning_rate": 7.086494743834104e-05, + "loss": 1.4754, + "step": 25808 + }, + { + "epoch": 2.03, + "learning_rate": 7.08544479623093e-05, + "loss": 1.4533, + "step": 25809 + }, + { + "epoch": 2.03, + "learning_rate": 7.084394902363221e-05, + "loss": 1.4153, + "step": 25810 + }, + { + "epoch": 2.03, + "learning_rate": 7.083345062238093e-05, + "loss": 1.4445, + "step": 25811 + }, + { + "epoch": 2.03, + "learning_rate": 7.082295275862691e-05, + "loss": 1.4847, + "step": 25812 + }, + { + "epoch": 2.03, + "learning_rate": 7.081245543244137e-05, + "loss": 1.4387, + "step": 25813 + }, + { + "epoch": 2.03, + "learning_rate": 7.080195864389547e-05, + "loss": 1.463, + "step": 25814 + }, + { + "epoch": 2.03, + "learning_rate": 7.079146239306057e-05, + "loss": 1.474, + "step": 25815 + }, + { + "epoch": 2.03, + "learning_rate": 7.078096668000798e-05, + "loss": 1.4346, + "step": 25816 + }, + { + "epoch": 2.03, + "learning_rate": 7.077047150480893e-05, + "loss": 1.497, + "step": 25817 + }, + { + "epoch": 2.03, + "learning_rate": 7.075997686753458e-05, + "loss": 1.4808, + "step": 25818 + }, + { + "epoch": 2.03, + "learning_rate": 7.074948276825633e-05, + "loss": 1.5102, + "step": 25819 + }, + { + "epoch": 2.03, + "learning_rate": 7.073898920704536e-05, + "loss": 1.4362, + "step": 25820 + }, + { + "epoch": 2.03, + "learning_rate": 7.072849618397285e-05, + "loss": 1.4353, + "step": 25821 + }, + { + "epoch": 2.03, + "learning_rate": 7.071800369911016e-05, + "loss": 1.4673, + "step": 25822 + }, + { + "epoch": 2.03, + "learning_rate": 7.070751175252847e-05, + "loss": 1.4632, + "step": 25823 + }, + { + "epoch": 2.03, + "learning_rate": 7.069702034429898e-05, + "loss": 1.4466, + "step": 25824 + }, + { + "epoch": 2.03, + "learning_rate": 7.0686529474493e-05, + "loss": 1.4933, + "step": 25825 + }, + { + "epoch": 2.03, + "learning_rate": 7.067603914318171e-05, + "loss": 1.4707, + "step": 25826 + }, + { + "epoch": 2.03, + "learning_rate": 7.066554935043629e-05, + "loss": 1.4303, + "step": 25827 + }, + { + "epoch": 2.03, + "learning_rate": 7.065506009632807e-05, + "loss": 1.4154, + "step": 25828 + }, + { + "epoch": 2.03, + "learning_rate": 7.06445713809282e-05, + "loss": 1.4603, + "step": 25829 + }, + { + "epoch": 2.03, + "learning_rate": 7.063408320430784e-05, + "loss": 1.4538, + "step": 25830 + }, + { + "epoch": 2.03, + "learning_rate": 7.062359556653827e-05, + "loss": 1.4736, + "step": 25831 + }, + { + "epoch": 2.03, + "learning_rate": 7.061310846769073e-05, + "loss": 1.4753, + "step": 25832 + }, + { + "epoch": 2.03, + "learning_rate": 7.060262190783637e-05, + "loss": 1.4381, + "step": 25833 + }, + { + "epoch": 2.03, + "learning_rate": 7.059213588704641e-05, + "loss": 1.4244, + "step": 25834 + }, + { + "epoch": 2.03, + "learning_rate": 7.058165040539195e-05, + "loss": 1.4805, + "step": 25835 + }, + { + "epoch": 2.03, + "learning_rate": 7.057116546294432e-05, + "loss": 1.4427, + "step": 25836 + }, + { + "epoch": 2.03, + "learning_rate": 7.056068105977465e-05, + "loss": 1.4446, + "step": 25837 + }, + { + "epoch": 2.03, + "learning_rate": 7.055019719595404e-05, + "loss": 1.4871, + "step": 25838 + }, + { + "epoch": 2.03, + "learning_rate": 7.053971387155383e-05, + "loss": 1.3956, + "step": 25839 + }, + { + "epoch": 2.03, + "learning_rate": 7.052923108664511e-05, + "loss": 1.4673, + "step": 25840 + }, + { + "epoch": 2.03, + "learning_rate": 7.051874884129899e-05, + "loss": 1.4426, + "step": 25841 + }, + { + "epoch": 2.03, + "learning_rate": 7.050826713558676e-05, + "loss": 1.4426, + "step": 25842 + }, + { + "epoch": 2.03, + "learning_rate": 7.049778596957954e-05, + "loss": 1.4311, + "step": 25843 + }, + { + "epoch": 2.03, + "learning_rate": 7.048730534334842e-05, + "loss": 1.529, + "step": 25844 + }, + { + "epoch": 2.03, + "learning_rate": 7.047682525696459e-05, + "loss": 1.4293, + "step": 25845 + }, + { + "epoch": 2.03, + "learning_rate": 7.046634571049933e-05, + "loss": 1.4347, + "step": 25846 + }, + { + "epoch": 2.03, + "learning_rate": 7.045586670402366e-05, + "loss": 1.4747, + "step": 25847 + }, + { + "epoch": 2.03, + "learning_rate": 7.044538823760872e-05, + "loss": 1.4982, + "step": 25848 + }, + { + "epoch": 2.03, + "learning_rate": 7.043491031132575e-05, + "loss": 1.4841, + "step": 25849 + }, + { + "epoch": 2.03, + "learning_rate": 7.042443292524583e-05, + "loss": 1.5321, + "step": 25850 + }, + { + "epoch": 2.03, + "learning_rate": 7.041395607944008e-05, + "loss": 1.4863, + "step": 25851 + }, + { + "epoch": 2.03, + "learning_rate": 7.040347977397962e-05, + "loss": 1.5371, + "step": 25852 + }, + { + "epoch": 2.03, + "learning_rate": 7.039300400893564e-05, + "loss": 1.4591, + "step": 25853 + }, + { + "epoch": 2.03, + "learning_rate": 7.038252878437923e-05, + "loss": 1.4261, + "step": 25854 + }, + { + "epoch": 2.03, + "learning_rate": 7.037205410038148e-05, + "loss": 1.4262, + "step": 25855 + }, + { + "epoch": 2.03, + "learning_rate": 7.036157995701358e-05, + "loss": 1.4151, + "step": 25856 + }, + { + "epoch": 2.03, + "learning_rate": 7.035110635434661e-05, + "loss": 1.4823, + "step": 25857 + }, + { + "epoch": 2.03, + "learning_rate": 7.034063329245162e-05, + "loss": 1.4545, + "step": 25858 + }, + { + "epoch": 2.03, + "learning_rate": 7.033016077139981e-05, + "loss": 1.408, + "step": 25859 + }, + { + "epoch": 2.03, + "learning_rate": 7.031968879126227e-05, + "loss": 1.4441, + "step": 25860 + }, + { + "epoch": 2.03, + "learning_rate": 7.030921735210999e-05, + "loss": 1.453, + "step": 25861 + }, + { + "epoch": 2.03, + "learning_rate": 7.029874645401417e-05, + "loss": 1.4474, + "step": 25862 + }, + { + "epoch": 2.03, + "learning_rate": 7.028827609704593e-05, + "loss": 1.431, + "step": 25863 + }, + { + "epoch": 2.04, + "learning_rate": 7.027780628127629e-05, + "loss": 1.4708, + "step": 25864 + }, + { + "epoch": 2.04, + "learning_rate": 7.02673370067763e-05, + "loss": 1.5013, + "step": 25865 + }, + { + "epoch": 2.04, + "learning_rate": 7.025686827361716e-05, + "loss": 1.4712, + "step": 25866 + }, + { + "epoch": 2.04, + "learning_rate": 7.024640008186987e-05, + "loss": 1.5144, + "step": 25867 + }, + { + "epoch": 2.04, + "learning_rate": 7.023593243160551e-05, + "loss": 1.4648, + "step": 25868 + }, + { + "epoch": 2.04, + "learning_rate": 7.02254653228951e-05, + "loss": 1.5248, + "step": 25869 + }, + { + "epoch": 2.04, + "learning_rate": 7.02149987558098e-05, + "loss": 1.4961, + "step": 25870 + }, + { + "epoch": 2.04, + "learning_rate": 7.020453273042066e-05, + "loss": 1.4297, + "step": 25871 + }, + { + "epoch": 2.04, + "learning_rate": 7.019406724679862e-05, + "loss": 1.4886, + "step": 25872 + }, + { + "epoch": 2.04, + "learning_rate": 7.018360230501489e-05, + "loss": 1.5233, + "step": 25873 + }, + { + "epoch": 2.04, + "learning_rate": 7.017313790514047e-05, + "loss": 1.4394, + "step": 25874 + }, + { + "epoch": 2.04, + "learning_rate": 7.01626740472463e-05, + "loss": 1.4879, + "step": 25875 + }, + { + "epoch": 2.04, + "learning_rate": 7.01522107314036e-05, + "loss": 1.4279, + "step": 25876 + }, + { + "epoch": 2.04, + "learning_rate": 7.014174795768328e-05, + "loss": 1.4875, + "step": 25877 + }, + { + "epoch": 2.04, + "learning_rate": 7.013128572615645e-05, + "loss": 1.4773, + "step": 25878 + }, + { + "epoch": 2.04, + "learning_rate": 7.012082403689407e-05, + "loss": 1.4004, + "step": 25879 + }, + { + "epoch": 2.04, + "learning_rate": 7.011036288996728e-05, + "loss": 1.4564, + "step": 25880 + }, + { + "epoch": 2.04, + "learning_rate": 7.009990228544702e-05, + "loss": 1.4713, + "step": 25881 + }, + { + "epoch": 2.04, + "learning_rate": 7.008944222340427e-05, + "loss": 1.419, + "step": 25882 + }, + { + "epoch": 2.04, + "learning_rate": 7.007898270391019e-05, + "loss": 1.4995, + "step": 25883 + }, + { + "epoch": 2.04, + "learning_rate": 7.006852372703569e-05, + "loss": 1.451, + "step": 25884 + }, + { + "epoch": 2.04, + "learning_rate": 7.005806529285177e-05, + "loss": 1.4245, + "step": 25885 + }, + { + "epoch": 2.04, + "learning_rate": 7.00476074014295e-05, + "loss": 1.4836, + "step": 25886 + }, + { + "epoch": 2.04, + "learning_rate": 7.003715005283988e-05, + "loss": 1.4111, + "step": 25887 + }, + { + "epoch": 2.04, + "learning_rate": 7.002669324715388e-05, + "loss": 1.4511, + "step": 25888 + }, + { + "epoch": 2.04, + "learning_rate": 7.001623698444243e-05, + "loss": 1.4586, + "step": 25889 + }, + { + "epoch": 2.04, + "learning_rate": 7.000578126477667e-05, + "loss": 1.4734, + "step": 25890 + }, + { + "epoch": 2.04, + "learning_rate": 6.99953260882275e-05, + "loss": 1.4517, + "step": 25891 + }, + { + "epoch": 2.04, + "learning_rate": 6.998487145486584e-05, + "loss": 1.4721, + "step": 25892 + }, + { + "epoch": 2.04, + "learning_rate": 6.997441736476278e-05, + "loss": 1.4777, + "step": 25893 + }, + { + "epoch": 2.04, + "learning_rate": 6.996396381798931e-05, + "loss": 1.4753, + "step": 25894 + }, + { + "epoch": 2.04, + "learning_rate": 6.995351081461634e-05, + "loss": 1.4614, + "step": 25895 + }, + { + "epoch": 2.04, + "learning_rate": 6.994305835471481e-05, + "loss": 1.4342, + "step": 25896 + }, + { + "epoch": 2.04, + "learning_rate": 6.99326064383558e-05, + "loss": 1.4547, + "step": 25897 + }, + { + "epoch": 2.04, + "learning_rate": 6.99221550656102e-05, + "loss": 1.4338, + "step": 25898 + }, + { + "epoch": 2.04, + "learning_rate": 6.991170423654892e-05, + "loss": 1.4117, + "step": 25899 + }, + { + "epoch": 2.04, + "learning_rate": 6.990125395124303e-05, + "loss": 1.4281, + "step": 25900 + }, + { + "epoch": 2.04, + "learning_rate": 6.989080420976344e-05, + "loss": 1.4132, + "step": 25901 + }, + { + "epoch": 2.04, + "learning_rate": 6.9880355012181e-05, + "loss": 1.483, + "step": 25902 + }, + { + "epoch": 2.04, + "learning_rate": 6.98699063585668e-05, + "loss": 1.3947, + "step": 25903 + }, + { + "epoch": 2.04, + "learning_rate": 6.985945824899173e-05, + "loss": 1.4025, + "step": 25904 + }, + { + "epoch": 2.04, + "learning_rate": 6.98490106835267e-05, + "loss": 1.4375, + "step": 25905 + }, + { + "epoch": 2.04, + "learning_rate": 6.983856366224259e-05, + "loss": 1.463, + "step": 25906 + }, + { + "epoch": 2.04, + "learning_rate": 6.982811718521047e-05, + "loss": 1.4547, + "step": 25907 + }, + { + "epoch": 2.04, + "learning_rate": 6.981767125250113e-05, + "loss": 1.4573, + "step": 25908 + }, + { + "epoch": 2.04, + "learning_rate": 6.980722586418562e-05, + "loss": 1.4404, + "step": 25909 + }, + { + "epoch": 2.04, + "learning_rate": 6.979678102033472e-05, + "loss": 1.4776, + "step": 25910 + }, + { + "epoch": 2.04, + "learning_rate": 6.978633672101947e-05, + "loss": 1.5457, + "step": 25911 + }, + { + "epoch": 2.04, + "learning_rate": 6.977589296631075e-05, + "loss": 1.4307, + "step": 25912 + }, + { + "epoch": 2.04, + "learning_rate": 6.976544975627937e-05, + "loss": 1.4529, + "step": 25913 + }, + { + "epoch": 2.04, + "learning_rate": 6.975500709099638e-05, + "loss": 1.474, + "step": 25914 + }, + { + "epoch": 2.04, + "learning_rate": 6.974456497053258e-05, + "loss": 1.4807, + "step": 25915 + }, + { + "epoch": 2.04, + "learning_rate": 6.973412339495886e-05, + "loss": 1.4945, + "step": 25916 + }, + { + "epoch": 2.04, + "learning_rate": 6.972368236434622e-05, + "loss": 1.4763, + "step": 25917 + }, + { + "epoch": 2.04, + "learning_rate": 6.971324187876546e-05, + "loss": 1.4748, + "step": 25918 + }, + { + "epoch": 2.04, + "learning_rate": 6.970280193828743e-05, + "loss": 1.4539, + "step": 25919 + }, + { + "epoch": 2.04, + "learning_rate": 6.969236254298311e-05, + "loss": 1.4525, + "step": 25920 + }, + { + "epoch": 2.04, + "learning_rate": 6.968192369292334e-05, + "loss": 1.4736, + "step": 25921 + }, + { + "epoch": 2.04, + "learning_rate": 6.967148538817898e-05, + "loss": 1.3753, + "step": 25922 + }, + { + "epoch": 2.04, + "learning_rate": 6.966104762882085e-05, + "loss": 1.4326, + "step": 25923 + }, + { + "epoch": 2.04, + "learning_rate": 6.965061041491988e-05, + "loss": 1.4566, + "step": 25924 + }, + { + "epoch": 2.04, + "learning_rate": 6.964017374654697e-05, + "loss": 1.4421, + "step": 25925 + }, + { + "epoch": 2.04, + "learning_rate": 6.962973762377287e-05, + "loss": 1.4685, + "step": 25926 + }, + { + "epoch": 2.04, + "learning_rate": 6.961930204666857e-05, + "loss": 1.4538, + "step": 25927 + }, + { + "epoch": 2.04, + "learning_rate": 6.960886701530486e-05, + "loss": 1.5333, + "step": 25928 + }, + { + "epoch": 2.04, + "learning_rate": 6.959843252975255e-05, + "loss": 1.4297, + "step": 25929 + }, + { + "epoch": 2.04, + "learning_rate": 6.95879985900825e-05, + "loss": 1.5036, + "step": 25930 + }, + { + "epoch": 2.04, + "learning_rate": 6.957756519636558e-05, + "loss": 1.4404, + "step": 25931 + }, + { + "epoch": 2.04, + "learning_rate": 6.956713234867262e-05, + "loss": 1.4683, + "step": 25932 + }, + { + "epoch": 2.04, + "learning_rate": 6.955670004707441e-05, + "loss": 1.4834, + "step": 25933 + }, + { + "epoch": 2.04, + "learning_rate": 6.954626829164186e-05, + "loss": 1.4481, + "step": 25934 + }, + { + "epoch": 2.04, + "learning_rate": 6.953583708244574e-05, + "loss": 1.4471, + "step": 25935 + }, + { + "epoch": 2.04, + "learning_rate": 6.952540641955685e-05, + "loss": 1.4258, + "step": 25936 + }, + { + "epoch": 2.04, + "learning_rate": 6.951497630304607e-05, + "loss": 1.4187, + "step": 25937 + }, + { + "epoch": 2.04, + "learning_rate": 6.95045467329842e-05, + "loss": 1.4567, + "step": 25938 + }, + { + "epoch": 2.04, + "learning_rate": 6.949411770944197e-05, + "loss": 1.4294, + "step": 25939 + }, + { + "epoch": 2.04, + "learning_rate": 6.948368923249025e-05, + "loss": 1.4855, + "step": 25940 + }, + { + "epoch": 2.04, + "learning_rate": 6.947326130219992e-05, + "loss": 1.4653, + "step": 25941 + }, + { + "epoch": 2.04, + "learning_rate": 6.946283391864171e-05, + "loss": 1.4652, + "step": 25942 + }, + { + "epoch": 2.04, + "learning_rate": 6.945240708188635e-05, + "loss": 1.388, + "step": 25943 + }, + { + "epoch": 2.04, + "learning_rate": 6.944198079200474e-05, + "loss": 1.4378, + "step": 25944 + }, + { + "epoch": 2.04, + "learning_rate": 6.943155504906764e-05, + "loss": 1.4289, + "step": 25945 + }, + { + "epoch": 2.04, + "learning_rate": 6.942112985314581e-05, + "loss": 1.4965, + "step": 25946 + }, + { + "epoch": 2.04, + "learning_rate": 6.941070520431e-05, + "loss": 1.4624, + "step": 25947 + }, + { + "epoch": 2.04, + "learning_rate": 6.940028110263109e-05, + "loss": 1.4134, + "step": 25948 + }, + { + "epoch": 2.04, + "learning_rate": 6.938985754817977e-05, + "loss": 1.4507, + "step": 25949 + }, + { + "epoch": 2.04, + "learning_rate": 6.937943454102678e-05, + "loss": 1.4811, + "step": 25950 + }, + { + "epoch": 2.04, + "learning_rate": 6.9369012081243e-05, + "loss": 1.4628, + "step": 25951 + }, + { + "epoch": 2.04, + "learning_rate": 6.935859016889914e-05, + "loss": 1.4481, + "step": 25952 + }, + { + "epoch": 2.04, + "learning_rate": 6.934816880406587e-05, + "loss": 1.4468, + "step": 25953 + }, + { + "epoch": 2.04, + "learning_rate": 6.933774798681412e-05, + "loss": 1.4927, + "step": 25954 + }, + { + "epoch": 2.04, + "learning_rate": 6.932732771721446e-05, + "loss": 1.4827, + "step": 25955 + }, + { + "epoch": 2.04, + "learning_rate": 6.93169079953378e-05, + "loss": 1.4873, + "step": 25956 + }, + { + "epoch": 2.04, + "learning_rate": 6.930648882125476e-05, + "loss": 1.4484, + "step": 25957 + }, + { + "epoch": 2.04, + "learning_rate": 6.929607019503617e-05, + "loss": 1.4411, + "step": 25958 + }, + { + "epoch": 2.04, + "learning_rate": 6.928565211675273e-05, + "loss": 1.4413, + "step": 25959 + }, + { + "epoch": 2.04, + "learning_rate": 6.927523458647513e-05, + "loss": 1.4456, + "step": 25960 + }, + { + "epoch": 2.04, + "learning_rate": 6.926481760427417e-05, + "loss": 1.4398, + "step": 25961 + }, + { + "epoch": 2.04, + "learning_rate": 6.925440117022056e-05, + "loss": 1.4681, + "step": 25962 + }, + { + "epoch": 2.04, + "learning_rate": 6.924398528438499e-05, + "loss": 1.4609, + "step": 25963 + }, + { + "epoch": 2.04, + "learning_rate": 6.923356994683816e-05, + "loss": 1.4286, + "step": 25964 + }, + { + "epoch": 2.04, + "learning_rate": 6.922315515765087e-05, + "loss": 1.4647, + "step": 25965 + }, + { + "epoch": 2.04, + "learning_rate": 6.921274091689378e-05, + "loss": 1.451, + "step": 25966 + }, + { + "epoch": 2.04, + "learning_rate": 6.920232722463756e-05, + "loss": 1.466, + "step": 25967 + }, + { + "epoch": 2.04, + "learning_rate": 6.919191408095297e-05, + "loss": 1.4741, + "step": 25968 + }, + { + "epoch": 2.04, + "learning_rate": 6.91815014859107e-05, + "loss": 1.4352, + "step": 25969 + }, + { + "epoch": 2.04, + "learning_rate": 6.917108943958138e-05, + "loss": 1.5035, + "step": 25970 + }, + { + "epoch": 2.04, + "learning_rate": 6.916067794203578e-05, + "loss": 1.4443, + "step": 25971 + }, + { + "epoch": 2.04, + "learning_rate": 6.91502669933446e-05, + "loss": 1.4853, + "step": 25972 + }, + { + "epoch": 2.04, + "learning_rate": 6.91398565935785e-05, + "loss": 1.4508, + "step": 25973 + }, + { + "epoch": 2.04, + "learning_rate": 6.912944674280808e-05, + "loss": 1.5069, + "step": 25974 + }, + { + "epoch": 2.04, + "learning_rate": 6.911903744110417e-05, + "loss": 1.4136, + "step": 25975 + }, + { + "epoch": 2.04, + "learning_rate": 6.910862868853735e-05, + "loss": 1.4467, + "step": 25976 + }, + { + "epoch": 2.04, + "learning_rate": 6.909822048517823e-05, + "loss": 1.4702, + "step": 25977 + }, + { + "epoch": 2.04, + "learning_rate": 6.908781283109762e-05, + "loss": 1.4706, + "step": 25978 + }, + { + "epoch": 2.04, + "learning_rate": 6.907740572636611e-05, + "loss": 1.4211, + "step": 25979 + }, + { + "epoch": 2.04, + "learning_rate": 6.906699917105434e-05, + "loss": 1.4809, + "step": 25980 + }, + { + "epoch": 2.04, + "learning_rate": 6.905659316523295e-05, + "loss": 1.4667, + "step": 25981 + }, + { + "epoch": 2.04, + "learning_rate": 6.904618770897269e-05, + "loss": 1.4962, + "step": 25982 + }, + { + "epoch": 2.04, + "learning_rate": 6.903578280234411e-05, + "loss": 1.4829, + "step": 25983 + }, + { + "epoch": 2.04, + "learning_rate": 6.902537844541785e-05, + "loss": 1.4471, + "step": 25984 + }, + { + "epoch": 2.04, + "learning_rate": 6.901497463826464e-05, + "loss": 1.4845, + "step": 25985 + }, + { + "epoch": 2.04, + "learning_rate": 6.900457138095505e-05, + "loss": 1.4566, + "step": 25986 + }, + { + "epoch": 2.04, + "learning_rate": 6.899416867355967e-05, + "loss": 1.4978, + "step": 25987 + }, + { + "epoch": 2.04, + "learning_rate": 6.898376651614918e-05, + "loss": 1.4773, + "step": 25988 + }, + { + "epoch": 2.04, + "learning_rate": 6.897336490879428e-05, + "loss": 1.4773, + "step": 25989 + }, + { + "epoch": 2.04, + "learning_rate": 6.89629638515655e-05, + "loss": 1.4775, + "step": 25990 + }, + { + "epoch": 2.05, + "learning_rate": 6.895256334453343e-05, + "loss": 1.4786, + "step": 25991 + }, + { + "epoch": 2.05, + "learning_rate": 6.894216338776877e-05, + "loss": 1.4518, + "step": 25992 + }, + { + "epoch": 2.05, + "learning_rate": 6.89317639813421e-05, + "loss": 1.4121, + "step": 25993 + }, + { + "epoch": 2.05, + "learning_rate": 6.892136512532396e-05, + "loss": 1.425, + "step": 25994 + }, + { + "epoch": 2.05, + "learning_rate": 6.891096681978507e-05, + "loss": 1.3908, + "step": 25995 + }, + { + "epoch": 2.05, + "learning_rate": 6.890056906479596e-05, + "loss": 1.4114, + "step": 25996 + }, + { + "epoch": 2.05, + "learning_rate": 6.889017186042717e-05, + "loss": 1.4256, + "step": 25997 + }, + { + "epoch": 2.05, + "learning_rate": 6.887977520674941e-05, + "loss": 1.4239, + "step": 25998 + }, + { + "epoch": 2.05, + "learning_rate": 6.886937910383323e-05, + "loss": 1.4334, + "step": 25999 + }, + { + "epoch": 2.05, + "learning_rate": 6.885898355174917e-05, + "loss": 1.5033, + "step": 26000 + }, + { + "epoch": 2.05, + "learning_rate": 6.884858855056777e-05, + "loss": 1.454, + "step": 26001 + }, + { + "epoch": 2.05, + "learning_rate": 6.883819410035976e-05, + "loss": 1.5267, + "step": 26002 + }, + { + "epoch": 2.05, + "learning_rate": 6.882780020119554e-05, + "loss": 1.5105, + "step": 26003 + }, + { + "epoch": 2.05, + "learning_rate": 6.881740685314583e-05, + "loss": 1.4872, + "step": 26004 + }, + { + "epoch": 2.05, + "learning_rate": 6.880701405628108e-05, + "loss": 1.4407, + "step": 26005 + }, + { + "epoch": 2.05, + "learning_rate": 6.879662181067193e-05, + "loss": 1.4771, + "step": 26006 + }, + { + "epoch": 2.05, + "learning_rate": 6.878623011638893e-05, + "loss": 1.4005, + "step": 26007 + }, + { + "epoch": 2.05, + "learning_rate": 6.877583897350255e-05, + "loss": 1.4257, + "step": 26008 + }, + { + "epoch": 2.05, + "learning_rate": 6.876544838208344e-05, + "loss": 1.4975, + "step": 26009 + }, + { + "epoch": 2.05, + "learning_rate": 6.875505834220212e-05, + "loss": 1.4794, + "step": 26010 + }, + { + "epoch": 2.05, + "learning_rate": 6.874466885392907e-05, + "loss": 1.4662, + "step": 26011 + }, + { + "epoch": 2.05, + "learning_rate": 6.873427991733493e-05, + "loss": 1.5118, + "step": 26012 + }, + { + "epoch": 2.05, + "learning_rate": 6.872389153249017e-05, + "loss": 1.4034, + "step": 26013 + }, + { + "epoch": 2.05, + "learning_rate": 6.87135036994653e-05, + "loss": 1.5283, + "step": 26014 + }, + { + "epoch": 2.05, + "learning_rate": 6.870311641833092e-05, + "loss": 1.4087, + "step": 26015 + }, + { + "epoch": 2.05, + "learning_rate": 6.869272968915751e-05, + "loss": 1.4688, + "step": 26016 + }, + { + "epoch": 2.05, + "learning_rate": 6.868234351201562e-05, + "loss": 1.4331, + "step": 26017 + }, + { + "epoch": 2.05, + "learning_rate": 6.86719578869756e-05, + "loss": 1.4642, + "step": 26018 + }, + { + "epoch": 2.05, + "learning_rate": 6.866157281410825e-05, + "loss": 1.465, + "step": 26019 + }, + { + "epoch": 2.05, + "learning_rate": 6.865118829348392e-05, + "loss": 1.445, + "step": 26020 + }, + { + "epoch": 2.05, + "learning_rate": 6.864080432517312e-05, + "loss": 1.4197, + "step": 26021 + }, + { + "epoch": 2.05, + "learning_rate": 6.863042090924633e-05, + "loss": 1.4199, + "step": 26022 + }, + { + "epoch": 2.05, + "learning_rate": 6.862003804577411e-05, + "loss": 1.5118, + "step": 26023 + }, + { + "epoch": 2.05, + "learning_rate": 6.860965573482693e-05, + "loss": 1.4164, + "step": 26024 + }, + { + "epoch": 2.05, + "learning_rate": 6.859927397647521e-05, + "loss": 1.4334, + "step": 26025 + }, + { + "epoch": 2.05, + "learning_rate": 6.858889277078959e-05, + "loss": 1.4825, + "step": 26026 + }, + { + "epoch": 2.05, + "learning_rate": 6.857851211784042e-05, + "loss": 1.4575, + "step": 26027 + }, + { + "epoch": 2.05, + "learning_rate": 6.856813201769818e-05, + "loss": 1.4577, + "step": 26028 + }, + { + "epoch": 2.05, + "learning_rate": 6.855775247043344e-05, + "loss": 1.4431, + "step": 26029 + }, + { + "epoch": 2.05, + "learning_rate": 6.854737347611662e-05, + "loss": 1.434, + "step": 26030 + }, + { + "epoch": 2.05, + "learning_rate": 6.853699503481813e-05, + "loss": 1.481, + "step": 26031 + }, + { + "epoch": 2.05, + "learning_rate": 6.852661714660854e-05, + "loss": 1.4533, + "step": 26032 + }, + { + "epoch": 2.05, + "learning_rate": 6.851623981155826e-05, + "loss": 1.4426, + "step": 26033 + }, + { + "epoch": 2.05, + "learning_rate": 6.85058630297377e-05, + "loss": 1.4354, + "step": 26034 + }, + { + "epoch": 2.05, + "learning_rate": 6.849548680121735e-05, + "loss": 1.4805, + "step": 26035 + }, + { + "epoch": 2.05, + "learning_rate": 6.84851111260677e-05, + "loss": 1.4352, + "step": 26036 + }, + { + "epoch": 2.05, + "learning_rate": 6.847473600435919e-05, + "loss": 1.4807, + "step": 26037 + }, + { + "epoch": 2.05, + "learning_rate": 6.846436143616217e-05, + "loss": 1.45, + "step": 26038 + }, + { + "epoch": 2.05, + "learning_rate": 6.84539874215472e-05, + "loss": 1.4742, + "step": 26039 + }, + { + "epoch": 2.05, + "learning_rate": 6.844361396058466e-05, + "loss": 1.4455, + "step": 26040 + }, + { + "epoch": 2.05, + "learning_rate": 6.843324105334496e-05, + "loss": 1.4964, + "step": 26041 + }, + { + "epoch": 2.05, + "learning_rate": 6.84228686998985e-05, + "loss": 1.4335, + "step": 26042 + }, + { + "epoch": 2.05, + "learning_rate": 6.841249690031578e-05, + "loss": 1.4314, + "step": 26043 + }, + { + "epoch": 2.05, + "learning_rate": 6.840212565466719e-05, + "loss": 1.4899, + "step": 26044 + }, + { + "epoch": 2.05, + "learning_rate": 6.839175496302309e-05, + "loss": 1.3959, + "step": 26045 + }, + { + "epoch": 2.05, + "learning_rate": 6.838138482545398e-05, + "loss": 1.4787, + "step": 26046 + }, + { + "epoch": 2.05, + "learning_rate": 6.837101524203024e-05, + "loss": 1.4529, + "step": 26047 + }, + { + "epoch": 2.05, + "learning_rate": 6.83606462128222e-05, + "loss": 1.4482, + "step": 26048 + }, + { + "epoch": 2.05, + "learning_rate": 6.835027773790037e-05, + "loss": 1.4884, + "step": 26049 + }, + { + "epoch": 2.05, + "learning_rate": 6.833990981733506e-05, + "loss": 1.4727, + "step": 26050 + }, + { + "epoch": 2.05, + "learning_rate": 6.832954245119673e-05, + "loss": 1.5095, + "step": 26051 + }, + { + "epoch": 2.05, + "learning_rate": 6.83191756395557e-05, + "loss": 1.4839, + "step": 26052 + }, + { + "epoch": 2.05, + "learning_rate": 6.830880938248243e-05, + "loss": 1.4489, + "step": 26053 + }, + { + "epoch": 2.05, + "learning_rate": 6.829844368004727e-05, + "loss": 1.4929, + "step": 26054 + }, + { + "epoch": 2.05, + "learning_rate": 6.828807853232053e-05, + "loss": 1.4136, + "step": 26055 + }, + { + "epoch": 2.05, + "learning_rate": 6.827771393937272e-05, + "loss": 1.4893, + "step": 26056 + }, + { + "epoch": 2.05, + "learning_rate": 6.826734990127412e-05, + "loss": 1.4335, + "step": 26057 + }, + { + "epoch": 2.05, + "learning_rate": 6.825698641809512e-05, + "loss": 1.4317, + "step": 26058 + }, + { + "epoch": 2.05, + "learning_rate": 6.8246623489906e-05, + "loss": 1.4726, + "step": 26059 + }, + { + "epoch": 2.05, + "learning_rate": 6.823626111677726e-05, + "loss": 1.4438, + "step": 26060 + }, + { + "epoch": 2.05, + "learning_rate": 6.822589929877918e-05, + "loss": 1.3829, + "step": 26061 + }, + { + "epoch": 2.05, + "learning_rate": 6.821553803598206e-05, + "loss": 1.431, + "step": 26062 + }, + { + "epoch": 2.05, + "learning_rate": 6.820517732845636e-05, + "loss": 1.4387, + "step": 26063 + }, + { + "epoch": 2.05, + "learning_rate": 6.819481717627237e-05, + "loss": 1.4373, + "step": 26064 + }, + { + "epoch": 2.05, + "learning_rate": 6.818445757950038e-05, + "loss": 1.4464, + "step": 26065 + }, + { + "epoch": 2.05, + "learning_rate": 6.817409853821077e-05, + "loss": 1.4599, + "step": 26066 + }, + { + "epoch": 2.05, + "learning_rate": 6.816374005247392e-05, + "loss": 1.4456, + "step": 26067 + }, + { + "epoch": 2.05, + "learning_rate": 6.815338212236012e-05, + "loss": 1.5271, + "step": 26068 + }, + { + "epoch": 2.05, + "learning_rate": 6.814302474793963e-05, + "loss": 1.464, + "step": 26069 + }, + { + "epoch": 2.05, + "learning_rate": 6.813266792928289e-05, + "loss": 1.4442, + "step": 26070 + }, + { + "epoch": 2.05, + "learning_rate": 6.812231166646017e-05, + "loss": 1.4486, + "step": 26071 + }, + { + "epoch": 2.05, + "learning_rate": 6.811195595954171e-05, + "loss": 1.4726, + "step": 26072 + }, + { + "epoch": 2.05, + "learning_rate": 6.810160080859792e-05, + "loss": 1.4587, + "step": 26073 + }, + { + "epoch": 2.05, + "learning_rate": 6.809124621369907e-05, + "loss": 1.4483, + "step": 26074 + }, + { + "epoch": 2.05, + "learning_rate": 6.808089217491545e-05, + "loss": 1.4483, + "step": 26075 + }, + { + "epoch": 2.05, + "learning_rate": 6.807053869231733e-05, + "loss": 1.4724, + "step": 26076 + }, + { + "epoch": 2.05, + "learning_rate": 6.806018576597508e-05, + "loss": 1.4877, + "step": 26077 + }, + { + "epoch": 2.05, + "learning_rate": 6.804983339595894e-05, + "loss": 1.4642, + "step": 26078 + }, + { + "epoch": 2.05, + "learning_rate": 6.803948158233918e-05, + "loss": 1.4479, + "step": 26079 + }, + { + "epoch": 2.05, + "learning_rate": 6.802913032518614e-05, + "loss": 1.4311, + "step": 26080 + }, + { + "epoch": 2.05, + "learning_rate": 6.801877962457003e-05, + "loss": 1.4507, + "step": 26081 + }, + { + "epoch": 2.05, + "learning_rate": 6.800842948056124e-05, + "loss": 1.4733, + "step": 26082 + }, + { + "epoch": 2.05, + "learning_rate": 6.799807989322988e-05, + "loss": 1.3995, + "step": 26083 + }, + { + "epoch": 2.05, + "learning_rate": 6.798773086264636e-05, + "loss": 1.4876, + "step": 26084 + }, + { + "epoch": 2.05, + "learning_rate": 6.797738238888091e-05, + "loss": 1.4281, + "step": 26085 + }, + { + "epoch": 2.05, + "learning_rate": 6.79670344720037e-05, + "loss": 1.4656, + "step": 26086 + }, + { + "epoch": 2.05, + "learning_rate": 6.795668711208512e-05, + "loss": 1.4713, + "step": 26087 + }, + { + "epoch": 2.05, + "learning_rate": 6.794634030919535e-05, + "loss": 1.4225, + "step": 26088 + }, + { + "epoch": 2.05, + "learning_rate": 6.79359940634046e-05, + "loss": 1.4483, + "step": 26089 + }, + { + "epoch": 2.05, + "learning_rate": 6.792564837478322e-05, + "loss": 1.4473, + "step": 26090 + }, + { + "epoch": 2.05, + "learning_rate": 6.791530324340138e-05, + "loss": 1.4795, + "step": 26091 + }, + { + "epoch": 2.05, + "learning_rate": 6.790495866932935e-05, + "loss": 1.4913, + "step": 26092 + }, + { + "epoch": 2.05, + "learning_rate": 6.78946146526373e-05, + "loss": 1.4513, + "step": 26093 + }, + { + "epoch": 2.05, + "learning_rate": 6.788427119339553e-05, + "loss": 1.4874, + "step": 26094 + }, + { + "epoch": 2.05, + "learning_rate": 6.787392829167426e-05, + "loss": 1.4595, + "step": 26095 + }, + { + "epoch": 2.05, + "learning_rate": 6.786358594754366e-05, + "loss": 1.4364, + "step": 26096 + }, + { + "epoch": 2.05, + "learning_rate": 6.785324416107396e-05, + "loss": 1.4727, + "step": 26097 + }, + { + "epoch": 2.05, + "learning_rate": 6.784290293233546e-05, + "loss": 1.4071, + "step": 26098 + }, + { + "epoch": 2.05, + "learning_rate": 6.783256226139833e-05, + "loss": 1.4427, + "step": 26099 + }, + { + "epoch": 2.05, + "learning_rate": 6.782222214833268e-05, + "loss": 1.4601, + "step": 26100 + }, + { + "epoch": 2.05, + "learning_rate": 6.781188259320885e-05, + "loss": 1.4354, + "step": 26101 + }, + { + "epoch": 2.05, + "learning_rate": 6.780154359609698e-05, + "loss": 1.4171, + "step": 26102 + }, + { + "epoch": 2.05, + "learning_rate": 6.779120515706721e-05, + "loss": 1.5357, + "step": 26103 + }, + { + "epoch": 2.05, + "learning_rate": 6.778086727618987e-05, + "loss": 1.4728, + "step": 26104 + }, + { + "epoch": 2.05, + "learning_rate": 6.777052995353505e-05, + "loss": 1.3899, + "step": 26105 + }, + { + "epoch": 2.05, + "learning_rate": 6.77601931891729e-05, + "loss": 1.502, + "step": 26106 + }, + { + "epoch": 2.05, + "learning_rate": 6.77498569831737e-05, + "loss": 1.4607, + "step": 26107 + }, + { + "epoch": 2.05, + "learning_rate": 6.77395213356076e-05, + "loss": 1.4252, + "step": 26108 + }, + { + "epoch": 2.05, + "learning_rate": 6.77291862465447e-05, + "loss": 1.4642, + "step": 26109 + }, + { + "epoch": 2.05, + "learning_rate": 6.771885171605527e-05, + "loss": 1.5097, + "step": 26110 + }, + { + "epoch": 2.05, + "learning_rate": 6.770851774420944e-05, + "loss": 1.4552, + "step": 26111 + }, + { + "epoch": 2.05, + "learning_rate": 6.769818433107735e-05, + "loss": 1.4503, + "step": 26112 + }, + { + "epoch": 2.05, + "learning_rate": 6.768785147672907e-05, + "loss": 1.4049, + "step": 26113 + }, + { + "epoch": 2.05, + "learning_rate": 6.767751918123497e-05, + "loss": 1.445, + "step": 26114 + }, + { + "epoch": 2.05, + "learning_rate": 6.766718744466507e-05, + "loss": 1.3894, + "step": 26115 + }, + { + "epoch": 2.05, + "learning_rate": 6.765685626708954e-05, + "loss": 1.4427, + "step": 26116 + }, + { + "epoch": 2.05, + "learning_rate": 6.764652564857845e-05, + "loss": 1.4671, + "step": 26117 + }, + { + "epoch": 2.05, + "learning_rate": 6.763619558920208e-05, + "loss": 1.4223, + "step": 26118 + }, + { + "epoch": 2.06, + "learning_rate": 6.762586608903047e-05, + "loss": 1.5214, + "step": 26119 + }, + { + "epoch": 2.06, + "learning_rate": 6.761553714813373e-05, + "loss": 1.5216, + "step": 26120 + }, + { + "epoch": 2.06, + "learning_rate": 6.760520876658208e-05, + "loss": 1.436, + "step": 26121 + }, + { + "epoch": 2.06, + "learning_rate": 6.75948809444456e-05, + "loss": 1.4839, + "step": 26122 + }, + { + "epoch": 2.06, + "learning_rate": 6.758455368179434e-05, + "loss": 1.4492, + "step": 26123 + }, + { + "epoch": 2.06, + "learning_rate": 6.757422697869853e-05, + "loss": 1.5067, + "step": 26124 + }, + { + "epoch": 2.06, + "learning_rate": 6.756390083522823e-05, + "loss": 1.4788, + "step": 26125 + }, + { + "epoch": 2.06, + "learning_rate": 6.755357525145351e-05, + "loss": 1.4685, + "step": 26126 + }, + { + "epoch": 2.06, + "learning_rate": 6.754325022744457e-05, + "loss": 1.4321, + "step": 26127 + }, + { + "epoch": 2.06, + "learning_rate": 6.753292576327138e-05, + "loss": 1.4808, + "step": 26128 + }, + { + "epoch": 2.06, + "learning_rate": 6.75226018590042e-05, + "loss": 1.4585, + "step": 26129 + }, + { + "epoch": 2.06, + "learning_rate": 6.751227851471297e-05, + "loss": 1.4671, + "step": 26130 + }, + { + "epoch": 2.06, + "learning_rate": 6.750195573046791e-05, + "loss": 1.447, + "step": 26131 + }, + { + "epoch": 2.06, + "learning_rate": 6.749163350633903e-05, + "loss": 1.417, + "step": 26132 + }, + { + "epoch": 2.06, + "learning_rate": 6.748131184239646e-05, + "loss": 1.492, + "step": 26133 + }, + { + "epoch": 2.06, + "learning_rate": 6.747099073871015e-05, + "loss": 1.4587, + "step": 26134 + }, + { + "epoch": 2.06, + "learning_rate": 6.746067019535034e-05, + "loss": 1.4703, + "step": 26135 + }, + { + "epoch": 2.06, + "learning_rate": 6.745035021238703e-05, + "loss": 1.4649, + "step": 26136 + }, + { + "epoch": 2.06, + "learning_rate": 6.744003078989025e-05, + "loss": 1.4378, + "step": 26137 + }, + { + "epoch": 2.06, + "learning_rate": 6.742971192793014e-05, + "loss": 1.4731, + "step": 26138 + }, + { + "epoch": 2.06, + "learning_rate": 6.741939362657671e-05, + "loss": 1.4417, + "step": 26139 + }, + { + "epoch": 2.06, + "learning_rate": 6.740907588589997e-05, + "loss": 1.4441, + "step": 26140 + }, + { + "epoch": 2.06, + "learning_rate": 6.73987587059701e-05, + "loss": 1.4364, + "step": 26141 + }, + { + "epoch": 2.06, + "learning_rate": 6.738844208685707e-05, + "loss": 1.5313, + "step": 26142 + }, + { + "epoch": 2.06, + "learning_rate": 6.737812602863087e-05, + "loss": 1.4421, + "step": 26143 + }, + { + "epoch": 2.06, + "learning_rate": 6.736781053136161e-05, + "loss": 1.4465, + "step": 26144 + }, + { + "epoch": 2.06, + "learning_rate": 6.735749559511936e-05, + "loss": 1.4235, + "step": 26145 + }, + { + "epoch": 2.06, + "learning_rate": 6.734718121997412e-05, + "loss": 1.4975, + "step": 26146 + }, + { + "epoch": 2.06, + "learning_rate": 6.733686740599582e-05, + "loss": 1.4948, + "step": 26147 + }, + { + "epoch": 2.06, + "learning_rate": 6.732655415325467e-05, + "loss": 1.4126, + "step": 26148 + }, + { + "epoch": 2.06, + "learning_rate": 6.731624146182057e-05, + "loss": 1.4249, + "step": 26149 + }, + { + "epoch": 2.06, + "learning_rate": 6.730592933176351e-05, + "loss": 1.4638, + "step": 26150 + }, + { + "epoch": 2.06, + "learning_rate": 6.729561776315362e-05, + "loss": 1.4253, + "step": 26151 + }, + { + "epoch": 2.06, + "learning_rate": 6.728530675606085e-05, + "loss": 1.414, + "step": 26152 + }, + { + "epoch": 2.06, + "learning_rate": 6.727499631055518e-05, + "loss": 1.454, + "step": 26153 + }, + { + "epoch": 2.06, + "learning_rate": 6.72646864267066e-05, + "loss": 1.4875, + "step": 26154 + }, + { + "epoch": 2.06, + "learning_rate": 6.725437710458518e-05, + "loss": 1.4821, + "step": 26155 + }, + { + "epoch": 2.06, + "learning_rate": 6.724406834426088e-05, + "loss": 1.5272, + "step": 26156 + }, + { + "epoch": 2.06, + "learning_rate": 6.723376014580364e-05, + "loss": 1.4288, + "step": 26157 + }, + { + "epoch": 2.06, + "learning_rate": 6.722345250928355e-05, + "loss": 1.4495, + "step": 26158 + }, + { + "epoch": 2.06, + "learning_rate": 6.721314543477053e-05, + "loss": 1.4774, + "step": 26159 + }, + { + "epoch": 2.06, + "learning_rate": 6.720283892233451e-05, + "loss": 1.4917, + "step": 26160 + }, + { + "epoch": 2.06, + "learning_rate": 6.719253297204553e-05, + "loss": 1.4018, + "step": 26161 + }, + { + "epoch": 2.06, + "learning_rate": 6.718222758397361e-05, + "loss": 1.4474, + "step": 26162 + }, + { + "epoch": 2.06, + "learning_rate": 6.717192275818865e-05, + "loss": 1.4464, + "step": 26163 + }, + { + "epoch": 2.06, + "learning_rate": 6.716161849476059e-05, + "loss": 1.4445, + "step": 26164 + }, + { + "epoch": 2.06, + "learning_rate": 6.715131479375948e-05, + "loss": 1.4748, + "step": 26165 + }, + { + "epoch": 2.06, + "learning_rate": 6.71410116552552e-05, + "loss": 1.4825, + "step": 26166 + }, + { + "epoch": 2.06, + "learning_rate": 6.713070907931769e-05, + "loss": 1.4654, + "step": 26167 + }, + { + "epoch": 2.06, + "learning_rate": 6.712040706601697e-05, + "loss": 1.471, + "step": 26168 + }, + { + "epoch": 2.06, + "learning_rate": 6.711010561542297e-05, + "loss": 1.4617, + "step": 26169 + }, + { + "epoch": 2.06, + "learning_rate": 6.709980472760561e-05, + "loss": 1.45, + "step": 26170 + }, + { + "epoch": 2.06, + "learning_rate": 6.708950440263477e-05, + "loss": 1.4413, + "step": 26171 + }, + { + "epoch": 2.06, + "learning_rate": 6.70792046405805e-05, + "loss": 1.4353, + "step": 26172 + }, + { + "epoch": 2.06, + "learning_rate": 6.706890544151265e-05, + "loss": 1.4654, + "step": 26173 + }, + { + "epoch": 2.06, + "learning_rate": 6.705860680550112e-05, + "loss": 1.5221, + "step": 26174 + }, + { + "epoch": 2.06, + "learning_rate": 6.70483087326159e-05, + "loss": 1.409, + "step": 26175 + }, + { + "epoch": 2.06, + "learning_rate": 6.703801122292692e-05, + "loss": 1.4428, + "step": 26176 + }, + { + "epoch": 2.06, + "learning_rate": 6.702771427650407e-05, + "loss": 1.4111, + "step": 26177 + }, + { + "epoch": 2.06, + "learning_rate": 6.701741789341719e-05, + "loss": 1.4423, + "step": 26178 + }, + { + "epoch": 2.06, + "learning_rate": 6.700712207373631e-05, + "loss": 1.4449, + "step": 26179 + }, + { + "epoch": 2.06, + "learning_rate": 6.699682681753128e-05, + "loss": 1.4889, + "step": 26180 + }, + { + "epoch": 2.06, + "learning_rate": 6.698653212487192e-05, + "loss": 1.4898, + "step": 26181 + }, + { + "epoch": 2.06, + "learning_rate": 6.697623799582826e-05, + "loss": 1.4684, + "step": 26182 + }, + { + "epoch": 2.06, + "learning_rate": 6.696594443047013e-05, + "loss": 1.4335, + "step": 26183 + }, + { + "epoch": 2.06, + "learning_rate": 6.695565142886735e-05, + "loss": 1.4338, + "step": 26184 + }, + { + "epoch": 2.06, + "learning_rate": 6.694535899108994e-05, + "loss": 1.4769, + "step": 26185 + }, + { + "epoch": 2.06, + "learning_rate": 6.693506711720769e-05, + "loss": 1.4645, + "step": 26186 + }, + { + "epoch": 2.06, + "learning_rate": 6.69247758072905e-05, + "loss": 1.4445, + "step": 26187 + }, + { + "epoch": 2.06, + "learning_rate": 6.69144850614082e-05, + "loss": 1.4205, + "step": 26188 + }, + { + "epoch": 2.06, + "learning_rate": 6.690419487963072e-05, + "loss": 1.4481, + "step": 26189 + }, + { + "epoch": 2.06, + "learning_rate": 6.689390526202793e-05, + "loss": 1.5238, + "step": 26190 + }, + { + "epoch": 2.06, + "learning_rate": 6.68836162086696e-05, + "loss": 1.425, + "step": 26191 + }, + { + "epoch": 2.06, + "learning_rate": 6.687332771962564e-05, + "loss": 1.473, + "step": 26192 + }, + { + "epoch": 2.06, + "learning_rate": 6.686303979496596e-05, + "loss": 1.4709, + "step": 26193 + }, + { + "epoch": 2.06, + "learning_rate": 6.685275243476039e-05, + "loss": 1.4425, + "step": 26194 + }, + { + "epoch": 2.06, + "learning_rate": 6.684246563907867e-05, + "loss": 1.5366, + "step": 26195 + }, + { + "epoch": 2.06, + "learning_rate": 6.683217940799077e-05, + "loss": 1.4849, + "step": 26196 + }, + { + "epoch": 2.06, + "learning_rate": 6.682189374156649e-05, + "loss": 1.4908, + "step": 26197 + }, + { + "epoch": 2.06, + "learning_rate": 6.681160863987558e-05, + "loss": 1.4614, + "step": 26198 + }, + { + "epoch": 2.06, + "learning_rate": 6.680132410298802e-05, + "loss": 1.4566, + "step": 26199 + }, + { + "epoch": 2.06, + "learning_rate": 6.679104013097353e-05, + "loss": 1.4538, + "step": 26200 + }, + { + "epoch": 2.06, + "learning_rate": 6.67807567239019e-05, + "loss": 1.4207, + "step": 26201 + }, + { + "epoch": 2.06, + "learning_rate": 6.677047388184308e-05, + "loss": 1.4318, + "step": 26202 + }, + { + "epoch": 2.06, + "learning_rate": 6.676019160486682e-05, + "loss": 1.4274, + "step": 26203 + }, + { + "epoch": 2.06, + "learning_rate": 6.674990989304286e-05, + "loss": 1.4927, + "step": 26204 + }, + { + "epoch": 2.06, + "learning_rate": 6.673962874644113e-05, + "loss": 1.4643, + "step": 26205 + }, + { + "epoch": 2.06, + "learning_rate": 6.672934816513136e-05, + "loss": 1.428, + "step": 26206 + }, + { + "epoch": 2.06, + "learning_rate": 6.671906814918331e-05, + "loss": 1.4009, + "step": 26207 + }, + { + "epoch": 2.06, + "learning_rate": 6.670878869866684e-05, + "loss": 1.4459, + "step": 26208 + }, + { + "epoch": 2.06, + "learning_rate": 6.669850981365177e-05, + "loss": 1.4608, + "step": 26209 + }, + { + "epoch": 2.06, + "learning_rate": 6.668823149420787e-05, + "loss": 1.5082, + "step": 26210 + }, + { + "epoch": 2.06, + "learning_rate": 6.667795374040489e-05, + "loss": 1.4515, + "step": 26211 + }, + { + "epoch": 2.06, + "learning_rate": 6.666767655231256e-05, + "loss": 1.4693, + "step": 26212 + }, + { + "epoch": 2.06, + "learning_rate": 6.665739993000079e-05, + "loss": 1.5056, + "step": 26213 + }, + { + "epoch": 2.06, + "learning_rate": 6.664712387353928e-05, + "loss": 1.5139, + "step": 26214 + }, + { + "epoch": 2.06, + "learning_rate": 6.663684838299774e-05, + "loss": 1.4591, + "step": 26215 + }, + { + "epoch": 2.06, + "learning_rate": 6.662657345844605e-05, + "loss": 1.491, + "step": 26216 + }, + { + "epoch": 2.06, + "learning_rate": 6.661629909995392e-05, + "loss": 1.4686, + "step": 26217 + }, + { + "epoch": 2.06, + "learning_rate": 6.660602530759104e-05, + "loss": 1.4659, + "step": 26218 + }, + { + "epoch": 2.06, + "learning_rate": 6.659575208142731e-05, + "loss": 1.4763, + "step": 26219 + }, + { + "epoch": 2.06, + "learning_rate": 6.658547942153238e-05, + "loss": 1.4842, + "step": 26220 + }, + { + "epoch": 2.06, + "learning_rate": 6.657520732797596e-05, + "loss": 1.4521, + "step": 26221 + }, + { + "epoch": 2.06, + "learning_rate": 6.65649358008279e-05, + "loss": 1.4726, + "step": 26222 + }, + { + "epoch": 2.06, + "learning_rate": 6.655466484015781e-05, + "loss": 1.4544, + "step": 26223 + }, + { + "epoch": 2.06, + "learning_rate": 6.654439444603557e-05, + "loss": 1.4395, + "step": 26224 + }, + { + "epoch": 2.06, + "learning_rate": 6.653412461853078e-05, + "loss": 1.4826, + "step": 26225 + }, + { + "epoch": 2.06, + "learning_rate": 6.652385535771327e-05, + "loss": 1.4637, + "step": 26226 + }, + { + "epoch": 2.06, + "learning_rate": 6.651358666365273e-05, + "loss": 1.4196, + "step": 26227 + }, + { + "epoch": 2.06, + "learning_rate": 6.650331853641886e-05, + "loss": 1.5012, + "step": 26228 + }, + { + "epoch": 2.06, + "learning_rate": 6.649305097608132e-05, + "loss": 1.4882, + "step": 26229 + }, + { + "epoch": 2.06, + "learning_rate": 6.648278398270995e-05, + "loss": 1.4164, + "step": 26230 + }, + { + "epoch": 2.06, + "learning_rate": 6.647251755637437e-05, + "loss": 1.4827, + "step": 26231 + }, + { + "epoch": 2.06, + "learning_rate": 6.646225169714426e-05, + "loss": 1.465, + "step": 26232 + }, + { + "epoch": 2.06, + "learning_rate": 6.645198640508941e-05, + "loss": 1.4334, + "step": 26233 + }, + { + "epoch": 2.06, + "learning_rate": 6.644172168027947e-05, + "loss": 1.4291, + "step": 26234 + }, + { + "epoch": 2.06, + "learning_rate": 6.643145752278405e-05, + "loss": 1.4243, + "step": 26235 + }, + { + "epoch": 2.06, + "learning_rate": 6.6421193932673e-05, + "loss": 1.4189, + "step": 26236 + }, + { + "epoch": 2.06, + "learning_rate": 6.641093091001591e-05, + "loss": 1.4842, + "step": 26237 + }, + { + "epoch": 2.06, + "learning_rate": 6.640066845488242e-05, + "loss": 1.4914, + "step": 26238 + }, + { + "epoch": 2.06, + "learning_rate": 6.639040656734226e-05, + "loss": 1.4629, + "step": 26239 + }, + { + "epoch": 2.06, + "learning_rate": 6.638014524746515e-05, + "loss": 1.4438, + "step": 26240 + }, + { + "epoch": 2.06, + "learning_rate": 6.636988449532071e-05, + "loss": 1.4472, + "step": 26241 + }, + { + "epoch": 2.06, + "learning_rate": 6.635962431097853e-05, + "loss": 1.4722, + "step": 26242 + }, + { + "epoch": 2.06, + "learning_rate": 6.634936469450844e-05, + "loss": 1.4336, + "step": 26243 + }, + { + "epoch": 2.06, + "learning_rate": 6.633910564597998e-05, + "loss": 1.4574, + "step": 26244 + }, + { + "epoch": 2.06, + "learning_rate": 6.632884716546281e-05, + "loss": 1.5092, + "step": 26245 + }, + { + "epoch": 2.07, + "learning_rate": 6.631858925302654e-05, + "loss": 1.4867, + "step": 26246 + }, + { + "epoch": 2.07, + "learning_rate": 6.630833190874095e-05, + "loss": 1.4241, + "step": 26247 + }, + { + "epoch": 2.07, + "learning_rate": 6.629807513267559e-05, + "loss": 1.4798, + "step": 26248 + }, + { + "epoch": 2.07, + "learning_rate": 6.628781892490004e-05, + "loss": 1.4446, + "step": 26249 + }, + { + "epoch": 2.07, + "learning_rate": 6.627756328548408e-05, + "loss": 1.4529, + "step": 26250 + }, + { + "epoch": 2.07, + "learning_rate": 6.626730821449724e-05, + "loss": 1.4349, + "step": 26251 + }, + { + "epoch": 2.07, + "learning_rate": 6.625705371200915e-05, + "loss": 1.452, + "step": 26252 + }, + { + "epoch": 2.07, + "learning_rate": 6.624679977808947e-05, + "loss": 1.4674, + "step": 26253 + }, + { + "epoch": 2.07, + "learning_rate": 6.623654641280776e-05, + "loss": 1.4313, + "step": 26254 + }, + { + "epoch": 2.07, + "learning_rate": 6.622629361623374e-05, + "loss": 1.448, + "step": 26255 + }, + { + "epoch": 2.07, + "learning_rate": 6.62160413884369e-05, + "loss": 1.4419, + "step": 26256 + }, + { + "epoch": 2.07, + "learning_rate": 6.620578972948693e-05, + "loss": 1.4573, + "step": 26257 + }, + { + "epoch": 2.07, + "learning_rate": 6.619553863945343e-05, + "loss": 1.4198, + "step": 26258 + }, + { + "epoch": 2.07, + "learning_rate": 6.618528811840593e-05, + "loss": 1.4476, + "step": 26259 + }, + { + "epoch": 2.07, + "learning_rate": 6.617503816641412e-05, + "loss": 1.4392, + "step": 26260 + }, + { + "epoch": 2.07, + "learning_rate": 6.616478878354752e-05, + "loss": 1.4694, + "step": 26261 + }, + { + "epoch": 2.07, + "learning_rate": 6.615453996987571e-05, + "loss": 1.5072, + "step": 26262 + }, + { + "epoch": 2.07, + "learning_rate": 6.614429172546835e-05, + "loss": 1.4231, + "step": 26263 + }, + { + "epoch": 2.07, + "learning_rate": 6.613404405039498e-05, + "loss": 1.4627, + "step": 26264 + }, + { + "epoch": 2.07, + "learning_rate": 6.612379694472515e-05, + "loss": 1.438, + "step": 26265 + }, + { + "epoch": 2.07, + "learning_rate": 6.611355040852842e-05, + "loss": 1.4924, + "step": 26266 + }, + { + "epoch": 2.07, + "learning_rate": 6.610330444187443e-05, + "loss": 1.4191, + "step": 26267 + }, + { + "epoch": 2.07, + "learning_rate": 6.609305904483272e-05, + "loss": 1.4644, + "step": 26268 + }, + { + "epoch": 2.07, + "learning_rate": 6.608281421747276e-05, + "loss": 1.4805, + "step": 26269 + }, + { + "epoch": 2.07, + "learning_rate": 6.607256995986419e-05, + "loss": 1.4664, + "step": 26270 + }, + { + "epoch": 2.07, + "learning_rate": 6.606232627207664e-05, + "loss": 1.4964, + "step": 26271 + }, + { + "epoch": 2.07, + "learning_rate": 6.605208315417953e-05, + "loss": 1.4618, + "step": 26272 + }, + { + "epoch": 2.07, + "learning_rate": 6.604184060624242e-05, + "loss": 1.5477, + "step": 26273 + }, + { + "epoch": 2.07, + "learning_rate": 6.603159862833492e-05, + "loss": 1.4063, + "step": 26274 + }, + { + "epoch": 2.07, + "learning_rate": 6.602135722052654e-05, + "loss": 1.4427, + "step": 26275 + }, + { + "epoch": 2.07, + "learning_rate": 6.601111638288674e-05, + "loss": 1.4569, + "step": 26276 + }, + { + "epoch": 2.07, + "learning_rate": 6.600087611548516e-05, + "loss": 1.4253, + "step": 26277 + }, + { + "epoch": 2.07, + "learning_rate": 6.599063641839129e-05, + "loss": 1.4607, + "step": 26278 + }, + { + "epoch": 2.07, + "learning_rate": 6.598039729167456e-05, + "loss": 1.4602, + "step": 26279 + }, + { + "epoch": 2.07, + "learning_rate": 6.597015873540464e-05, + "loss": 1.4851, + "step": 26280 + }, + { + "epoch": 2.07, + "learning_rate": 6.595992074965097e-05, + "loss": 1.4738, + "step": 26281 + }, + { + "epoch": 2.07, + "learning_rate": 6.594968333448306e-05, + "loss": 1.4157, + "step": 26282 + }, + { + "epoch": 2.07, + "learning_rate": 6.593944648997037e-05, + "loss": 1.4798, + "step": 26283 + }, + { + "epoch": 2.07, + "learning_rate": 6.59292102161825e-05, + "loss": 1.4843, + "step": 26284 + }, + { + "epoch": 2.07, + "learning_rate": 6.591897451318884e-05, + "loss": 1.4617, + "step": 26285 + }, + { + "epoch": 2.07, + "learning_rate": 6.590873938105899e-05, + "loss": 1.4734, + "step": 26286 + }, + { + "epoch": 2.07, + "learning_rate": 6.589850481986236e-05, + "loss": 1.4679, + "step": 26287 + }, + { + "epoch": 2.07, + "learning_rate": 6.588827082966851e-05, + "loss": 1.484, + "step": 26288 + }, + { + "epoch": 2.07, + "learning_rate": 6.587803741054689e-05, + "loss": 1.428, + "step": 26289 + }, + { + "epoch": 2.07, + "learning_rate": 6.586780456256692e-05, + "loss": 1.3617, + "step": 26290 + }, + { + "epoch": 2.07, + "learning_rate": 6.585757228579818e-05, + "loss": 1.4651, + "step": 26291 + }, + { + "epoch": 2.07, + "learning_rate": 6.584734058031008e-05, + "loss": 1.4827, + "step": 26292 + }, + { + "epoch": 2.07, + "learning_rate": 6.583710944617206e-05, + "loss": 1.444, + "step": 26293 + }, + { + "epoch": 2.07, + "learning_rate": 6.582687888345367e-05, + "loss": 1.466, + "step": 26294 + }, + { + "epoch": 2.07, + "learning_rate": 6.581664889222433e-05, + "loss": 1.4992, + "step": 26295 + }, + { + "epoch": 2.07, + "learning_rate": 6.580641947255343e-05, + "loss": 1.4335, + "step": 26296 + }, + { + "epoch": 2.07, + "learning_rate": 6.579619062451053e-05, + "loss": 1.5327, + "step": 26297 + }, + { + "epoch": 2.07, + "learning_rate": 6.578596234816503e-05, + "loss": 1.4818, + "step": 26298 + }, + { + "epoch": 2.07, + "learning_rate": 6.577573464358637e-05, + "loss": 1.4427, + "step": 26299 + }, + { + "epoch": 2.07, + "learning_rate": 6.576550751084394e-05, + "loss": 1.4502, + "step": 26300 + }, + { + "epoch": 2.07, + "learning_rate": 6.575528095000723e-05, + "loss": 1.4387, + "step": 26301 + }, + { + "epoch": 2.07, + "learning_rate": 6.574505496114573e-05, + "loss": 1.4641, + "step": 26302 + }, + { + "epoch": 2.07, + "learning_rate": 6.573482954432875e-05, + "loss": 1.4392, + "step": 26303 + }, + { + "epoch": 2.07, + "learning_rate": 6.572460469962583e-05, + "loss": 1.4815, + "step": 26304 + }, + { + "epoch": 2.07, + "learning_rate": 6.571438042710635e-05, + "loss": 1.4311, + "step": 26305 + }, + { + "epoch": 2.07, + "learning_rate": 6.57041567268397e-05, + "loss": 1.4725, + "step": 26306 + }, + { + "epoch": 2.07, + "learning_rate": 6.569393359889526e-05, + "loss": 1.4688, + "step": 26307 + }, + { + "epoch": 2.07, + "learning_rate": 6.568371104334255e-05, + "loss": 1.4743, + "step": 26308 + }, + { + "epoch": 2.07, + "learning_rate": 6.567348906025091e-05, + "loss": 1.488, + "step": 26309 + }, + { + "epoch": 2.07, + "learning_rate": 6.566326764968967e-05, + "loss": 1.5141, + "step": 26310 + }, + { + "epoch": 2.07, + "learning_rate": 6.565304681172837e-05, + "loss": 1.4263, + "step": 26311 + }, + { + "epoch": 2.07, + "learning_rate": 6.564282654643634e-05, + "loss": 1.4483, + "step": 26312 + }, + { + "epoch": 2.07, + "learning_rate": 6.56326068538829e-05, + "loss": 1.4142, + "step": 26313 + }, + { + "epoch": 2.07, + "learning_rate": 6.562238773413755e-05, + "loss": 1.4498, + "step": 26314 + }, + { + "epoch": 2.07, + "learning_rate": 6.561216918726963e-05, + "loss": 1.4325, + "step": 26315 + }, + { + "epoch": 2.07, + "learning_rate": 6.560195121334847e-05, + "loss": 1.5254, + "step": 26316 + }, + { + "epoch": 2.07, + "learning_rate": 6.559173381244348e-05, + "loss": 1.4379, + "step": 26317 + }, + { + "epoch": 2.07, + "learning_rate": 6.55815169846241e-05, + "loss": 1.513, + "step": 26318 + }, + { + "epoch": 2.07, + "learning_rate": 6.557130072995962e-05, + "loss": 1.4636, + "step": 26319 + }, + { + "epoch": 2.07, + "learning_rate": 6.556108504851937e-05, + "loss": 1.4356, + "step": 26320 + }, + { + "epoch": 2.07, + "learning_rate": 6.555086994037281e-05, + "loss": 1.4513, + "step": 26321 + }, + { + "epoch": 2.07, + "learning_rate": 6.554065540558924e-05, + "loss": 1.4132, + "step": 26322 + }, + { + "epoch": 2.07, + "learning_rate": 6.553044144423801e-05, + "loss": 1.4608, + "step": 26323 + }, + { + "epoch": 2.07, + "learning_rate": 6.55202280563884e-05, + "loss": 1.4391, + "step": 26324 + }, + { + "epoch": 2.07, + "learning_rate": 6.551001524210988e-05, + "loss": 1.4326, + "step": 26325 + }, + { + "epoch": 2.07, + "learning_rate": 6.549980300147176e-05, + "loss": 1.418, + "step": 26326 + }, + { + "epoch": 2.07, + "learning_rate": 6.548959133454324e-05, + "loss": 1.4353, + "step": 26327 + }, + { + "epoch": 2.07, + "learning_rate": 6.547938024139386e-05, + "loss": 1.4798, + "step": 26328 + }, + { + "epoch": 2.07, + "learning_rate": 6.546916972209283e-05, + "loss": 1.4385, + "step": 26329 + }, + { + "epoch": 2.07, + "learning_rate": 6.545895977670944e-05, + "loss": 1.4806, + "step": 26330 + }, + { + "epoch": 2.07, + "learning_rate": 6.544875040531311e-05, + "loss": 1.4543, + "step": 26331 + }, + { + "epoch": 2.07, + "learning_rate": 6.54385416079731e-05, + "loss": 1.4314, + "step": 26332 + }, + { + "epoch": 2.07, + "learning_rate": 6.542833338475868e-05, + "loss": 1.4503, + "step": 26333 + }, + { + "epoch": 2.07, + "learning_rate": 6.54181257357392e-05, + "loss": 1.3937, + "step": 26334 + }, + { + "epoch": 2.07, + "learning_rate": 6.540791866098403e-05, + "loss": 1.4807, + "step": 26335 + }, + { + "epoch": 2.07, + "learning_rate": 6.53977121605624e-05, + "loss": 1.4547, + "step": 26336 + }, + { + "epoch": 2.07, + "learning_rate": 6.538750623454359e-05, + "loss": 1.4607, + "step": 26337 + }, + { + "epoch": 2.07, + "learning_rate": 6.537730088299694e-05, + "loss": 1.4644, + "step": 26338 + }, + { + "epoch": 2.07, + "learning_rate": 6.536709610599174e-05, + "loss": 1.4869, + "step": 26339 + }, + { + "epoch": 2.07, + "learning_rate": 6.535689190359724e-05, + "loss": 1.507, + "step": 26340 + }, + { + "epoch": 2.07, + "learning_rate": 6.534668827588268e-05, + "loss": 1.4947, + "step": 26341 + }, + { + "epoch": 2.07, + "learning_rate": 6.533648522291747e-05, + "loss": 1.4844, + "step": 26342 + }, + { + "epoch": 2.07, + "learning_rate": 6.532628274477078e-05, + "loss": 1.4696, + "step": 26343 + }, + { + "epoch": 2.07, + "learning_rate": 6.531608084151185e-05, + "loss": 1.4212, + "step": 26344 + }, + { + "epoch": 2.07, + "learning_rate": 6.530587951321006e-05, + "loss": 1.4211, + "step": 26345 + }, + { + "epoch": 2.07, + "learning_rate": 6.52956787599346e-05, + "loss": 1.4767, + "step": 26346 + }, + { + "epoch": 2.07, + "learning_rate": 6.52854785817547e-05, + "loss": 1.4824, + "step": 26347 + }, + { + "epoch": 2.07, + "learning_rate": 6.527527897873965e-05, + "loss": 1.4427, + "step": 26348 + }, + { + "epoch": 2.07, + "learning_rate": 6.526507995095874e-05, + "loss": 1.4708, + "step": 26349 + }, + { + "epoch": 2.07, + "learning_rate": 6.525488149848117e-05, + "loss": 1.4509, + "step": 26350 + }, + { + "epoch": 2.07, + "learning_rate": 6.524468362137616e-05, + "loss": 1.4819, + "step": 26351 + }, + { + "epoch": 2.07, + "learning_rate": 6.523448631971301e-05, + "loss": 1.4269, + "step": 26352 + }, + { + "epoch": 2.07, + "learning_rate": 6.522428959356093e-05, + "loss": 1.4352, + "step": 26353 + }, + { + "epoch": 2.07, + "learning_rate": 6.521409344298908e-05, + "loss": 1.4302, + "step": 26354 + }, + { + "epoch": 2.07, + "learning_rate": 6.520389786806681e-05, + "loss": 1.4406, + "step": 26355 + }, + { + "epoch": 2.07, + "learning_rate": 6.519370286886327e-05, + "loss": 1.4412, + "step": 26356 + }, + { + "epoch": 2.07, + "learning_rate": 6.518350844544771e-05, + "loss": 1.4365, + "step": 26357 + }, + { + "epoch": 2.07, + "learning_rate": 6.517331459788924e-05, + "loss": 1.4405, + "step": 26358 + }, + { + "epoch": 2.07, + "learning_rate": 6.516312132625723e-05, + "loss": 1.4117, + "step": 26359 + }, + { + "epoch": 2.07, + "learning_rate": 6.51529286306208e-05, + "loss": 1.4446, + "step": 26360 + }, + { + "epoch": 2.07, + "learning_rate": 6.51427365110491e-05, + "loss": 1.4802, + "step": 26361 + }, + { + "epoch": 2.07, + "learning_rate": 6.513254496761143e-05, + "loss": 1.4551, + "step": 26362 + }, + { + "epoch": 2.07, + "learning_rate": 6.512235400037698e-05, + "loss": 1.4239, + "step": 26363 + }, + { + "epoch": 2.07, + "learning_rate": 6.511216360941483e-05, + "loss": 1.4168, + "step": 26364 + }, + { + "epoch": 2.07, + "learning_rate": 6.510197379479426e-05, + "loss": 1.5528, + "step": 26365 + }, + { + "epoch": 2.07, + "learning_rate": 6.509178455658447e-05, + "loss": 1.4603, + "step": 26366 + }, + { + "epoch": 2.07, + "learning_rate": 6.508159589485464e-05, + "loss": 1.4949, + "step": 26367 + }, + { + "epoch": 2.07, + "learning_rate": 6.507140780967382e-05, + "loss": 1.5011, + "step": 26368 + }, + { + "epoch": 2.07, + "learning_rate": 6.506122030111134e-05, + "loss": 1.4695, + "step": 26369 + }, + { + "epoch": 2.07, + "learning_rate": 6.505103336923633e-05, + "loss": 1.4851, + "step": 26370 + }, + { + "epoch": 2.07, + "learning_rate": 6.504084701411783e-05, + "loss": 1.4252, + "step": 26371 + }, + { + "epoch": 2.07, + "learning_rate": 6.503066123582517e-05, + "loss": 1.4571, + "step": 26372 + }, + { + "epoch": 2.08, + "learning_rate": 6.502047603442744e-05, + "loss": 1.459, + "step": 26373 + }, + { + "epoch": 2.08, + "learning_rate": 6.501029140999371e-05, + "loss": 1.4432, + "step": 26374 + }, + { + "epoch": 2.08, + "learning_rate": 6.500010736259326e-05, + "loss": 1.521, + "step": 26375 + }, + { + "epoch": 2.08, + "learning_rate": 6.498992389229517e-05, + "loss": 1.3807, + "step": 26376 + }, + { + "epoch": 2.08, + "learning_rate": 6.497974099916859e-05, + "loss": 1.4451, + "step": 26377 + }, + { + "epoch": 2.08, + "learning_rate": 6.49695586832826e-05, + "loss": 1.4208, + "step": 26378 + }, + { + "epoch": 2.08, + "learning_rate": 6.495937694470643e-05, + "loss": 1.4882, + "step": 26379 + }, + { + "epoch": 2.08, + "learning_rate": 6.49491957835091e-05, + "loss": 1.4626, + "step": 26380 + }, + { + "epoch": 2.08, + "learning_rate": 6.493901519975986e-05, + "loss": 1.4922, + "step": 26381 + }, + { + "epoch": 2.08, + "learning_rate": 6.492883519352771e-05, + "loss": 1.4815, + "step": 26382 + }, + { + "epoch": 2.08, + "learning_rate": 6.491865576488187e-05, + "loss": 1.431, + "step": 26383 + }, + { + "epoch": 2.08, + "learning_rate": 6.490847691389142e-05, + "loss": 1.4519, + "step": 26384 + }, + { + "epoch": 2.08, + "learning_rate": 6.489829864062539e-05, + "loss": 1.4798, + "step": 26385 + }, + { + "epoch": 2.08, + "learning_rate": 6.4888120945153e-05, + "loss": 1.4597, + "step": 26386 + }, + { + "epoch": 2.08, + "learning_rate": 6.487794382754331e-05, + "loss": 1.4675, + "step": 26387 + }, + { + "epoch": 2.08, + "learning_rate": 6.486776728786535e-05, + "loss": 1.477, + "step": 26388 + }, + { + "epoch": 2.08, + "learning_rate": 6.485759132618832e-05, + "loss": 1.4888, + "step": 26389 + }, + { + "epoch": 2.08, + "learning_rate": 6.484741594258127e-05, + "loss": 1.4635, + "step": 26390 + }, + { + "epoch": 2.08, + "learning_rate": 6.483724113711322e-05, + "loss": 1.4342, + "step": 26391 + }, + { + "epoch": 2.08, + "learning_rate": 6.482706690985336e-05, + "loss": 1.4566, + "step": 26392 + }, + { + "epoch": 2.08, + "learning_rate": 6.481689326087069e-05, + "loss": 1.4324, + "step": 26393 + }, + { + "epoch": 2.08, + "learning_rate": 6.480672019023433e-05, + "loss": 1.4642, + "step": 26394 + }, + { + "epoch": 2.08, + "learning_rate": 6.479654769801327e-05, + "loss": 1.502, + "step": 26395 + }, + { + "epoch": 2.08, + "learning_rate": 6.478637578427662e-05, + "loss": 1.4974, + "step": 26396 + }, + { + "epoch": 2.08, + "learning_rate": 6.477620444909351e-05, + "loss": 1.4181, + "step": 26397 + }, + { + "epoch": 2.08, + "learning_rate": 6.476603369253296e-05, + "loss": 1.4353, + "step": 26398 + }, + { + "epoch": 2.08, + "learning_rate": 6.475586351466393e-05, + "loss": 1.428, + "step": 26399 + }, + { + "epoch": 2.08, + "learning_rate": 6.474569391555561e-05, + "loss": 1.4565, + "step": 26400 + }, + { + "epoch": 2.08, + "learning_rate": 6.473552489527699e-05, + "loss": 1.4905, + "step": 26401 + }, + { + "epoch": 2.08, + "learning_rate": 6.472535645389703e-05, + "loss": 1.4462, + "step": 26402 + }, + { + "epoch": 2.08, + "learning_rate": 6.471518859148491e-05, + "loss": 1.4283, + "step": 26403 + }, + { + "epoch": 2.08, + "learning_rate": 6.470502130810959e-05, + "loss": 1.4279, + "step": 26404 + }, + { + "epoch": 2.08, + "learning_rate": 6.469485460384005e-05, + "loss": 1.4208, + "step": 26405 + }, + { + "epoch": 2.08, + "learning_rate": 6.468468847874543e-05, + "loss": 1.4453, + "step": 26406 + }, + { + "epoch": 2.08, + "learning_rate": 6.467452293289468e-05, + "loss": 1.4739, + "step": 26407 + }, + { + "epoch": 2.08, + "learning_rate": 6.466435796635678e-05, + "loss": 1.4396, + "step": 26408 + }, + { + "epoch": 2.08, + "learning_rate": 6.465419357920087e-05, + "loss": 1.499, + "step": 26409 + }, + { + "epoch": 2.08, + "learning_rate": 6.464402977149588e-05, + "loss": 1.5256, + "step": 26410 + }, + { + "epoch": 2.08, + "learning_rate": 6.463386654331077e-05, + "loss": 1.4427, + "step": 26411 + }, + { + "epoch": 2.08, + "learning_rate": 6.462370389471459e-05, + "loss": 1.4876, + "step": 26412 + }, + { + "epoch": 2.08, + "learning_rate": 6.461354182577641e-05, + "loss": 1.4515, + "step": 26413 + }, + { + "epoch": 2.08, + "learning_rate": 6.460338033656516e-05, + "loss": 1.4525, + "step": 26414 + }, + { + "epoch": 2.08, + "learning_rate": 6.459321942714977e-05, + "loss": 1.4731, + "step": 26415 + }, + { + "epoch": 2.08, + "learning_rate": 6.458305909759936e-05, + "loss": 1.4902, + "step": 26416 + }, + { + "epoch": 2.08, + "learning_rate": 6.457289934798282e-05, + "loss": 1.497, + "step": 26417 + }, + { + "epoch": 2.08, + "learning_rate": 6.456274017836917e-05, + "loss": 1.4594, + "step": 26418 + }, + { + "epoch": 2.08, + "learning_rate": 6.45525815888273e-05, + "loss": 1.4427, + "step": 26419 + }, + { + "epoch": 2.08, + "learning_rate": 6.454242357942629e-05, + "loss": 1.4492, + "step": 26420 + }, + { + "epoch": 2.08, + "learning_rate": 6.453226615023508e-05, + "loss": 1.4704, + "step": 26421 + }, + { + "epoch": 2.08, + "learning_rate": 6.452210930132257e-05, + "loss": 1.5112, + "step": 26422 + }, + { + "epoch": 2.08, + "learning_rate": 6.451195303275782e-05, + "loss": 1.4572, + "step": 26423 + }, + { + "epoch": 2.08, + "learning_rate": 6.450179734460971e-05, + "loss": 1.4572, + "step": 26424 + }, + { + "epoch": 2.08, + "learning_rate": 6.449164223694718e-05, + "loss": 1.4238, + "step": 26425 + }, + { + "epoch": 2.08, + "learning_rate": 6.448148770983928e-05, + "loss": 1.3934, + "step": 26426 + }, + { + "epoch": 2.08, + "learning_rate": 6.44713337633548e-05, + "loss": 1.484, + "step": 26427 + }, + { + "epoch": 2.08, + "learning_rate": 6.446118039756283e-05, + "loss": 1.402, + "step": 26428 + }, + { + "epoch": 2.08, + "learning_rate": 6.445102761253218e-05, + "loss": 1.4699, + "step": 26429 + }, + { + "epoch": 2.08, + "learning_rate": 6.444087540833191e-05, + "loss": 1.3887, + "step": 26430 + }, + { + "epoch": 2.08, + "learning_rate": 6.443072378503088e-05, + "loss": 1.4023, + "step": 26431 + }, + { + "epoch": 2.08, + "learning_rate": 6.442057274269796e-05, + "loss": 1.4503, + "step": 26432 + }, + { + "epoch": 2.08, + "learning_rate": 6.441042228140218e-05, + "loss": 1.4727, + "step": 26433 + }, + { + "epoch": 2.08, + "learning_rate": 6.440027240121239e-05, + "loss": 1.4256, + "step": 26434 + }, + { + "epoch": 2.08, + "learning_rate": 6.439012310219752e-05, + "loss": 1.3808, + "step": 26435 + }, + { + "epoch": 2.08, + "learning_rate": 6.437997438442642e-05, + "loss": 1.4906, + "step": 26436 + }, + { + "epoch": 2.08, + "learning_rate": 6.436982624796808e-05, + "loss": 1.4619, + "step": 26437 + }, + { + "epoch": 2.08, + "learning_rate": 6.43596786928914e-05, + "loss": 1.4347, + "step": 26438 + }, + { + "epoch": 2.08, + "learning_rate": 6.434953171926517e-05, + "loss": 1.4187, + "step": 26439 + }, + { + "epoch": 2.08, + "learning_rate": 6.43393853271584e-05, + "loss": 1.4466, + "step": 26440 + }, + { + "epoch": 2.08, + "learning_rate": 6.432923951663993e-05, + "loss": 1.4354, + "step": 26441 + }, + { + "epoch": 2.08, + "learning_rate": 6.43190942877786e-05, + "loss": 1.4687, + "step": 26442 + }, + { + "epoch": 2.08, + "learning_rate": 6.430894964064332e-05, + "loss": 1.4173, + "step": 26443 + }, + { + "epoch": 2.08, + "learning_rate": 6.429880557530308e-05, + "loss": 1.4328, + "step": 26444 + }, + { + "epoch": 2.08, + "learning_rate": 6.428866209182663e-05, + "loss": 1.4209, + "step": 26445 + }, + { + "epoch": 2.08, + "learning_rate": 6.427851919028279e-05, + "loss": 1.4644, + "step": 26446 + }, + { + "epoch": 2.08, + "learning_rate": 6.426837687074058e-05, + "loss": 1.4258, + "step": 26447 + }, + { + "epoch": 2.08, + "learning_rate": 6.425823513326879e-05, + "loss": 1.4416, + "step": 26448 + }, + { + "epoch": 2.08, + "learning_rate": 6.424809397793618e-05, + "loss": 1.4342, + "step": 26449 + }, + { + "epoch": 2.08, + "learning_rate": 6.423795340481178e-05, + "loss": 1.4207, + "step": 26450 + }, + { + "epoch": 2.08, + "learning_rate": 6.422781341396432e-05, + "loss": 1.3997, + "step": 26451 + }, + { + "epoch": 2.08, + "learning_rate": 6.421767400546269e-05, + "loss": 1.4456, + "step": 26452 + }, + { + "epoch": 2.08, + "learning_rate": 6.420753517937566e-05, + "loss": 1.4468, + "step": 26453 + }, + { + "epoch": 2.08, + "learning_rate": 6.419739693577217e-05, + "loss": 1.4224, + "step": 26454 + }, + { + "epoch": 2.08, + "learning_rate": 6.418725927472101e-05, + "loss": 1.4713, + "step": 26455 + }, + { + "epoch": 2.08, + "learning_rate": 6.417712219629095e-05, + "loss": 1.514, + "step": 26456 + }, + { + "epoch": 2.08, + "learning_rate": 6.416698570055091e-05, + "loss": 1.4857, + "step": 26457 + }, + { + "epoch": 2.08, + "learning_rate": 6.415684978756964e-05, + "loss": 1.4685, + "step": 26458 + }, + { + "epoch": 2.08, + "learning_rate": 6.414671445741603e-05, + "loss": 1.4729, + "step": 26459 + }, + { + "epoch": 2.08, + "learning_rate": 6.41365797101588e-05, + "loss": 1.463, + "step": 26460 + }, + { + "epoch": 2.08, + "learning_rate": 6.412644554586685e-05, + "loss": 1.494, + "step": 26461 + }, + { + "epoch": 2.08, + "learning_rate": 6.411631196460897e-05, + "loss": 1.4874, + "step": 26462 + }, + { + "epoch": 2.08, + "learning_rate": 6.410617896645385e-05, + "loss": 1.4301, + "step": 26463 + }, + { + "epoch": 2.08, + "learning_rate": 6.409604655147046e-05, + "loss": 1.4839, + "step": 26464 + }, + { + "epoch": 2.08, + "learning_rate": 6.408591471972749e-05, + "loss": 1.4446, + "step": 26465 + }, + { + "epoch": 2.08, + "learning_rate": 6.407578347129371e-05, + "loss": 1.447, + "step": 26466 + }, + { + "epoch": 2.08, + "learning_rate": 6.406565280623798e-05, + "loss": 1.4955, + "step": 26467 + }, + { + "epoch": 2.08, + "learning_rate": 6.405552272462905e-05, + "loss": 1.4422, + "step": 26468 + }, + { + "epoch": 2.08, + "learning_rate": 6.40453932265357e-05, + "loss": 1.4591, + "step": 26469 + }, + { + "epoch": 2.08, + "learning_rate": 6.403526431202663e-05, + "loss": 1.4656, + "step": 26470 + }, + { + "epoch": 2.08, + "learning_rate": 6.402513598117074e-05, + "loss": 1.4817, + "step": 26471 + }, + { + "epoch": 2.08, + "learning_rate": 6.401500823403675e-05, + "loss": 1.4535, + "step": 26472 + }, + { + "epoch": 2.08, + "learning_rate": 6.400488107069332e-05, + "loss": 1.4554, + "step": 26473 + }, + { + "epoch": 2.08, + "learning_rate": 6.39947544912093e-05, + "loss": 1.4653, + "step": 26474 + }, + { + "epoch": 2.08, + "learning_rate": 6.398462849565349e-05, + "loss": 1.4393, + "step": 26475 + }, + { + "epoch": 2.08, + "learning_rate": 6.397450308409459e-05, + "loss": 1.4896, + "step": 26476 + }, + { + "epoch": 2.08, + "learning_rate": 6.396437825660128e-05, + "loss": 1.4492, + "step": 26477 + }, + { + "epoch": 2.08, + "learning_rate": 6.395425401324241e-05, + "loss": 1.4932, + "step": 26478 + }, + { + "epoch": 2.08, + "learning_rate": 6.394413035408668e-05, + "loss": 1.4598, + "step": 26479 + }, + { + "epoch": 2.08, + "learning_rate": 6.393400727920277e-05, + "loss": 1.4415, + "step": 26480 + }, + { + "epoch": 2.08, + "learning_rate": 6.392388478865951e-05, + "loss": 1.4442, + "step": 26481 + }, + { + "epoch": 2.08, + "learning_rate": 6.391376288252555e-05, + "loss": 1.4765, + "step": 26482 + }, + { + "epoch": 2.08, + "learning_rate": 6.39036415608696e-05, + "loss": 1.4451, + "step": 26483 + }, + { + "epoch": 2.08, + "learning_rate": 6.389352082376045e-05, + "loss": 1.4338, + "step": 26484 + }, + { + "epoch": 2.08, + "learning_rate": 6.388340067126679e-05, + "loss": 1.4954, + "step": 26485 + }, + { + "epoch": 2.08, + "learning_rate": 6.387328110345725e-05, + "loss": 1.4807, + "step": 26486 + }, + { + "epoch": 2.08, + "learning_rate": 6.386316212040068e-05, + "loss": 1.4546, + "step": 26487 + }, + { + "epoch": 2.08, + "learning_rate": 6.385304372216569e-05, + "loss": 1.4531, + "step": 26488 + }, + { + "epoch": 2.08, + "learning_rate": 6.384292590882099e-05, + "loss": 1.5048, + "step": 26489 + }, + { + "epoch": 2.08, + "learning_rate": 6.383280868043516e-05, + "loss": 1.4356, + "step": 26490 + }, + { + "epoch": 2.08, + "learning_rate": 6.382269203707714e-05, + "loss": 1.4811, + "step": 26491 + }, + { + "epoch": 2.08, + "learning_rate": 6.381257597881547e-05, + "loss": 1.5132, + "step": 26492 + }, + { + "epoch": 2.08, + "learning_rate": 6.380246050571885e-05, + "loss": 1.487, + "step": 26493 + }, + { + "epoch": 2.08, + "learning_rate": 6.37923456178559e-05, + "loss": 1.4155, + "step": 26494 + }, + { + "epoch": 2.08, + "learning_rate": 6.378223131529542e-05, + "loss": 1.4372, + "step": 26495 + }, + { + "epoch": 2.08, + "learning_rate": 6.377211759810598e-05, + "loss": 1.3723, + "step": 26496 + }, + { + "epoch": 2.08, + "learning_rate": 6.376200446635624e-05, + "loss": 1.4635, + "step": 26497 + }, + { + "epoch": 2.08, + "learning_rate": 6.375189192011496e-05, + "loss": 1.4945, + "step": 26498 + }, + { + "epoch": 2.08, + "learning_rate": 6.374177995945072e-05, + "loss": 1.4555, + "step": 26499 + }, + { + "epoch": 2.09, + "learning_rate": 6.373166858443217e-05, + "loss": 1.4114, + "step": 26500 + }, + { + "epoch": 2.09, + "learning_rate": 6.3721557795128e-05, + "loss": 1.4389, + "step": 26501 + }, + { + "epoch": 2.09, + "learning_rate": 6.371144759160686e-05, + "loss": 1.4728, + "step": 26502 + }, + { + "epoch": 2.09, + "learning_rate": 6.370133797393732e-05, + "loss": 1.4685, + "step": 26503 + }, + { + "epoch": 2.09, + "learning_rate": 6.369122894218812e-05, + "loss": 1.4379, + "step": 26504 + }, + { + "epoch": 2.09, + "learning_rate": 6.368112049642785e-05, + "loss": 1.4723, + "step": 26505 + }, + { + "epoch": 2.09, + "learning_rate": 6.367101263672506e-05, + "loss": 1.4693, + "step": 26506 + }, + { + "epoch": 2.09, + "learning_rate": 6.366090536314849e-05, + "loss": 1.4263, + "step": 26507 + }, + { + "epoch": 2.09, + "learning_rate": 6.365079867576677e-05, + "loss": 1.4467, + "step": 26508 + }, + { + "epoch": 2.09, + "learning_rate": 6.364069257464846e-05, + "loss": 1.4348, + "step": 26509 + }, + { + "epoch": 2.09, + "learning_rate": 6.36305870598622e-05, + "loss": 1.4424, + "step": 26510 + }, + { + "epoch": 2.09, + "learning_rate": 6.362048213147654e-05, + "loss": 1.463, + "step": 26511 + }, + { + "epoch": 2.09, + "learning_rate": 6.36103777895602e-05, + "loss": 1.456, + "step": 26512 + }, + { + "epoch": 2.09, + "learning_rate": 6.360027403418171e-05, + "loss": 1.4555, + "step": 26513 + }, + { + "epoch": 2.09, + "learning_rate": 6.359017086540962e-05, + "loss": 1.4717, + "step": 26514 + }, + { + "epoch": 2.09, + "learning_rate": 6.358006828331266e-05, + "loss": 1.438, + "step": 26515 + }, + { + "epoch": 2.09, + "learning_rate": 6.356996628795933e-05, + "loss": 1.4466, + "step": 26516 + }, + { + "epoch": 2.09, + "learning_rate": 6.355986487941818e-05, + "loss": 1.4667, + "step": 26517 + }, + { + "epoch": 2.09, + "learning_rate": 6.35497640577579e-05, + "loss": 1.41, + "step": 26518 + }, + { + "epoch": 2.09, + "learning_rate": 6.353966382304702e-05, + "loss": 1.4647, + "step": 26519 + }, + { + "epoch": 2.09, + "learning_rate": 6.352956417535405e-05, + "loss": 1.4642, + "step": 26520 + }, + { + "epoch": 2.09, + "learning_rate": 6.351946511474762e-05, + "loss": 1.4593, + "step": 26521 + }, + { + "epoch": 2.09, + "learning_rate": 6.350936664129636e-05, + "loss": 1.4564, + "step": 26522 + }, + { + "epoch": 2.09, + "learning_rate": 6.349926875506877e-05, + "loss": 1.471, + "step": 26523 + }, + { + "epoch": 2.09, + "learning_rate": 6.348917145613335e-05, + "loss": 1.4822, + "step": 26524 + }, + { + "epoch": 2.09, + "learning_rate": 6.347907474455876e-05, + "loss": 1.4553, + "step": 26525 + }, + { + "epoch": 2.09, + "learning_rate": 6.346897862041353e-05, + "loss": 1.4618, + "step": 26526 + }, + { + "epoch": 2.09, + "learning_rate": 6.345888308376612e-05, + "loss": 1.4413, + "step": 26527 + }, + { + "epoch": 2.09, + "learning_rate": 6.344878813468518e-05, + "loss": 1.4842, + "step": 26528 + }, + { + "epoch": 2.09, + "learning_rate": 6.343869377323921e-05, + "loss": 1.4991, + "step": 26529 + }, + { + "epoch": 2.09, + "learning_rate": 6.342859999949676e-05, + "loss": 1.4755, + "step": 26530 + }, + { + "epoch": 2.09, + "learning_rate": 6.341850681352627e-05, + "loss": 1.4877, + "step": 26531 + }, + { + "epoch": 2.09, + "learning_rate": 6.340841421539638e-05, + "loss": 1.4576, + "step": 26532 + }, + { + "epoch": 2.09, + "learning_rate": 6.33983222051756e-05, + "loss": 1.4589, + "step": 26533 + }, + { + "epoch": 2.09, + "learning_rate": 6.338823078293235e-05, + "loss": 1.4139, + "step": 26534 + }, + { + "epoch": 2.09, + "learning_rate": 6.337813994873527e-05, + "loss": 1.4486, + "step": 26535 + }, + { + "epoch": 2.09, + "learning_rate": 6.336804970265284e-05, + "loss": 1.4277, + "step": 26536 + }, + { + "epoch": 2.09, + "learning_rate": 6.335796004475346e-05, + "loss": 1.4469, + "step": 26537 + }, + { + "epoch": 2.09, + "learning_rate": 6.334787097510575e-05, + "loss": 1.4414, + "step": 26538 + }, + { + "epoch": 2.09, + "learning_rate": 6.33377824937782e-05, + "loss": 1.4756, + "step": 26539 + }, + { + "epoch": 2.09, + "learning_rate": 6.33276946008393e-05, + "loss": 1.499, + "step": 26540 + }, + { + "epoch": 2.09, + "learning_rate": 6.331760729635747e-05, + "loss": 1.4157, + "step": 26541 + }, + { + "epoch": 2.09, + "learning_rate": 6.33075205804013e-05, + "loss": 1.4733, + "step": 26542 + }, + { + "epoch": 2.09, + "learning_rate": 6.329743445303922e-05, + "loss": 1.4847, + "step": 26543 + }, + { + "epoch": 2.09, + "learning_rate": 6.328734891433967e-05, + "loss": 1.467, + "step": 26544 + }, + { + "epoch": 2.09, + "learning_rate": 6.327726396437123e-05, + "loss": 1.4654, + "step": 26545 + }, + { + "epoch": 2.09, + "learning_rate": 6.32671796032023e-05, + "loss": 1.4492, + "step": 26546 + }, + { + "epoch": 2.09, + "learning_rate": 6.325709583090135e-05, + "loss": 1.5019, + "step": 26547 + }, + { + "epoch": 2.09, + "learning_rate": 6.32470126475368e-05, + "loss": 1.4385, + "step": 26548 + }, + { + "epoch": 2.09, + "learning_rate": 6.323693005317722e-05, + "loss": 1.473, + "step": 26549 + }, + { + "epoch": 2.09, + "learning_rate": 6.3226848047891e-05, + "loss": 1.4376, + "step": 26550 + }, + { + "epoch": 2.09, + "learning_rate": 6.321676663174656e-05, + "loss": 1.4356, + "step": 26551 + }, + { + "epoch": 2.09, + "learning_rate": 6.320668580481241e-05, + "loss": 1.4879, + "step": 26552 + }, + { + "epoch": 2.09, + "learning_rate": 6.319660556715692e-05, + "loss": 1.4166, + "step": 26553 + }, + { + "epoch": 2.09, + "learning_rate": 6.318652591884865e-05, + "loss": 1.4729, + "step": 26554 + }, + { + "epoch": 2.09, + "learning_rate": 6.317644685995589e-05, + "loss": 1.4785, + "step": 26555 + }, + { + "epoch": 2.09, + "learning_rate": 6.316636839054719e-05, + "loss": 1.4754, + "step": 26556 + }, + { + "epoch": 2.09, + "learning_rate": 6.315629051069095e-05, + "loss": 1.4272, + "step": 26557 + }, + { + "epoch": 2.09, + "learning_rate": 6.31462132204555e-05, + "loss": 1.4426, + "step": 26558 + }, + { + "epoch": 2.09, + "learning_rate": 6.31361365199094e-05, + "loss": 1.4279, + "step": 26559 + }, + { + "epoch": 2.09, + "learning_rate": 6.312606040912099e-05, + "loss": 1.4914, + "step": 26560 + }, + { + "epoch": 2.09, + "learning_rate": 6.311598488815864e-05, + "loss": 1.4263, + "step": 26561 + }, + { + "epoch": 2.09, + "learning_rate": 6.310590995709085e-05, + "loss": 1.4829, + "step": 26562 + }, + { + "epoch": 2.09, + "learning_rate": 6.3095835615986e-05, + "loss": 1.4385, + "step": 26563 + }, + { + "epoch": 2.09, + "learning_rate": 6.308576186491245e-05, + "loss": 1.4924, + "step": 26564 + }, + { + "epoch": 2.09, + "learning_rate": 6.307568870393855e-05, + "loss": 1.4519, + "step": 26565 + }, + { + "epoch": 2.09, + "learning_rate": 6.306561613313284e-05, + "loss": 1.4247, + "step": 26566 + }, + { + "epoch": 2.09, + "learning_rate": 6.30555441525636e-05, + "loss": 1.4832, + "step": 26567 + }, + { + "epoch": 2.09, + "learning_rate": 6.304547276229919e-05, + "loss": 1.4836, + "step": 26568 + }, + { + "epoch": 2.09, + "learning_rate": 6.303540196240802e-05, + "loss": 1.4352, + "step": 26569 + }, + { + "epoch": 2.09, + "learning_rate": 6.302533175295855e-05, + "loss": 1.4801, + "step": 26570 + }, + { + "epoch": 2.09, + "learning_rate": 6.301526213401907e-05, + "loss": 1.4405, + "step": 26571 + }, + { + "epoch": 2.09, + "learning_rate": 6.300519310565791e-05, + "loss": 1.4835, + "step": 26572 + }, + { + "epoch": 2.09, + "learning_rate": 6.299512466794353e-05, + "loss": 1.4599, + "step": 26573 + }, + { + "epoch": 2.09, + "learning_rate": 6.298505682094425e-05, + "loss": 1.5011, + "step": 26574 + }, + { + "epoch": 2.09, + "learning_rate": 6.297498956472836e-05, + "loss": 1.4546, + "step": 26575 + }, + { + "epoch": 2.09, + "learning_rate": 6.296492289936433e-05, + "loss": 1.4233, + "step": 26576 + }, + { + "epoch": 2.09, + "learning_rate": 6.295485682492042e-05, + "loss": 1.4342, + "step": 26577 + }, + { + "epoch": 2.09, + "learning_rate": 6.294479134146496e-05, + "loss": 1.414, + "step": 26578 + }, + { + "epoch": 2.09, + "learning_rate": 6.293472644906637e-05, + "loss": 1.446, + "step": 26579 + }, + { + "epoch": 2.09, + "learning_rate": 6.292466214779294e-05, + "loss": 1.4866, + "step": 26580 + }, + { + "epoch": 2.09, + "learning_rate": 6.291459843771296e-05, + "loss": 1.4418, + "step": 26581 + }, + { + "epoch": 2.09, + "learning_rate": 6.290453531889484e-05, + "loss": 1.464, + "step": 26582 + }, + { + "epoch": 2.09, + "learning_rate": 6.289447279140687e-05, + "loss": 1.4417, + "step": 26583 + }, + { + "epoch": 2.09, + "learning_rate": 6.288441085531729e-05, + "loss": 1.5272, + "step": 26584 + }, + { + "epoch": 2.09, + "learning_rate": 6.287434951069451e-05, + "loss": 1.4491, + "step": 26585 + }, + { + "epoch": 2.09, + "learning_rate": 6.286428875760686e-05, + "loss": 1.5196, + "step": 26586 + }, + { + "epoch": 2.09, + "learning_rate": 6.285422859612261e-05, + "loss": 1.4957, + "step": 26587 + }, + { + "epoch": 2.09, + "learning_rate": 6.284416902631005e-05, + "loss": 1.456, + "step": 26588 + }, + { + "epoch": 2.09, + "learning_rate": 6.283411004823742e-05, + "loss": 1.4395, + "step": 26589 + }, + { + "epoch": 2.09, + "learning_rate": 6.282405166197314e-05, + "loss": 1.4182, + "step": 26590 + }, + { + "epoch": 2.09, + "learning_rate": 6.281399386758545e-05, + "loss": 1.4708, + "step": 26591 + }, + { + "epoch": 2.09, + "learning_rate": 6.280393666514258e-05, + "loss": 1.4247, + "step": 26592 + }, + { + "epoch": 2.09, + "learning_rate": 6.279388005471291e-05, + "loss": 1.4368, + "step": 26593 + }, + { + "epoch": 2.09, + "learning_rate": 6.278382403636467e-05, + "loss": 1.4703, + "step": 26594 + }, + { + "epoch": 2.09, + "learning_rate": 6.277376861016608e-05, + "loss": 1.4238, + "step": 26595 + }, + { + "epoch": 2.09, + "learning_rate": 6.276371377618552e-05, + "loss": 1.4209, + "step": 26596 + }, + { + "epoch": 2.09, + "learning_rate": 6.27536595344912e-05, + "loss": 1.4939, + "step": 26597 + }, + { + "epoch": 2.09, + "learning_rate": 6.274360588515133e-05, + "loss": 1.4689, + "step": 26598 + }, + { + "epoch": 2.09, + "learning_rate": 6.273355282823429e-05, + "loss": 1.4505, + "step": 26599 + }, + { + "epoch": 2.09, + "learning_rate": 6.272350036380821e-05, + "loss": 1.4776, + "step": 26600 + }, + { + "epoch": 2.09, + "learning_rate": 6.271344849194144e-05, + "loss": 1.458, + "step": 26601 + }, + { + "epoch": 2.09, + "learning_rate": 6.270339721270216e-05, + "loss": 1.4187, + "step": 26602 + }, + { + "epoch": 2.09, + "learning_rate": 6.269334652615866e-05, + "loss": 1.4211, + "step": 26603 + }, + { + "epoch": 2.09, + "learning_rate": 6.268329643237917e-05, + "loss": 1.4341, + "step": 26604 + }, + { + "epoch": 2.09, + "learning_rate": 6.267324693143191e-05, + "loss": 1.4239, + "step": 26605 + }, + { + "epoch": 2.09, + "learning_rate": 6.266319802338506e-05, + "loss": 1.4541, + "step": 26606 + }, + { + "epoch": 2.09, + "learning_rate": 6.265314970830696e-05, + "loss": 1.4754, + "step": 26607 + }, + { + "epoch": 2.09, + "learning_rate": 6.264310198626576e-05, + "loss": 1.5246, + "step": 26608 + }, + { + "epoch": 2.09, + "learning_rate": 6.263305485732964e-05, + "loss": 1.4669, + "step": 26609 + }, + { + "epoch": 2.09, + "learning_rate": 6.262300832156693e-05, + "loss": 1.4589, + "step": 26610 + }, + { + "epoch": 2.09, + "learning_rate": 6.261296237904576e-05, + "loss": 1.4393, + "step": 26611 + }, + { + "epoch": 2.09, + "learning_rate": 6.26029170298343e-05, + "loss": 1.4533, + "step": 26612 + }, + { + "epoch": 2.09, + "learning_rate": 6.259287227400087e-05, + "loss": 1.4699, + "step": 26613 + }, + { + "epoch": 2.09, + "learning_rate": 6.258282811161359e-05, + "loss": 1.4854, + "step": 26614 + }, + { + "epoch": 2.09, + "learning_rate": 6.257278454274061e-05, + "loss": 1.4435, + "step": 26615 + }, + { + "epoch": 2.09, + "learning_rate": 6.256274156745018e-05, + "loss": 1.4967, + "step": 26616 + }, + { + "epoch": 2.09, + "learning_rate": 6.255269918581055e-05, + "loss": 1.4652, + "step": 26617 + }, + { + "epoch": 2.09, + "learning_rate": 6.254265739788981e-05, + "loss": 1.4681, + "step": 26618 + }, + { + "epoch": 2.09, + "learning_rate": 6.253261620375612e-05, + "loss": 1.4784, + "step": 26619 + }, + { + "epoch": 2.09, + "learning_rate": 6.252257560347776e-05, + "loss": 1.4865, + "step": 26620 + }, + { + "epoch": 2.09, + "learning_rate": 6.251253559712283e-05, + "loss": 1.4539, + "step": 26621 + }, + { + "epoch": 2.09, + "learning_rate": 6.250249618475952e-05, + "loss": 1.4986, + "step": 26622 + }, + { + "epoch": 2.09, + "learning_rate": 6.249245736645589e-05, + "loss": 1.468, + "step": 26623 + }, + { + "epoch": 2.09, + "learning_rate": 6.248241914228025e-05, + "loss": 1.4742, + "step": 26624 + }, + { + "epoch": 2.09, + "learning_rate": 6.247238151230071e-05, + "loss": 1.4153, + "step": 26625 + }, + { + "epoch": 2.09, + "learning_rate": 6.246234447658532e-05, + "loss": 1.52, + "step": 26626 + }, + { + "epoch": 2.1, + "learning_rate": 6.245230803520237e-05, + "loss": 1.439, + "step": 26627 + }, + { + "epoch": 2.1, + "learning_rate": 6.244227218821992e-05, + "loss": 1.4691, + "step": 26628 + }, + { + "epoch": 2.1, + "learning_rate": 6.243223693570608e-05, + "loss": 1.4878, + "step": 26629 + }, + { + "epoch": 2.1, + "learning_rate": 6.242220227772908e-05, + "loss": 1.4242, + "step": 26630 + }, + { + "epoch": 2.1, + "learning_rate": 6.241216821435695e-05, + "loss": 1.4667, + "step": 26631 + }, + { + "epoch": 2.1, + "learning_rate": 6.240213474565791e-05, + "loss": 1.5085, + "step": 26632 + }, + { + "epoch": 2.1, + "learning_rate": 6.239210187169997e-05, + "loss": 1.4728, + "step": 26633 + }, + { + "epoch": 2.1, + "learning_rate": 6.238206959255138e-05, + "loss": 1.5155, + "step": 26634 + }, + { + "epoch": 2.1, + "learning_rate": 6.23720379082802e-05, + "loss": 1.4723, + "step": 26635 + }, + { + "epoch": 2.1, + "learning_rate": 6.236200681895446e-05, + "loss": 1.437, + "step": 26636 + }, + { + "epoch": 2.1, + "learning_rate": 6.235197632464236e-05, + "loss": 1.4305, + "step": 26637 + }, + { + "epoch": 2.1, + "learning_rate": 6.2341946425412e-05, + "loss": 1.4615, + "step": 26638 + }, + { + "epoch": 2.1, + "learning_rate": 6.233191712133139e-05, + "loss": 1.4464, + "step": 26639 + }, + { + "epoch": 2.1, + "learning_rate": 6.232188841246874e-05, + "loss": 1.4047, + "step": 26640 + }, + { + "epoch": 2.1, + "learning_rate": 6.231186029889207e-05, + "loss": 1.3892, + "step": 26641 + }, + { + "epoch": 2.1, + "learning_rate": 6.23018327806695e-05, + "loss": 1.4781, + "step": 26642 + }, + { + "epoch": 2.1, + "learning_rate": 6.229180585786902e-05, + "loss": 1.3912, + "step": 26643 + }, + { + "epoch": 2.1, + "learning_rate": 6.228177953055882e-05, + "loss": 1.4263, + "step": 26644 + }, + { + "epoch": 2.1, + "learning_rate": 6.227175379880694e-05, + "loss": 1.4277, + "step": 26645 + }, + { + "epoch": 2.1, + "learning_rate": 6.22617286626814e-05, + "loss": 1.4224, + "step": 26646 + }, + { + "epoch": 2.1, + "learning_rate": 6.225170412225029e-05, + "loss": 1.4736, + "step": 26647 + }, + { + "epoch": 2.1, + "learning_rate": 6.224168017758175e-05, + "loss": 1.508, + "step": 26648 + }, + { + "epoch": 2.1, + "learning_rate": 6.223165682874377e-05, + "loss": 1.4517, + "step": 26649 + }, + { + "epoch": 2.1, + "learning_rate": 6.222163407580434e-05, + "loss": 1.4649, + "step": 26650 + }, + { + "epoch": 2.1, + "learning_rate": 6.221161191883164e-05, + "loss": 1.4561, + "step": 26651 + }, + { + "epoch": 2.1, + "learning_rate": 6.220159035789364e-05, + "loss": 1.4369, + "step": 26652 + }, + { + "epoch": 2.1, + "learning_rate": 6.219156939305835e-05, + "loss": 1.477, + "step": 26653 + }, + { + "epoch": 2.1, + "learning_rate": 6.218154902439388e-05, + "loss": 1.4635, + "step": 26654 + }, + { + "epoch": 2.1, + "learning_rate": 6.217152925196824e-05, + "loss": 1.481, + "step": 26655 + }, + { + "epoch": 2.1, + "learning_rate": 6.216151007584941e-05, + "loss": 1.4434, + "step": 26656 + }, + { + "epoch": 2.1, + "learning_rate": 6.215149149610549e-05, + "loss": 1.5031, + "step": 26657 + }, + { + "epoch": 2.1, + "learning_rate": 6.214147351280447e-05, + "loss": 1.4586, + "step": 26658 + }, + { + "epoch": 2.1, + "learning_rate": 6.213145612601436e-05, + "loss": 1.4283, + "step": 26659 + }, + { + "epoch": 2.1, + "learning_rate": 6.212143933580311e-05, + "loss": 1.428, + "step": 26660 + }, + { + "epoch": 2.1, + "learning_rate": 6.211142314223885e-05, + "loss": 1.4065, + "step": 26661 + }, + { + "epoch": 2.1, + "learning_rate": 6.210140754538955e-05, + "loss": 1.4827, + "step": 26662 + }, + { + "epoch": 2.1, + "learning_rate": 6.209139254532311e-05, + "loss": 1.4857, + "step": 26663 + }, + { + "epoch": 2.1, + "learning_rate": 6.208137814210758e-05, + "loss": 1.4977, + "step": 26664 + }, + { + "epoch": 2.1, + "learning_rate": 6.207136433581107e-05, + "loss": 1.4854, + "step": 26665 + }, + { + "epoch": 2.1, + "learning_rate": 6.206135112650145e-05, + "loss": 1.4825, + "step": 26666 + }, + { + "epoch": 2.1, + "learning_rate": 6.205133851424668e-05, + "loss": 1.4165, + "step": 26667 + }, + { + "epoch": 2.1, + "learning_rate": 6.204132649911484e-05, + "loss": 1.412, + "step": 26668 + }, + { + "epoch": 2.1, + "learning_rate": 6.203131508117386e-05, + "loss": 1.4902, + "step": 26669 + }, + { + "epoch": 2.1, + "learning_rate": 6.202130426049163e-05, + "loss": 1.4499, + "step": 26670 + }, + { + "epoch": 2.1, + "learning_rate": 6.201129403713627e-05, + "loss": 1.4473, + "step": 26671 + }, + { + "epoch": 2.1, + "learning_rate": 6.200128441117566e-05, + "loss": 1.4945, + "step": 26672 + }, + { + "epoch": 2.1, + "learning_rate": 6.199127538267772e-05, + "loss": 1.476, + "step": 26673 + }, + { + "epoch": 2.1, + "learning_rate": 6.198126695171051e-05, + "loss": 1.4609, + "step": 26674 + }, + { + "epoch": 2.1, + "learning_rate": 6.19712591183419e-05, + "loss": 1.4535, + "step": 26675 + }, + { + "epoch": 2.1, + "learning_rate": 6.196125188263988e-05, + "loss": 1.4467, + "step": 26676 + }, + { + "epoch": 2.1, + "learning_rate": 6.195124524467232e-05, + "loss": 1.4633, + "step": 26677 + }, + { + "epoch": 2.1, + "learning_rate": 6.19412392045072e-05, + "loss": 1.3969, + "step": 26678 + }, + { + "epoch": 2.1, + "learning_rate": 6.193123376221256e-05, + "loss": 1.4735, + "step": 26679 + }, + { + "epoch": 2.1, + "learning_rate": 6.192122891785617e-05, + "loss": 1.4245, + "step": 26680 + }, + { + "epoch": 2.1, + "learning_rate": 6.191122467150607e-05, + "loss": 1.4597, + "step": 26681 + }, + { + "epoch": 2.1, + "learning_rate": 6.190122102323016e-05, + "loss": 1.5169, + "step": 26682 + }, + { + "epoch": 2.1, + "learning_rate": 6.189121797309634e-05, + "loss": 1.3973, + "step": 26683 + }, + { + "epoch": 2.1, + "learning_rate": 6.188121552117247e-05, + "loss": 1.4557, + "step": 26684 + }, + { + "epoch": 2.1, + "learning_rate": 6.187121366752657e-05, + "loss": 1.4852, + "step": 26685 + }, + { + "epoch": 2.1, + "learning_rate": 6.18612124122265e-05, + "loss": 1.4712, + "step": 26686 + }, + { + "epoch": 2.1, + "learning_rate": 6.185121175534011e-05, + "loss": 1.4117, + "step": 26687 + }, + { + "epoch": 2.1, + "learning_rate": 6.18412116969354e-05, + "loss": 1.4481, + "step": 26688 + }, + { + "epoch": 2.1, + "learning_rate": 6.183121223708019e-05, + "loss": 1.443, + "step": 26689 + }, + { + "epoch": 2.1, + "learning_rate": 6.182121337584236e-05, + "loss": 1.501, + "step": 26690 + }, + { + "epoch": 2.1, + "learning_rate": 6.181121511328989e-05, + "loss": 1.4445, + "step": 26691 + }, + { + "epoch": 2.1, + "learning_rate": 6.18012174494906e-05, + "loss": 1.449, + "step": 26692 + }, + { + "epoch": 2.1, + "learning_rate": 6.179122038451231e-05, + "loss": 1.4963, + "step": 26693 + }, + { + "epoch": 2.1, + "learning_rate": 6.178122391842296e-05, + "loss": 1.4433, + "step": 26694 + }, + { + "epoch": 2.1, + "learning_rate": 6.177122805129046e-05, + "loss": 1.4515, + "step": 26695 + }, + { + "epoch": 2.1, + "learning_rate": 6.176123278318264e-05, + "loss": 1.4362, + "step": 26696 + }, + { + "epoch": 2.1, + "learning_rate": 6.175123811416731e-05, + "loss": 1.4589, + "step": 26697 + }, + { + "epoch": 2.1, + "learning_rate": 6.174124404431242e-05, + "loss": 1.4562, + "step": 26698 + }, + { + "epoch": 2.1, + "learning_rate": 6.173125057368578e-05, + "loss": 1.4746, + "step": 26699 + }, + { + "epoch": 2.1, + "learning_rate": 6.172125770235524e-05, + "loss": 1.4712, + "step": 26700 + }, + { + "epoch": 2.1, + "learning_rate": 6.171126543038857e-05, + "loss": 1.4556, + "step": 26701 + }, + { + "epoch": 2.1, + "learning_rate": 6.170127375785376e-05, + "loss": 1.424, + "step": 26702 + }, + { + "epoch": 2.1, + "learning_rate": 6.169128268481858e-05, + "loss": 1.4521, + "step": 26703 + }, + { + "epoch": 2.1, + "learning_rate": 6.168129221135079e-05, + "loss": 1.4737, + "step": 26704 + }, + { + "epoch": 2.1, + "learning_rate": 6.167130233751834e-05, + "loss": 1.4618, + "step": 26705 + }, + { + "epoch": 2.1, + "learning_rate": 6.1661313063389e-05, + "loss": 1.4364, + "step": 26706 + }, + { + "epoch": 2.1, + "learning_rate": 6.165132438903055e-05, + "loss": 1.4394, + "step": 26707 + }, + { + "epoch": 2.1, + "learning_rate": 6.164133631451091e-05, + "loss": 1.4575, + "step": 26708 + }, + { + "epoch": 2.1, + "learning_rate": 6.163134883989782e-05, + "loss": 1.5167, + "step": 26709 + }, + { + "epoch": 2.1, + "learning_rate": 6.162136196525907e-05, + "loss": 1.4884, + "step": 26710 + }, + { + "epoch": 2.1, + "learning_rate": 6.16113756906625e-05, + "loss": 1.4907, + "step": 26711 + }, + { + "epoch": 2.1, + "learning_rate": 6.160139001617597e-05, + "loss": 1.5291, + "step": 26712 + }, + { + "epoch": 2.1, + "learning_rate": 6.15914049418672e-05, + "loss": 1.5077, + "step": 26713 + }, + { + "epoch": 2.1, + "learning_rate": 6.158142046780396e-05, + "loss": 1.459, + "step": 26714 + }, + { + "epoch": 2.1, + "learning_rate": 6.157143659405412e-05, + "loss": 1.4186, + "step": 26715 + }, + { + "epoch": 2.1, + "learning_rate": 6.156145332068545e-05, + "loss": 1.4651, + "step": 26716 + }, + { + "epoch": 2.1, + "learning_rate": 6.15514706477657e-05, + "loss": 1.4465, + "step": 26717 + }, + { + "epoch": 2.1, + "learning_rate": 6.154148857536261e-05, + "loss": 1.464, + "step": 26718 + }, + { + "epoch": 2.1, + "learning_rate": 6.153150710354403e-05, + "loss": 1.4551, + "step": 26719 + }, + { + "epoch": 2.1, + "learning_rate": 6.152152623237771e-05, + "loss": 1.4867, + "step": 26720 + }, + { + "epoch": 2.1, + "learning_rate": 6.151154596193133e-05, + "loss": 1.4172, + "step": 26721 + }, + { + "epoch": 2.1, + "learning_rate": 6.150156629227279e-05, + "loss": 1.447, + "step": 26722 + }, + { + "epoch": 2.1, + "learning_rate": 6.149158722346977e-05, + "loss": 1.4921, + "step": 26723 + }, + { + "epoch": 2.1, + "learning_rate": 6.148160875558998e-05, + "loss": 1.4365, + "step": 26724 + }, + { + "epoch": 2.1, + "learning_rate": 6.147163088870127e-05, + "loss": 1.4825, + "step": 26725 + }, + { + "epoch": 2.1, + "learning_rate": 6.146165362287128e-05, + "loss": 1.4498, + "step": 26726 + }, + { + "epoch": 2.1, + "learning_rate": 6.145167695816787e-05, + "loss": 1.4566, + "step": 26727 + }, + { + "epoch": 2.1, + "learning_rate": 6.144170089465865e-05, + "loss": 1.4651, + "step": 26728 + }, + { + "epoch": 2.1, + "learning_rate": 6.143172543241144e-05, + "loss": 1.4144, + "step": 26729 + }, + { + "epoch": 2.1, + "learning_rate": 6.142175057149396e-05, + "loss": 1.4563, + "step": 26730 + }, + { + "epoch": 2.1, + "learning_rate": 6.141177631197385e-05, + "loss": 1.4688, + "step": 26731 + }, + { + "epoch": 2.1, + "learning_rate": 6.140180265391895e-05, + "loss": 1.4502, + "step": 26732 + }, + { + "epoch": 2.1, + "learning_rate": 6.139182959739692e-05, + "loss": 1.4782, + "step": 26733 + }, + { + "epoch": 2.1, + "learning_rate": 6.138185714247545e-05, + "loss": 1.4743, + "step": 26734 + }, + { + "epoch": 2.1, + "learning_rate": 6.137188528922224e-05, + "loss": 1.4717, + "step": 26735 + }, + { + "epoch": 2.1, + "learning_rate": 6.136191403770505e-05, + "loss": 1.4026, + "step": 26736 + }, + { + "epoch": 2.1, + "learning_rate": 6.135194338799156e-05, + "loss": 1.4782, + "step": 26737 + }, + { + "epoch": 2.1, + "learning_rate": 6.13419733401494e-05, + "loss": 1.4483, + "step": 26738 + }, + { + "epoch": 2.1, + "learning_rate": 6.133200389424638e-05, + "loss": 1.4046, + "step": 26739 + }, + { + "epoch": 2.1, + "learning_rate": 6.132203505035011e-05, + "loss": 1.4719, + "step": 26740 + }, + { + "epoch": 2.1, + "learning_rate": 6.131206680852823e-05, + "loss": 1.4734, + "step": 26741 + }, + { + "epoch": 2.1, + "learning_rate": 6.130209916884847e-05, + "loss": 1.489, + "step": 26742 + }, + { + "epoch": 2.1, + "learning_rate": 6.129213213137857e-05, + "loss": 1.4175, + "step": 26743 + }, + { + "epoch": 2.1, + "learning_rate": 6.128216569618614e-05, + "loss": 1.4407, + "step": 26744 + }, + { + "epoch": 2.1, + "learning_rate": 6.12721998633388e-05, + "loss": 1.4636, + "step": 26745 + }, + { + "epoch": 2.1, + "learning_rate": 6.126223463290429e-05, + "loss": 1.3967, + "step": 26746 + }, + { + "epoch": 2.1, + "learning_rate": 6.125227000495027e-05, + "loss": 1.4899, + "step": 26747 + }, + { + "epoch": 2.1, + "learning_rate": 6.12423059795443e-05, + "loss": 1.4523, + "step": 26748 + }, + { + "epoch": 2.1, + "learning_rate": 6.123234255675412e-05, + "loss": 1.4773, + "step": 26749 + }, + { + "epoch": 2.1, + "learning_rate": 6.122237973664736e-05, + "loss": 1.4904, + "step": 26750 + }, + { + "epoch": 2.1, + "learning_rate": 6.12124175192916e-05, + "loss": 1.545, + "step": 26751 + }, + { + "epoch": 2.1, + "learning_rate": 6.12024559047546e-05, + "loss": 1.4689, + "step": 26752 + }, + { + "epoch": 2.1, + "learning_rate": 6.11924948931039e-05, + "loss": 1.443, + "step": 26753 + }, + { + "epoch": 2.11, + "learning_rate": 6.118253448440714e-05, + "loss": 1.4758, + "step": 26754 + }, + { + "epoch": 2.11, + "learning_rate": 6.117257467873193e-05, + "loss": 1.4495, + "step": 26755 + }, + { + "epoch": 2.11, + "learning_rate": 6.116261547614597e-05, + "loss": 1.4677, + "step": 26756 + }, + { + "epoch": 2.11, + "learning_rate": 6.115265687671676e-05, + "loss": 1.4371, + "step": 26757 + }, + { + "epoch": 2.11, + "learning_rate": 6.114269888051203e-05, + "loss": 1.4328, + "step": 26758 + }, + { + "epoch": 2.11, + "learning_rate": 6.11327414875993e-05, + "loss": 1.4649, + "step": 26759 + }, + { + "epoch": 2.11, + "learning_rate": 6.112278469804626e-05, + "loss": 1.4364, + "step": 26760 + }, + { + "epoch": 2.11, + "learning_rate": 6.111282851192048e-05, + "loss": 1.4496, + "step": 26761 + }, + { + "epoch": 2.11, + "learning_rate": 6.110287292928945e-05, + "loss": 1.47, + "step": 26762 + }, + { + "epoch": 2.11, + "learning_rate": 6.109291795022094e-05, + "loss": 1.4864, + "step": 26763 + }, + { + "epoch": 2.11, + "learning_rate": 6.108296357478246e-05, + "loss": 1.4426, + "step": 26764 + }, + { + "epoch": 2.11, + "learning_rate": 6.107300980304153e-05, + "loss": 1.4674, + "step": 26765 + }, + { + "epoch": 2.11, + "learning_rate": 6.106305663506584e-05, + "loss": 1.4569, + "step": 26766 + }, + { + "epoch": 2.11, + "learning_rate": 6.10531040709229e-05, + "loss": 1.4797, + "step": 26767 + }, + { + "epoch": 2.11, + "learning_rate": 6.104315211068027e-05, + "loss": 1.4134, + "step": 26768 + }, + { + "epoch": 2.11, + "learning_rate": 6.103320075440559e-05, + "loss": 1.4139, + "step": 26769 + }, + { + "epoch": 2.11, + "learning_rate": 6.102325000216638e-05, + "loss": 1.457, + "step": 26770 + }, + { + "epoch": 2.11, + "learning_rate": 6.1013299854030196e-05, + "loss": 1.4548, + "step": 26771 + }, + { + "epoch": 2.11, + "learning_rate": 6.1003350310064545e-05, + "loss": 1.4527, + "step": 26772 + }, + { + "epoch": 2.11, + "learning_rate": 6.099340137033704e-05, + "loss": 1.4983, + "step": 26773 + }, + { + "epoch": 2.11, + "learning_rate": 6.0983453034915275e-05, + "loss": 1.4195, + "step": 26774 + }, + { + "epoch": 2.11, + "learning_rate": 6.097350530386674e-05, + "loss": 1.4714, + "step": 26775 + }, + { + "epoch": 2.11, + "learning_rate": 6.096355817725891e-05, + "loss": 1.4614, + "step": 26776 + }, + { + "epoch": 2.11, + "learning_rate": 6.095361165515945e-05, + "loss": 1.4223, + "step": 26777 + }, + { + "epoch": 2.11, + "learning_rate": 6.094366573763583e-05, + "loss": 1.4405, + "step": 26778 + }, + { + "epoch": 2.11, + "learning_rate": 6.093372042475552e-05, + "loss": 1.4823, + "step": 26779 + }, + { + "epoch": 2.11, + "learning_rate": 6.0923775716586146e-05, + "loss": 1.4427, + "step": 26780 + }, + { + "epoch": 2.11, + "learning_rate": 6.0913831613195175e-05, + "loss": 1.5158, + "step": 26781 + }, + { + "epoch": 2.11, + "learning_rate": 6.090388811465009e-05, + "loss": 1.4502, + "step": 26782 + }, + { + "epoch": 2.11, + "learning_rate": 6.0893945221018475e-05, + "loss": 1.4586, + "step": 26783 + }, + { + "epoch": 2.11, + "learning_rate": 6.088400293236781e-05, + "loss": 1.4643, + "step": 26784 + }, + { + "epoch": 2.11, + "learning_rate": 6.087406124876552e-05, + "loss": 1.4702, + "step": 26785 + }, + { + "epoch": 2.11, + "learning_rate": 6.0864120170279223e-05, + "loss": 1.4939, + "step": 26786 + }, + { + "epoch": 2.11, + "learning_rate": 6.085417969697638e-05, + "loss": 1.4703, + "step": 26787 + }, + { + "epoch": 2.11, + "learning_rate": 6.084423982892438e-05, + "loss": 1.466, + "step": 26788 + }, + { + "epoch": 2.11, + "learning_rate": 6.083430056619082e-05, + "loss": 1.474, + "step": 26789 + }, + { + "epoch": 2.11, + "learning_rate": 6.082436190884319e-05, + "loss": 1.506, + "step": 26790 + }, + { + "epoch": 2.11, + "learning_rate": 6.081442385694894e-05, + "loss": 1.4333, + "step": 26791 + }, + { + "epoch": 2.11, + "learning_rate": 6.080448641057547e-05, + "loss": 1.4539, + "step": 26792 + }, + { + "epoch": 2.11, + "learning_rate": 6.079454956979038e-05, + "loss": 1.4573, + "step": 26793 + }, + { + "epoch": 2.11, + "learning_rate": 6.078461333466107e-05, + "loss": 1.5236, + "step": 26794 + }, + { + "epoch": 2.11, + "learning_rate": 6.0774677705255004e-05, + "loss": 1.4498, + "step": 26795 + }, + { + "epoch": 2.11, + "learning_rate": 6.076474268163958e-05, + "loss": 1.4796, + "step": 26796 + }, + { + "epoch": 2.11, + "learning_rate": 6.0754808263882366e-05, + "loss": 1.4996, + "step": 26797 + }, + { + "epoch": 2.11, + "learning_rate": 6.074487445205075e-05, + "loss": 1.4523, + "step": 26798 + }, + { + "epoch": 2.11, + "learning_rate": 6.0734941246212134e-05, + "loss": 1.5089, + "step": 26799 + }, + { + "epoch": 2.11, + "learning_rate": 6.072500864643404e-05, + "loss": 1.4338, + "step": 26800 + }, + { + "epoch": 2.11, + "learning_rate": 6.071507665278389e-05, + "loss": 1.4667, + "step": 26801 + }, + { + "epoch": 2.11, + "learning_rate": 6.070514526532904e-05, + "loss": 1.4656, + "step": 26802 + }, + { + "epoch": 2.11, + "learning_rate": 6.069521448413704e-05, + "loss": 1.4841, + "step": 26803 + }, + { + "epoch": 2.11, + "learning_rate": 6.068528430927518e-05, + "loss": 1.5121, + "step": 26804 + }, + { + "epoch": 2.11, + "learning_rate": 6.067535474081102e-05, + "loss": 1.4047, + "step": 26805 + }, + { + "epoch": 2.11, + "learning_rate": 6.066542577881185e-05, + "loss": 1.3924, + "step": 26806 + }, + { + "epoch": 2.11, + "learning_rate": 6.065549742334519e-05, + "loss": 1.4338, + "step": 26807 + }, + { + "epoch": 2.11, + "learning_rate": 6.06455696744784e-05, + "loss": 1.445, + "step": 26808 + }, + { + "epoch": 2.11, + "learning_rate": 6.0635642532278825e-05, + "loss": 1.468, + "step": 26809 + }, + { + "epoch": 2.11, + "learning_rate": 6.0625715996813986e-05, + "loss": 1.4397, + "step": 26810 + }, + { + "epoch": 2.11, + "learning_rate": 6.0615790068151196e-05, + "loss": 1.4909, + "step": 26811 + }, + { + "epoch": 2.11, + "learning_rate": 6.060586474635789e-05, + "loss": 1.4624, + "step": 26812 + }, + { + "epoch": 2.11, + "learning_rate": 6.0595940031501355e-05, + "loss": 1.4446, + "step": 26813 + }, + { + "epoch": 2.11, + "learning_rate": 6.0586015923649103e-05, + "loss": 1.3941, + "step": 26814 + }, + { + "epoch": 2.11, + "learning_rate": 6.057609242286848e-05, + "loss": 1.4836, + "step": 26815 + }, + { + "epoch": 2.11, + "learning_rate": 6.0566169529226766e-05, + "loss": 1.5024, + "step": 26816 + }, + { + "epoch": 2.11, + "learning_rate": 6.055624724279148e-05, + "loss": 1.4696, + "step": 26817 + }, + { + "epoch": 2.11, + "learning_rate": 6.05463255636299e-05, + "loss": 1.4171, + "step": 26818 + }, + { + "epoch": 2.11, + "learning_rate": 6.053640449180936e-05, + "loss": 1.4913, + "step": 26819 + }, + { + "epoch": 2.11, + "learning_rate": 6.052648402739726e-05, + "loss": 1.4111, + "step": 26820 + }, + { + "epoch": 2.11, + "learning_rate": 6.0516564170461014e-05, + "loss": 1.4737, + "step": 26821 + }, + { + "epoch": 2.11, + "learning_rate": 6.050664492106792e-05, + "loss": 1.4494, + "step": 26822 + }, + { + "epoch": 2.11, + "learning_rate": 6.049672627928526e-05, + "loss": 1.4407, + "step": 26823 + }, + { + "epoch": 2.11, + "learning_rate": 6.0486808245180504e-05, + "loss": 1.4775, + "step": 26824 + }, + { + "epoch": 2.11, + "learning_rate": 6.047689081882091e-05, + "loss": 1.4963, + "step": 26825 + }, + { + "epoch": 2.11, + "learning_rate": 6.046697400027377e-05, + "loss": 1.4817, + "step": 26826 + }, + { + "epoch": 2.11, + "learning_rate": 6.045705778960653e-05, + "loss": 1.4151, + "step": 26827 + }, + { + "epoch": 2.11, + "learning_rate": 6.044714218688644e-05, + "loss": 1.457, + "step": 26828 + }, + { + "epoch": 2.11, + "learning_rate": 6.043722719218085e-05, + "loss": 1.4622, + "step": 26829 + }, + { + "epoch": 2.11, + "learning_rate": 6.0427312805556986e-05, + "loss": 1.487, + "step": 26830 + }, + { + "epoch": 2.11, + "learning_rate": 6.0417399027082326e-05, + "loss": 1.4734, + "step": 26831 + }, + { + "epoch": 2.11, + "learning_rate": 6.040748585682406e-05, + "loss": 1.4664, + "step": 26832 + }, + { + "epoch": 2.11, + "learning_rate": 6.039757329484949e-05, + "loss": 1.5012, + "step": 26833 + }, + { + "epoch": 2.11, + "learning_rate": 6.038766134122599e-05, + "loss": 1.4607, + "step": 26834 + }, + { + "epoch": 2.11, + "learning_rate": 6.037774999602082e-05, + "loss": 1.4989, + "step": 26835 + }, + { + "epoch": 2.11, + "learning_rate": 6.036783925930123e-05, + "loss": 1.4779, + "step": 26836 + }, + { + "epoch": 2.11, + "learning_rate": 6.035792913113454e-05, + "loss": 1.463, + "step": 26837 + }, + { + "epoch": 2.11, + "learning_rate": 6.034801961158808e-05, + "loss": 1.4409, + "step": 26838 + }, + { + "epoch": 2.11, + "learning_rate": 6.033811070072911e-05, + "loss": 1.4561, + "step": 26839 + }, + { + "epoch": 2.11, + "learning_rate": 6.032820239862484e-05, + "loss": 1.3805, + "step": 26840 + }, + { + "epoch": 2.11, + "learning_rate": 6.031829470534263e-05, + "loss": 1.4626, + "step": 26841 + }, + { + "epoch": 2.11, + "learning_rate": 6.030838762094972e-05, + "loss": 1.4856, + "step": 26842 + }, + { + "epoch": 2.11, + "learning_rate": 6.02984811455133e-05, + "loss": 1.4212, + "step": 26843 + }, + { + "epoch": 2.11, + "learning_rate": 6.028857527910076e-05, + "loss": 1.4824, + "step": 26844 + }, + { + "epoch": 2.11, + "learning_rate": 6.027867002177928e-05, + "loss": 1.4404, + "step": 26845 + }, + { + "epoch": 2.11, + "learning_rate": 6.026876537361611e-05, + "loss": 1.4337, + "step": 26846 + }, + { + "epoch": 2.11, + "learning_rate": 6.025886133467845e-05, + "loss": 1.4108, + "step": 26847 + }, + { + "epoch": 2.11, + "learning_rate": 6.0248957905033665e-05, + "loss": 1.4438, + "step": 26848 + }, + { + "epoch": 2.11, + "learning_rate": 6.0239055084748913e-05, + "loss": 1.5278, + "step": 26849 + }, + { + "epoch": 2.11, + "learning_rate": 6.02291528738914e-05, + "loss": 1.514, + "step": 26850 + }, + { + "epoch": 2.11, + "learning_rate": 6.02192512725284e-05, + "loss": 1.4844, + "step": 26851 + }, + { + "epoch": 2.11, + "learning_rate": 6.020935028072719e-05, + "loss": 1.4314, + "step": 26852 + }, + { + "epoch": 2.11, + "learning_rate": 6.019944989855493e-05, + "loss": 1.4695, + "step": 26853 + }, + { + "epoch": 2.11, + "learning_rate": 6.018955012607881e-05, + "loss": 1.5043, + "step": 26854 + }, + { + "epoch": 2.11, + "learning_rate": 6.017965096336613e-05, + "loss": 1.4415, + "step": 26855 + }, + { + "epoch": 2.11, + "learning_rate": 6.0169752410484055e-05, + "loss": 1.4453, + "step": 26856 + }, + { + "epoch": 2.11, + "learning_rate": 6.015985446749973e-05, + "loss": 1.4459, + "step": 26857 + }, + { + "epoch": 2.11, + "learning_rate": 6.014995713448048e-05, + "loss": 1.469, + "step": 26858 + }, + { + "epoch": 2.11, + "learning_rate": 6.0140060411493425e-05, + "loss": 1.4246, + "step": 26859 + }, + { + "epoch": 2.11, + "learning_rate": 6.013016429860572e-05, + "loss": 1.4535, + "step": 26860 + }, + { + "epoch": 2.11, + "learning_rate": 6.0120268795884666e-05, + "loss": 1.4324, + "step": 26861 + }, + { + "epoch": 2.11, + "learning_rate": 6.011037390339738e-05, + "loss": 1.3968, + "step": 26862 + }, + { + "epoch": 2.11, + "learning_rate": 6.0100479621211e-05, + "loss": 1.408, + "step": 26863 + }, + { + "epoch": 2.11, + "learning_rate": 6.009058594939281e-05, + "loss": 1.4342, + "step": 26864 + }, + { + "epoch": 2.11, + "learning_rate": 6.008069288800992e-05, + "loss": 1.431, + "step": 26865 + }, + { + "epoch": 2.11, + "learning_rate": 6.00708004371295e-05, + "loss": 1.4649, + "step": 26866 + }, + { + "epoch": 2.11, + "learning_rate": 6.006090859681862e-05, + "loss": 1.4547, + "step": 26867 + }, + { + "epoch": 2.11, + "learning_rate": 6.0051017367144654e-05, + "loss": 1.3959, + "step": 26868 + }, + { + "epoch": 2.11, + "learning_rate": 6.004112674817462e-05, + "loss": 1.4762, + "step": 26869 + }, + { + "epoch": 2.11, + "learning_rate": 6.003123673997571e-05, + "loss": 1.4862, + "step": 26870 + }, + { + "epoch": 2.11, + "learning_rate": 6.002134734261499e-05, + "loss": 1.4487, + "step": 26871 + }, + { + "epoch": 2.11, + "learning_rate": 6.001145855615972e-05, + "loss": 1.4827, + "step": 26872 + }, + { + "epoch": 2.11, + "learning_rate": 6.000157038067698e-05, + "loss": 1.418, + "step": 26873 + }, + { + "epoch": 2.11, + "learning_rate": 5.9991682816233875e-05, + "loss": 1.4418, + "step": 26874 + }, + { + "epoch": 2.11, + "learning_rate": 5.9981795862897626e-05, + "loss": 1.4815, + "step": 26875 + }, + { + "epoch": 2.11, + "learning_rate": 5.997190952073528e-05, + "loss": 1.4397, + "step": 26876 + }, + { + "epoch": 2.11, + "learning_rate": 5.996202378981397e-05, + "loss": 1.3879, + "step": 26877 + }, + { + "epoch": 2.11, + "learning_rate": 5.9952138670200856e-05, + "loss": 1.4393, + "step": 26878 + }, + { + "epoch": 2.11, + "learning_rate": 5.9942254161963045e-05, + "loss": 1.4496, + "step": 26879 + }, + { + "epoch": 2.11, + "learning_rate": 5.993237026516758e-05, + "loss": 1.4736, + "step": 26880 + }, + { + "epoch": 2.12, + "learning_rate": 5.992248697988166e-05, + "loss": 1.4365, + "step": 26881 + }, + { + "epoch": 2.12, + "learning_rate": 5.991260430617234e-05, + "loss": 1.4561, + "step": 26882 + }, + { + "epoch": 2.12, + "learning_rate": 5.9902722244106674e-05, + "loss": 1.4174, + "step": 26883 + }, + { + "epoch": 2.12, + "learning_rate": 5.989284079375181e-05, + "loss": 1.4648, + "step": 26884 + }, + { + "epoch": 2.12, + "learning_rate": 5.9882959955174874e-05, + "loss": 1.4571, + "step": 26885 + }, + { + "epoch": 2.12, + "learning_rate": 5.987307972844293e-05, + "loss": 1.46, + "step": 26886 + }, + { + "epoch": 2.12, + "learning_rate": 5.9863200113623025e-05, + "loss": 1.4948, + "step": 26887 + }, + { + "epoch": 2.12, + "learning_rate": 5.985332111078218e-05, + "loss": 1.4555, + "step": 26888 + }, + { + "epoch": 2.12, + "learning_rate": 5.984344271998762e-05, + "loss": 1.4595, + "step": 26889 + }, + { + "epoch": 2.12, + "learning_rate": 5.983356494130632e-05, + "loss": 1.4406, + "step": 26890 + }, + { + "epoch": 2.12, + "learning_rate": 5.9823687774805295e-05, + "loss": 1.4682, + "step": 26891 + }, + { + "epoch": 2.12, + "learning_rate": 5.981381122055172e-05, + "loss": 1.4646, + "step": 26892 + }, + { + "epoch": 2.12, + "learning_rate": 5.980393527861261e-05, + "loss": 1.496, + "step": 26893 + }, + { + "epoch": 2.12, + "learning_rate": 5.9794059949054954e-05, + "loss": 1.4664, + "step": 26894 + }, + { + "epoch": 2.12, + "learning_rate": 5.97841852319459e-05, + "loss": 1.4553, + "step": 26895 + }, + { + "epoch": 2.12, + "learning_rate": 5.977431112735243e-05, + "loss": 1.5042, + "step": 26896 + }, + { + "epoch": 2.12, + "learning_rate": 5.976443763534155e-05, + "loss": 1.4294, + "step": 26897 + }, + { + "epoch": 2.12, + "learning_rate": 5.975456475598035e-05, + "loss": 1.4579, + "step": 26898 + }, + { + "epoch": 2.12, + "learning_rate": 5.9744692489335896e-05, + "loss": 1.4247, + "step": 26899 + }, + { + "epoch": 2.12, + "learning_rate": 5.973482083547518e-05, + "loss": 1.4495, + "step": 26900 + }, + { + "epoch": 2.12, + "learning_rate": 5.972494979446516e-05, + "loss": 1.5311, + "step": 26901 + }, + { + "epoch": 2.12, + "learning_rate": 5.9715079366372984e-05, + "loss": 1.4634, + "step": 26902 + }, + { + "epoch": 2.12, + "learning_rate": 5.970520955126557e-05, + "loss": 1.4611, + "step": 26903 + }, + { + "epoch": 2.12, + "learning_rate": 5.969534034920991e-05, + "loss": 1.4431, + "step": 26904 + }, + { + "epoch": 2.12, + "learning_rate": 5.968547176027313e-05, + "loss": 1.465, + "step": 26905 + }, + { + "epoch": 2.12, + "learning_rate": 5.967560378452213e-05, + "loss": 1.4335, + "step": 26906 + }, + { + "epoch": 2.12, + "learning_rate": 5.9665736422023946e-05, + "loss": 1.4708, + "step": 26907 + }, + { + "epoch": 2.12, + "learning_rate": 5.965586967284551e-05, + "loss": 1.4932, + "step": 26908 + }, + { + "epoch": 2.12, + "learning_rate": 5.964600353705391e-05, + "loss": 1.482, + "step": 26909 + }, + { + "epoch": 2.12, + "learning_rate": 5.9636138014716087e-05, + "loss": 1.4573, + "step": 26910 + }, + { + "epoch": 2.12, + "learning_rate": 5.962627310589896e-05, + "loss": 1.4864, + "step": 26911 + }, + { + "epoch": 2.12, + "learning_rate": 5.961640881066963e-05, + "loss": 1.4803, + "step": 26912 + }, + { + "epoch": 2.12, + "learning_rate": 5.960654512909499e-05, + "loss": 1.4366, + "step": 26913 + }, + { + "epoch": 2.12, + "learning_rate": 5.9596682061242e-05, + "loss": 1.4655, + "step": 26914 + }, + { + "epoch": 2.12, + "learning_rate": 5.958681960717763e-05, + "loss": 1.4809, + "step": 26915 + }, + { + "epoch": 2.12, + "learning_rate": 5.957695776696892e-05, + "loss": 1.4473, + "step": 26916 + }, + { + "epoch": 2.12, + "learning_rate": 5.956709654068276e-05, + "loss": 1.49, + "step": 26917 + }, + { + "epoch": 2.12, + "learning_rate": 5.955723592838607e-05, + "loss": 1.4787, + "step": 26918 + }, + { + "epoch": 2.12, + "learning_rate": 5.954737593014588e-05, + "loss": 1.4459, + "step": 26919 + }, + { + "epoch": 2.12, + "learning_rate": 5.95375165460291e-05, + "loss": 1.4729, + "step": 26920 + }, + { + "epoch": 2.12, + "learning_rate": 5.9527657776102596e-05, + "loss": 1.4641, + "step": 26921 + }, + { + "epoch": 2.12, + "learning_rate": 5.951779962043343e-05, + "loss": 1.4835, + "step": 26922 + }, + { + "epoch": 2.12, + "learning_rate": 5.950794207908847e-05, + "loss": 1.4582, + "step": 26923 + }, + { + "epoch": 2.12, + "learning_rate": 5.949808515213465e-05, + "loss": 1.4249, + "step": 26924 + }, + { + "epoch": 2.12, + "learning_rate": 5.948822883963883e-05, + "loss": 1.4361, + "step": 26925 + }, + { + "epoch": 2.12, + "learning_rate": 5.947837314166804e-05, + "loss": 1.452, + "step": 26926 + }, + { + "epoch": 2.12, + "learning_rate": 5.9468518058289146e-05, + "loss": 1.4558, + "step": 26927 + }, + { + "epoch": 2.12, + "learning_rate": 5.945866358956899e-05, + "loss": 1.4652, + "step": 26928 + }, + { + "epoch": 2.12, + "learning_rate": 5.944880973557462e-05, + "loss": 1.4397, + "step": 26929 + }, + { + "epoch": 2.12, + "learning_rate": 5.9438956496372784e-05, + "loss": 1.4553, + "step": 26930 + }, + { + "epoch": 2.12, + "learning_rate": 5.9429103872030534e-05, + "loss": 1.4857, + "step": 26931 + }, + { + "epoch": 2.12, + "learning_rate": 5.941925186261462e-05, + "loss": 1.4443, + "step": 26932 + }, + { + "epoch": 2.12, + "learning_rate": 5.940940046819205e-05, + "loss": 1.4266, + "step": 26933 + }, + { + "epoch": 2.12, + "learning_rate": 5.939954968882966e-05, + "loss": 1.401, + "step": 26934 + }, + { + "epoch": 2.12, + "learning_rate": 5.938969952459429e-05, + "loss": 1.4706, + "step": 26935 + }, + { + "epoch": 2.12, + "learning_rate": 5.93798499755529e-05, + "loss": 1.5073, + "step": 26936 + }, + { + "epoch": 2.12, + "learning_rate": 5.9370001041772316e-05, + "loss": 1.4676, + "step": 26937 + }, + { + "epoch": 2.12, + "learning_rate": 5.936015272331938e-05, + "loss": 1.493, + "step": 26938 + }, + { + "epoch": 2.12, + "learning_rate": 5.935030502026102e-05, + "loss": 1.4458, + "step": 26939 + }, + { + "epoch": 2.12, + "learning_rate": 5.934045793266406e-05, + "loss": 1.4494, + "step": 26940 + }, + { + "epoch": 2.12, + "learning_rate": 5.9330611460595376e-05, + "loss": 1.4478, + "step": 26941 + }, + { + "epoch": 2.12, + "learning_rate": 5.932076560412174e-05, + "loss": 1.5166, + "step": 26942 + }, + { + "epoch": 2.12, + "learning_rate": 5.931092036331012e-05, + "loss": 1.4558, + "step": 26943 + }, + { + "epoch": 2.12, + "learning_rate": 5.930107573822732e-05, + "loss": 1.461, + "step": 26944 + }, + { + "epoch": 2.12, + "learning_rate": 5.9291231728940106e-05, + "loss": 1.4722, + "step": 26945 + }, + { + "epoch": 2.12, + "learning_rate": 5.9281388335515346e-05, + "loss": 1.4091, + "step": 26946 + }, + { + "epoch": 2.12, + "learning_rate": 5.927154555801998e-05, + "loss": 1.4797, + "step": 26947 + }, + { + "epoch": 2.12, + "learning_rate": 5.926170339652073e-05, + "loss": 1.4295, + "step": 26948 + }, + { + "epoch": 2.12, + "learning_rate": 5.92518618510844e-05, + "loss": 1.4632, + "step": 26949 + }, + { + "epoch": 2.12, + "learning_rate": 5.924202092177791e-05, + "loss": 1.4639, + "step": 26950 + }, + { + "epoch": 2.12, + "learning_rate": 5.9232180608667986e-05, + "loss": 1.4219, + "step": 26951 + }, + { + "epoch": 2.12, + "learning_rate": 5.9222340911821433e-05, + "loss": 1.4335, + "step": 26952 + }, + { + "epoch": 2.12, + "learning_rate": 5.921250183130514e-05, + "loss": 1.4671, + "step": 26953 + }, + { + "epoch": 2.12, + "learning_rate": 5.920266336718585e-05, + "loss": 1.4107, + "step": 26954 + }, + { + "epoch": 2.12, + "learning_rate": 5.919282551953034e-05, + "loss": 1.5062, + "step": 26955 + }, + { + "epoch": 2.12, + "learning_rate": 5.918298828840546e-05, + "loss": 1.4407, + "step": 26956 + }, + { + "epoch": 2.12, + "learning_rate": 5.9173151673877983e-05, + "loss": 1.4686, + "step": 26957 + }, + { + "epoch": 2.12, + "learning_rate": 5.916331567601464e-05, + "loss": 1.4507, + "step": 26958 + }, + { + "epoch": 2.12, + "learning_rate": 5.91534802948823e-05, + "loss": 1.4667, + "step": 26959 + }, + { + "epoch": 2.12, + "learning_rate": 5.9143645530547676e-05, + "loss": 1.4661, + "step": 26960 + }, + { + "epoch": 2.12, + "learning_rate": 5.913381138307754e-05, + "loss": 1.447, + "step": 26961 + }, + { + "epoch": 2.12, + "learning_rate": 5.912397785253866e-05, + "loss": 1.4467, + "step": 26962 + }, + { + "epoch": 2.12, + "learning_rate": 5.911414493899787e-05, + "loss": 1.5049, + "step": 26963 + }, + { + "epoch": 2.12, + "learning_rate": 5.910431264252191e-05, + "loss": 1.4286, + "step": 26964 + }, + { + "epoch": 2.12, + "learning_rate": 5.9094480963177475e-05, + "loss": 1.4703, + "step": 26965 + }, + { + "epoch": 2.12, + "learning_rate": 5.908464990103132e-05, + "loss": 1.4551, + "step": 26966 + }, + { + "epoch": 2.12, + "learning_rate": 5.9074819456150265e-05, + "loss": 1.4593, + "step": 26967 + }, + { + "epoch": 2.12, + "learning_rate": 5.906498962860099e-05, + "loss": 1.4228, + "step": 26968 + }, + { + "epoch": 2.12, + "learning_rate": 5.905516041845023e-05, + "loss": 1.4302, + "step": 26969 + }, + { + "epoch": 2.12, + "learning_rate": 5.9045331825764784e-05, + "loss": 1.4593, + "step": 26970 + }, + { + "epoch": 2.12, + "learning_rate": 5.903550385061134e-05, + "loss": 1.4495, + "step": 26971 + }, + { + "epoch": 2.12, + "learning_rate": 5.902567649305658e-05, + "loss": 1.5098, + "step": 26972 + }, + { + "epoch": 2.12, + "learning_rate": 5.901584975316732e-05, + "loss": 1.4301, + "step": 26973 + }, + { + "epoch": 2.12, + "learning_rate": 5.900602363101023e-05, + "loss": 1.4585, + "step": 26974 + }, + { + "epoch": 2.12, + "learning_rate": 5.899619812665197e-05, + "loss": 1.403, + "step": 26975 + }, + { + "epoch": 2.12, + "learning_rate": 5.898637324015936e-05, + "loss": 1.478, + "step": 26976 + }, + { + "epoch": 2.12, + "learning_rate": 5.8976548971599e-05, + "loss": 1.4594, + "step": 26977 + }, + { + "epoch": 2.12, + "learning_rate": 5.89667253210377e-05, + "loss": 1.4218, + "step": 26978 + }, + { + "epoch": 2.12, + "learning_rate": 5.8956902288542034e-05, + "loss": 1.468, + "step": 26979 + }, + { + "epoch": 2.12, + "learning_rate": 5.8947079874178814e-05, + "loss": 1.4653, + "step": 26980 + }, + { + "epoch": 2.12, + "learning_rate": 5.893725807801469e-05, + "loss": 1.4963, + "step": 26981 + }, + { + "epoch": 2.12, + "learning_rate": 5.892743690011631e-05, + "loss": 1.4131, + "step": 26982 + }, + { + "epoch": 2.12, + "learning_rate": 5.8917616340550325e-05, + "loss": 1.5062, + "step": 26983 + }, + { + "epoch": 2.12, + "learning_rate": 5.8907796399383523e-05, + "loss": 1.4741, + "step": 26984 + }, + { + "epoch": 2.12, + "learning_rate": 5.889797707668251e-05, + "loss": 1.4978, + "step": 26985 + }, + { + "epoch": 2.12, + "learning_rate": 5.888815837251391e-05, + "loss": 1.3676, + "step": 26986 + }, + { + "epoch": 2.12, + "learning_rate": 5.88783402869445e-05, + "loss": 1.4684, + "step": 26987 + }, + { + "epoch": 2.12, + "learning_rate": 5.8868522820040854e-05, + "loss": 1.508, + "step": 26988 + }, + { + "epoch": 2.12, + "learning_rate": 5.885870597186959e-05, + "loss": 1.5134, + "step": 26989 + }, + { + "epoch": 2.12, + "learning_rate": 5.884888974249749e-05, + "loss": 1.4643, + "step": 26990 + }, + { + "epoch": 2.12, + "learning_rate": 5.883907413199112e-05, + "loss": 1.4652, + "step": 26991 + }, + { + "epoch": 2.12, + "learning_rate": 5.882925914041708e-05, + "loss": 1.4091, + "step": 26992 + }, + { + "epoch": 2.12, + "learning_rate": 5.881944476784204e-05, + "loss": 1.4547, + "step": 26993 + }, + { + "epoch": 2.12, + "learning_rate": 5.8809631014332724e-05, + "loss": 1.4487, + "step": 26994 + }, + { + "epoch": 2.12, + "learning_rate": 5.879981787995569e-05, + "loss": 1.4429, + "step": 26995 + }, + { + "epoch": 2.12, + "learning_rate": 5.87900053647775e-05, + "loss": 1.4331, + "step": 26996 + }, + { + "epoch": 2.12, + "learning_rate": 5.8780193468864894e-05, + "loss": 1.4858, + "step": 26997 + }, + { + "epoch": 2.12, + "learning_rate": 5.8770382192284454e-05, + "loss": 1.4595, + "step": 26998 + }, + { + "epoch": 2.12, + "learning_rate": 5.8760571535102746e-05, + "loss": 1.4911, + "step": 26999 + }, + { + "epoch": 2.12, + "learning_rate": 5.8750761497386366e-05, + "loss": 1.4358, + "step": 27000 + }, + { + "epoch": 2.12, + "learning_rate": 5.8740952079202033e-05, + "loss": 1.4759, + "step": 27001 + }, + { + "epoch": 2.12, + "learning_rate": 5.873114328061625e-05, + "loss": 1.4858, + "step": 27002 + }, + { + "epoch": 2.12, + "learning_rate": 5.872133510169559e-05, + "loss": 1.4655, + "step": 27003 + }, + { + "epoch": 2.12, + "learning_rate": 5.871152754250674e-05, + "loss": 1.4684, + "step": 27004 + }, + { + "epoch": 2.12, + "learning_rate": 5.870172060311626e-05, + "loss": 1.4458, + "step": 27005 + }, + { + "epoch": 2.12, + "learning_rate": 5.8691914283590654e-05, + "loss": 1.3995, + "step": 27006 + }, + { + "epoch": 2.12, + "learning_rate": 5.86821085839966e-05, + "loss": 1.4587, + "step": 27007 + }, + { + "epoch": 2.13, + "learning_rate": 5.8672303504400604e-05, + "loss": 1.465, + "step": 27008 + }, + { + "epoch": 2.13, + "learning_rate": 5.866249904486931e-05, + "loss": 1.4327, + "step": 27009 + }, + { + "epoch": 2.13, + "learning_rate": 5.865269520546919e-05, + "loss": 1.4464, + "step": 27010 + }, + { + "epoch": 2.13, + "learning_rate": 5.864289198626691e-05, + "loss": 1.4797, + "step": 27011 + }, + { + "epoch": 2.13, + "learning_rate": 5.863308938732897e-05, + "loss": 1.458, + "step": 27012 + }, + { + "epoch": 2.13, + "learning_rate": 5.862328740872191e-05, + "loss": 1.4241, + "step": 27013 + }, + { + "epoch": 2.13, + "learning_rate": 5.861348605051233e-05, + "loss": 1.4754, + "step": 27014 + }, + { + "epoch": 2.13, + "learning_rate": 5.8603685312766755e-05, + "loss": 1.4611, + "step": 27015 + }, + { + "epoch": 2.13, + "learning_rate": 5.8593885195551665e-05, + "loss": 1.4739, + "step": 27016 + }, + { + "epoch": 2.13, + "learning_rate": 5.8584085698933715e-05, + "loss": 1.4808, + "step": 27017 + }, + { + "epoch": 2.13, + "learning_rate": 5.857428682297937e-05, + "loss": 1.5123, + "step": 27018 + }, + { + "epoch": 2.13, + "learning_rate": 5.856448856775515e-05, + "loss": 1.4517, + "step": 27019 + }, + { + "epoch": 2.13, + "learning_rate": 5.855469093332757e-05, + "loss": 1.4048, + "step": 27020 + }, + { + "epoch": 2.13, + "learning_rate": 5.854489391976321e-05, + "loss": 1.4372, + "step": 27021 + }, + { + "epoch": 2.13, + "learning_rate": 5.853509752712855e-05, + "loss": 1.4501, + "step": 27022 + }, + { + "epoch": 2.13, + "learning_rate": 5.8525301755490054e-05, + "loss": 1.4744, + "step": 27023 + }, + { + "epoch": 2.13, + "learning_rate": 5.851550660491428e-05, + "loss": 1.3978, + "step": 27024 + }, + { + "epoch": 2.13, + "learning_rate": 5.850571207546779e-05, + "loss": 1.4869, + "step": 27025 + }, + { + "epoch": 2.13, + "learning_rate": 5.849591816721702e-05, + "loss": 1.4823, + "step": 27026 + }, + { + "epoch": 2.13, + "learning_rate": 5.8486124880228414e-05, + "loss": 1.4361, + "step": 27027 + }, + { + "epoch": 2.13, + "learning_rate": 5.847633221456856e-05, + "loss": 1.4536, + "step": 27028 + }, + { + "epoch": 2.13, + "learning_rate": 5.8466540170303925e-05, + "loss": 1.4482, + "step": 27029 + }, + { + "epoch": 2.13, + "learning_rate": 5.845674874750091e-05, + "loss": 1.4559, + "step": 27030 + }, + { + "epoch": 2.13, + "learning_rate": 5.84469579462261e-05, + "loss": 1.5109, + "step": 27031 + }, + { + "epoch": 2.13, + "learning_rate": 5.8437167766545925e-05, + "loss": 1.4894, + "step": 27032 + }, + { + "epoch": 2.13, + "learning_rate": 5.84273782085268e-05, + "loss": 1.4531, + "step": 27033 + }, + { + "epoch": 2.13, + "learning_rate": 5.8417589272235296e-05, + "loss": 1.4589, + "step": 27034 + }, + { + "epoch": 2.13, + "learning_rate": 5.840780095773782e-05, + "loss": 1.5049, + "step": 27035 + }, + { + "epoch": 2.13, + "learning_rate": 5.839801326510083e-05, + "loss": 1.4677, + "step": 27036 + }, + { + "epoch": 2.13, + "learning_rate": 5.838822619439073e-05, + "loss": 1.4951, + "step": 27037 + }, + { + "epoch": 2.13, + "learning_rate": 5.8378439745674074e-05, + "loss": 1.4249, + "step": 27038 + }, + { + "epoch": 2.13, + "learning_rate": 5.836865391901725e-05, + "loss": 1.4443, + "step": 27039 + }, + { + "epoch": 2.13, + "learning_rate": 5.8358868714486644e-05, + "loss": 1.443, + "step": 27040 + }, + { + "epoch": 2.13, + "learning_rate": 5.834908413214874e-05, + "loss": 1.4644, + "step": 27041 + }, + { + "epoch": 2.13, + "learning_rate": 5.833930017207004e-05, + "loss": 1.4403, + "step": 27042 + }, + { + "epoch": 2.13, + "learning_rate": 5.832951683431692e-05, + "loss": 1.4523, + "step": 27043 + }, + { + "epoch": 2.13, + "learning_rate": 5.831973411895572e-05, + "loss": 1.4424, + "step": 27044 + }, + { + "epoch": 2.13, + "learning_rate": 5.830995202605298e-05, + "loss": 1.4776, + "step": 27045 + }, + { + "epoch": 2.13, + "learning_rate": 5.8300170555675087e-05, + "loss": 1.4388, + "step": 27046 + }, + { + "epoch": 2.13, + "learning_rate": 5.829038970788838e-05, + "loss": 1.4373, + "step": 27047 + }, + { + "epoch": 2.13, + "learning_rate": 5.828060948275935e-05, + "loss": 1.4793, + "step": 27048 + }, + { + "epoch": 2.13, + "learning_rate": 5.8270829880354394e-05, + "loss": 1.4632, + "step": 27049 + }, + { + "epoch": 2.13, + "learning_rate": 5.82610509007398e-05, + "loss": 1.4227, + "step": 27050 + }, + { + "epoch": 2.13, + "learning_rate": 5.8251272543982115e-05, + "loss": 1.4793, + "step": 27051 + }, + { + "epoch": 2.13, + "learning_rate": 5.8241494810147656e-05, + "loss": 1.4823, + "step": 27052 + }, + { + "epoch": 2.13, + "learning_rate": 5.8231717699302805e-05, + "loss": 1.4874, + "step": 27053 + }, + { + "epoch": 2.13, + "learning_rate": 5.822194121151391e-05, + "loss": 1.4836, + "step": 27054 + }, + { + "epoch": 2.13, + "learning_rate": 5.8212165346847424e-05, + "loss": 1.5146, + "step": 27055 + }, + { + "epoch": 2.13, + "learning_rate": 5.8202390105369634e-05, + "loss": 1.4302, + "step": 27056 + }, + { + "epoch": 2.13, + "learning_rate": 5.819261548714696e-05, + "loss": 1.4753, + "step": 27057 + }, + { + "epoch": 2.13, + "learning_rate": 5.818284149224581e-05, + "loss": 1.5221, + "step": 27058 + }, + { + "epoch": 2.13, + "learning_rate": 5.8173068120732505e-05, + "loss": 1.3962, + "step": 27059 + }, + { + "epoch": 2.13, + "learning_rate": 5.816329537267341e-05, + "loss": 1.51, + "step": 27060 + }, + { + "epoch": 2.13, + "learning_rate": 5.815352324813477e-05, + "loss": 1.4771, + "step": 27061 + }, + { + "epoch": 2.13, + "learning_rate": 5.8143751747183094e-05, + "loss": 1.5091, + "step": 27062 + }, + { + "epoch": 2.13, + "learning_rate": 5.813398086988466e-05, + "loss": 1.442, + "step": 27063 + }, + { + "epoch": 2.13, + "learning_rate": 5.812421061630574e-05, + "loss": 1.462, + "step": 27064 + }, + { + "epoch": 2.13, + "learning_rate": 5.8114440986512775e-05, + "loss": 1.4809, + "step": 27065 + }, + { + "epoch": 2.13, + "learning_rate": 5.8104671980572056e-05, + "loss": 1.4367, + "step": 27066 + }, + { + "epoch": 2.13, + "learning_rate": 5.8094903598549855e-05, + "loss": 1.5339, + "step": 27067 + }, + { + "epoch": 2.13, + "learning_rate": 5.808513584051258e-05, + "loss": 1.4809, + "step": 27068 + }, + { + "epoch": 2.13, + "learning_rate": 5.807536870652652e-05, + "loss": 1.4545, + "step": 27069 + }, + { + "epoch": 2.13, + "learning_rate": 5.806560219665792e-05, + "loss": 1.4615, + "step": 27070 + }, + { + "epoch": 2.13, + "learning_rate": 5.805583631097315e-05, + "loss": 1.4979, + "step": 27071 + }, + { + "epoch": 2.13, + "learning_rate": 5.804607104953857e-05, + "loss": 1.4864, + "step": 27072 + }, + { + "epoch": 2.13, + "learning_rate": 5.8036306412420405e-05, + "loss": 1.4267, + "step": 27073 + }, + { + "epoch": 2.13, + "learning_rate": 5.8026542399684936e-05, + "loss": 1.4676, + "step": 27074 + }, + { + "epoch": 2.13, + "learning_rate": 5.801677901139855e-05, + "loss": 1.4619, + "step": 27075 + }, + { + "epoch": 2.13, + "learning_rate": 5.800701624762746e-05, + "loss": 1.4532, + "step": 27076 + }, + { + "epoch": 2.13, + "learning_rate": 5.799725410843796e-05, + "loss": 1.4252, + "step": 27077 + }, + { + "epoch": 2.13, + "learning_rate": 5.7987492593896275e-05, + "loss": 1.434, + "step": 27078 + }, + { + "epoch": 2.13, + "learning_rate": 5.7977731704068806e-05, + "loss": 1.4241, + "step": 27079 + }, + { + "epoch": 2.13, + "learning_rate": 5.796797143902174e-05, + "loss": 1.4824, + "step": 27080 + }, + { + "epoch": 2.13, + "learning_rate": 5.795821179882132e-05, + "loss": 1.4433, + "step": 27081 + }, + { + "epoch": 2.13, + "learning_rate": 5.7948452783533914e-05, + "loss": 1.4817, + "step": 27082 + }, + { + "epoch": 2.13, + "learning_rate": 5.79386943932257e-05, + "loss": 1.4245, + "step": 27083 + }, + { + "epoch": 2.13, + "learning_rate": 5.7928936627962904e-05, + "loss": 1.3966, + "step": 27084 + }, + { + "epoch": 2.13, + "learning_rate": 5.791917948781185e-05, + "loss": 1.4252, + "step": 27085 + }, + { + "epoch": 2.13, + "learning_rate": 5.790942297283878e-05, + "loss": 1.4571, + "step": 27086 + }, + { + "epoch": 2.13, + "learning_rate": 5.789966708310984e-05, + "loss": 1.4312, + "step": 27087 + }, + { + "epoch": 2.13, + "learning_rate": 5.788991181869134e-05, + "loss": 1.4545, + "step": 27088 + }, + { + "epoch": 2.13, + "learning_rate": 5.788015717964956e-05, + "loss": 1.4625, + "step": 27089 + }, + { + "epoch": 2.13, + "learning_rate": 5.7870403166050674e-05, + "loss": 1.4477, + "step": 27090 + }, + { + "epoch": 2.13, + "learning_rate": 5.786064977796085e-05, + "loss": 1.4534, + "step": 27091 + }, + { + "epoch": 2.13, + "learning_rate": 5.785089701544644e-05, + "loss": 1.4206, + "step": 27092 + }, + { + "epoch": 2.13, + "learning_rate": 5.7841144878573565e-05, + "loss": 1.4171, + "step": 27093 + }, + { + "epoch": 2.13, + "learning_rate": 5.783139336740847e-05, + "loss": 1.4161, + "step": 27094 + }, + { + "epoch": 2.13, + "learning_rate": 5.78216424820173e-05, + "loss": 1.3806, + "step": 27095 + }, + { + "epoch": 2.13, + "learning_rate": 5.781189222246637e-05, + "loss": 1.4987, + "step": 27096 + }, + { + "epoch": 2.13, + "learning_rate": 5.7802142588821806e-05, + "loss": 1.4425, + "step": 27097 + }, + { + "epoch": 2.13, + "learning_rate": 5.779239358114976e-05, + "loss": 1.4802, + "step": 27098 + }, + { + "epoch": 2.13, + "learning_rate": 5.778264519951654e-05, + "loss": 1.4203, + "step": 27099 + }, + { + "epoch": 2.13, + "learning_rate": 5.7772897443988266e-05, + "loss": 1.4832, + "step": 27100 + }, + { + "epoch": 2.13, + "learning_rate": 5.776315031463106e-05, + "loss": 1.4261, + "step": 27101 + }, + { + "epoch": 2.13, + "learning_rate": 5.775340381151123e-05, + "loss": 1.5116, + "step": 27102 + }, + { + "epoch": 2.13, + "learning_rate": 5.774365793469482e-05, + "loss": 1.4642, + "step": 27103 + }, + { + "epoch": 2.13, + "learning_rate": 5.7733912684248115e-05, + "loss": 1.4629, + "step": 27104 + }, + { + "epoch": 2.13, + "learning_rate": 5.7724168060237186e-05, + "loss": 1.4911, + "step": 27105 + }, + { + "epoch": 2.13, + "learning_rate": 5.7714424062728275e-05, + "loss": 1.4637, + "step": 27106 + }, + { + "epoch": 2.13, + "learning_rate": 5.77046806917875e-05, + "loss": 1.4182, + "step": 27107 + }, + { + "epoch": 2.13, + "learning_rate": 5.769493794748095e-05, + "loss": 1.4455, + "step": 27108 + }, + { + "epoch": 2.13, + "learning_rate": 5.7685195829874886e-05, + "loss": 1.4486, + "step": 27109 + }, + { + "epoch": 2.13, + "learning_rate": 5.7675454339035414e-05, + "loss": 1.442, + "step": 27110 + }, + { + "epoch": 2.13, + "learning_rate": 5.766571347502865e-05, + "loss": 1.4889, + "step": 27111 + }, + { + "epoch": 2.13, + "learning_rate": 5.765597323792068e-05, + "loss": 1.5033, + "step": 27112 + }, + { + "epoch": 2.13, + "learning_rate": 5.764623362777776e-05, + "loss": 1.4208, + "step": 27113 + }, + { + "epoch": 2.13, + "learning_rate": 5.763649464466593e-05, + "loss": 1.4645, + "step": 27114 + }, + { + "epoch": 2.13, + "learning_rate": 5.7626756288651286e-05, + "loss": 1.5335, + "step": 27115 + }, + { + "epoch": 2.13, + "learning_rate": 5.761701855980004e-05, + "loss": 1.4643, + "step": 27116 + }, + { + "epoch": 2.13, + "learning_rate": 5.7607281458178256e-05, + "loss": 1.403, + "step": 27117 + }, + { + "epoch": 2.13, + "learning_rate": 5.7597544983852e-05, + "loss": 1.4031, + "step": 27118 + }, + { + "epoch": 2.13, + "learning_rate": 5.758780913688742e-05, + "loss": 1.4602, + "step": 27119 + }, + { + "epoch": 2.13, + "learning_rate": 5.757807391735066e-05, + "loss": 1.522, + "step": 27120 + }, + { + "epoch": 2.13, + "learning_rate": 5.756833932530779e-05, + "loss": 1.4805, + "step": 27121 + }, + { + "epoch": 2.13, + "learning_rate": 5.755860536082482e-05, + "loss": 1.4152, + "step": 27122 + }, + { + "epoch": 2.13, + "learning_rate": 5.7548872023967974e-05, + "loss": 1.4557, + "step": 27123 + }, + { + "epoch": 2.13, + "learning_rate": 5.753913931480327e-05, + "loss": 1.4562, + "step": 27124 + }, + { + "epoch": 2.13, + "learning_rate": 5.752940723339672e-05, + "loss": 1.4991, + "step": 27125 + }, + { + "epoch": 2.13, + "learning_rate": 5.751967577981452e-05, + "loss": 1.4257, + "step": 27126 + }, + { + "epoch": 2.13, + "learning_rate": 5.75099449541227e-05, + "loss": 1.4941, + "step": 27127 + }, + { + "epoch": 2.13, + "learning_rate": 5.750021475638725e-05, + "loss": 1.5313, + "step": 27128 + }, + { + "epoch": 2.13, + "learning_rate": 5.7490485186674346e-05, + "loss": 1.4647, + "step": 27129 + }, + { + "epoch": 2.13, + "learning_rate": 5.7480756245050006e-05, + "loss": 1.4946, + "step": 27130 + }, + { + "epoch": 2.13, + "learning_rate": 5.7471027931580266e-05, + "loss": 1.4743, + "step": 27131 + }, + { + "epoch": 2.13, + "learning_rate": 5.746130024633113e-05, + "loss": 1.4775, + "step": 27132 + }, + { + "epoch": 2.13, + "learning_rate": 5.7451573189368774e-05, + "loss": 1.4541, + "step": 27133 + }, + { + "epoch": 2.13, + "learning_rate": 5.744184676075908e-05, + "loss": 1.4587, + "step": 27134 + }, + { + "epoch": 2.14, + "learning_rate": 5.743212096056824e-05, + "loss": 1.513, + "step": 27135 + }, + { + "epoch": 2.14, + "learning_rate": 5.742239578886216e-05, + "loss": 1.4379, + "step": 27136 + }, + { + "epoch": 2.14, + "learning_rate": 5.7412671245706966e-05, + "loss": 1.4389, + "step": 27137 + }, + { + "epoch": 2.14, + "learning_rate": 5.740294733116866e-05, + "loss": 1.4523, + "step": 27138 + }, + { + "epoch": 2.14, + "learning_rate": 5.7393224045313176e-05, + "loss": 1.4587, + "step": 27139 + }, + { + "epoch": 2.14, + "learning_rate": 5.7383501388206645e-05, + "loss": 1.4225, + "step": 27140 + }, + { + "epoch": 2.14, + "learning_rate": 5.7373779359915045e-05, + "loss": 1.4708, + "step": 27141 + }, + { + "epoch": 2.14, + "learning_rate": 5.73640579605043e-05, + "loss": 1.4128, + "step": 27142 + }, + { + "epoch": 2.14, + "learning_rate": 5.735433719004054e-05, + "loss": 1.4464, + "step": 27143 + }, + { + "epoch": 2.14, + "learning_rate": 5.7344617048589706e-05, + "loss": 1.4844, + "step": 27144 + }, + { + "epoch": 2.14, + "learning_rate": 5.7334897536217735e-05, + "loss": 1.4422, + "step": 27145 + }, + { + "epoch": 2.14, + "learning_rate": 5.732517865299073e-05, + "loss": 1.4046, + "step": 27146 + }, + { + "epoch": 2.14, + "learning_rate": 5.73154603989746e-05, + "loss": 1.5025, + "step": 27147 + }, + { + "epoch": 2.14, + "learning_rate": 5.730574277423536e-05, + "loss": 1.4554, + "step": 27148 + }, + { + "epoch": 2.14, + "learning_rate": 5.729602577883893e-05, + "loss": 1.4344, + "step": 27149 + }, + { + "epoch": 2.14, + "learning_rate": 5.7286309412851325e-05, + "loss": 1.472, + "step": 27150 + }, + { + "epoch": 2.14, + "learning_rate": 5.7276593676338563e-05, + "loss": 1.4339, + "step": 27151 + }, + { + "epoch": 2.14, + "learning_rate": 5.726687856936657e-05, + "loss": 1.4988, + "step": 27152 + }, + { + "epoch": 2.14, + "learning_rate": 5.7257164092001235e-05, + "loss": 1.4222, + "step": 27153 + }, + { + "epoch": 2.14, + "learning_rate": 5.7247450244308615e-05, + "loss": 1.4461, + "step": 27154 + }, + { + "epoch": 2.14, + "learning_rate": 5.723773702635465e-05, + "loss": 1.4247, + "step": 27155 + }, + { + "epoch": 2.14, + "learning_rate": 5.7228024438205184e-05, + "loss": 1.483, + "step": 27156 + }, + { + "epoch": 2.14, + "learning_rate": 5.721831247992631e-05, + "loss": 1.4499, + "step": 27157 + }, + { + "epoch": 2.14, + "learning_rate": 5.7208601151583874e-05, + "loss": 1.4842, + "step": 27158 + }, + { + "epoch": 2.14, + "learning_rate": 5.7198890453243784e-05, + "loss": 1.4122, + "step": 27159 + }, + { + "epoch": 2.14, + "learning_rate": 5.718918038497208e-05, + "loss": 1.4824, + "step": 27160 + }, + { + "epoch": 2.14, + "learning_rate": 5.71794709468346e-05, + "loss": 1.4745, + "step": 27161 + }, + { + "epoch": 2.14, + "learning_rate": 5.716976213889726e-05, + "loss": 1.4854, + "step": 27162 + }, + { + "epoch": 2.14, + "learning_rate": 5.7160053961226046e-05, + "loss": 1.5423, + "step": 27163 + }, + { + "epoch": 2.14, + "learning_rate": 5.715034641388684e-05, + "loss": 1.4465, + "step": 27164 + }, + { + "epoch": 2.14, + "learning_rate": 5.714063949694554e-05, + "loss": 1.4466, + "step": 27165 + }, + { + "epoch": 2.14, + "learning_rate": 5.713093321046795e-05, + "loss": 1.4263, + "step": 27166 + }, + { + "epoch": 2.14, + "learning_rate": 5.712122755452018e-05, + "loss": 1.4939, + "step": 27167 + }, + { + "epoch": 2.14, + "learning_rate": 5.711152252916801e-05, + "loss": 1.4634, + "step": 27168 + }, + { + "epoch": 2.14, + "learning_rate": 5.710181813447731e-05, + "loss": 1.4487, + "step": 27169 + }, + { + "epoch": 2.14, + "learning_rate": 5.7092114370514044e-05, + "loss": 1.4627, + "step": 27170 + }, + { + "epoch": 2.14, + "learning_rate": 5.708241123734403e-05, + "loss": 1.4376, + "step": 27171 + }, + { + "epoch": 2.14, + "learning_rate": 5.70727087350332e-05, + "loss": 1.482, + "step": 27172 + }, + { + "epoch": 2.14, + "learning_rate": 5.706300686364731e-05, + "loss": 1.4567, + "step": 27173 + }, + { + "epoch": 2.14, + "learning_rate": 5.70533056232524e-05, + "loss": 1.4626, + "step": 27174 + }, + { + "epoch": 2.14, + "learning_rate": 5.704360501391423e-05, + "loss": 1.4547, + "step": 27175 + }, + { + "epoch": 2.14, + "learning_rate": 5.703390503569865e-05, + "loss": 1.444, + "step": 27176 + }, + { + "epoch": 2.14, + "learning_rate": 5.702420568867158e-05, + "loss": 1.4606, + "step": 27177 + }, + { + "epoch": 2.14, + "learning_rate": 5.701450697289886e-05, + "loss": 1.3835, + "step": 27178 + }, + { + "epoch": 2.14, + "learning_rate": 5.700480888844628e-05, + "loss": 1.427, + "step": 27179 + }, + { + "epoch": 2.14, + "learning_rate": 5.699511143537977e-05, + "loss": 1.4621, + "step": 27180 + }, + { + "epoch": 2.14, + "learning_rate": 5.6985414613765085e-05, + "loss": 1.4558, + "step": 27181 + }, + { + "epoch": 2.14, + "learning_rate": 5.6975718423668153e-05, + "loss": 1.3981, + "step": 27182 + }, + { + "epoch": 2.14, + "learning_rate": 5.696602286515471e-05, + "loss": 1.4852, + "step": 27183 + }, + { + "epoch": 2.14, + "learning_rate": 5.695632793829066e-05, + "loss": 1.4367, + "step": 27184 + }, + { + "epoch": 2.14, + "learning_rate": 5.694663364314183e-05, + "loss": 1.4527, + "step": 27185 + }, + { + "epoch": 2.14, + "learning_rate": 5.693693997977394e-05, + "loss": 1.4932, + "step": 27186 + }, + { + "epoch": 2.14, + "learning_rate": 5.6927246948252915e-05, + "loss": 1.4958, + "step": 27187 + }, + { + "epoch": 2.14, + "learning_rate": 5.691755454864454e-05, + "loss": 1.4931, + "step": 27188 + }, + { + "epoch": 2.14, + "learning_rate": 5.690786278101458e-05, + "loss": 1.4834, + "step": 27189 + }, + { + "epoch": 2.14, + "learning_rate": 5.689817164542883e-05, + "loss": 1.4708, + "step": 27190 + }, + { + "epoch": 2.14, + "learning_rate": 5.688848114195316e-05, + "loss": 1.4351, + "step": 27191 + }, + { + "epoch": 2.14, + "learning_rate": 5.6878791270653316e-05, + "loss": 1.4249, + "step": 27192 + }, + { + "epoch": 2.14, + "learning_rate": 5.686910203159504e-05, + "loss": 1.4609, + "step": 27193 + }, + { + "epoch": 2.14, + "learning_rate": 5.685941342484422e-05, + "loss": 1.4299, + "step": 27194 + }, + { + "epoch": 2.14, + "learning_rate": 5.684972545046659e-05, + "loss": 1.5034, + "step": 27195 + }, + { + "epoch": 2.14, + "learning_rate": 5.6840038108527847e-05, + "loss": 1.394, + "step": 27196 + }, + { + "epoch": 2.14, + "learning_rate": 5.6830351399093854e-05, + "loss": 1.4616, + "step": 27197 + }, + { + "epoch": 2.14, + "learning_rate": 5.682066532223041e-05, + "loss": 1.501, + "step": 27198 + }, + { + "epoch": 2.14, + "learning_rate": 5.681097987800322e-05, + "loss": 1.4552, + "step": 27199 + }, + { + "epoch": 2.14, + "learning_rate": 5.6801295066478006e-05, + "loss": 1.4769, + "step": 27200 + }, + { + "epoch": 2.14, + "learning_rate": 5.6791610887720616e-05, + "loss": 1.4454, + "step": 27201 + }, + { + "epoch": 2.14, + "learning_rate": 5.678192734179676e-05, + "loss": 1.403, + "step": 27202 + }, + { + "epoch": 2.14, + "learning_rate": 5.677224442877211e-05, + "loss": 1.4906, + "step": 27203 + }, + { + "epoch": 2.14, + "learning_rate": 5.676256214871253e-05, + "loss": 1.4573, + "step": 27204 + }, + { + "epoch": 2.14, + "learning_rate": 5.67528805016837e-05, + "loss": 1.4453, + "step": 27205 + }, + { + "epoch": 2.14, + "learning_rate": 5.674319948775136e-05, + "loss": 1.4641, + "step": 27206 + }, + { + "epoch": 2.14, + "learning_rate": 5.6733519106981176e-05, + "loss": 1.4609, + "step": 27207 + }, + { + "epoch": 2.14, + "learning_rate": 5.672383935943898e-05, + "loss": 1.4433, + "step": 27208 + }, + { + "epoch": 2.14, + "learning_rate": 5.6714160245190435e-05, + "loss": 1.4501, + "step": 27209 + }, + { + "epoch": 2.14, + "learning_rate": 5.670448176430123e-05, + "loss": 1.4519, + "step": 27210 + }, + { + "epoch": 2.14, + "learning_rate": 5.669480391683714e-05, + "loss": 1.4405, + "step": 27211 + }, + { + "epoch": 2.14, + "learning_rate": 5.668512670286385e-05, + "loss": 1.4193, + "step": 27212 + }, + { + "epoch": 2.14, + "learning_rate": 5.6675450122446994e-05, + "loss": 1.5023, + "step": 27213 + }, + { + "epoch": 2.14, + "learning_rate": 5.666577417565234e-05, + "loss": 1.4784, + "step": 27214 + }, + { + "epoch": 2.14, + "learning_rate": 5.6656098862545626e-05, + "loss": 1.456, + "step": 27215 + }, + { + "epoch": 2.14, + "learning_rate": 5.664642418319248e-05, + "loss": 1.4333, + "step": 27216 + }, + { + "epoch": 2.14, + "learning_rate": 5.663675013765855e-05, + "loss": 1.4918, + "step": 27217 + }, + { + "epoch": 2.14, + "learning_rate": 5.662707672600961e-05, + "loss": 1.3908, + "step": 27218 + }, + { + "epoch": 2.14, + "learning_rate": 5.66174039483113e-05, + "loss": 1.4674, + "step": 27219 + }, + { + "epoch": 2.14, + "learning_rate": 5.660773180462923e-05, + "loss": 1.5126, + "step": 27220 + }, + { + "epoch": 2.14, + "learning_rate": 5.659806029502918e-05, + "loss": 1.4369, + "step": 27221 + }, + { + "epoch": 2.14, + "learning_rate": 5.6588389419576766e-05, + "loss": 1.462, + "step": 27222 + }, + { + "epoch": 2.14, + "learning_rate": 5.657871917833761e-05, + "loss": 1.4628, + "step": 27223 + }, + { + "epoch": 2.14, + "learning_rate": 5.656904957137737e-05, + "loss": 1.4239, + "step": 27224 + }, + { + "epoch": 2.14, + "learning_rate": 5.655938059876176e-05, + "loss": 1.4566, + "step": 27225 + }, + { + "epoch": 2.14, + "learning_rate": 5.6549712260556406e-05, + "loss": 1.4044, + "step": 27226 + }, + { + "epoch": 2.14, + "learning_rate": 5.6540044556826874e-05, + "loss": 1.4386, + "step": 27227 + }, + { + "epoch": 2.14, + "learning_rate": 5.653037748763886e-05, + "loss": 1.5016, + "step": 27228 + }, + { + "epoch": 2.14, + "learning_rate": 5.652071105305807e-05, + "loss": 1.4427, + "step": 27229 + }, + { + "epoch": 2.14, + "learning_rate": 5.651104525315005e-05, + "loss": 1.4709, + "step": 27230 + }, + { + "epoch": 2.14, + "learning_rate": 5.65013800879804e-05, + "loss": 1.5034, + "step": 27231 + }, + { + "epoch": 2.14, + "learning_rate": 5.649171555761482e-05, + "loss": 1.4305, + "step": 27232 + }, + { + "epoch": 2.14, + "learning_rate": 5.64820516621189e-05, + "loss": 1.4265, + "step": 27233 + }, + { + "epoch": 2.14, + "learning_rate": 5.647238840155818e-05, + "loss": 1.4474, + "step": 27234 + }, + { + "epoch": 2.14, + "learning_rate": 5.6462725775998405e-05, + "loss": 1.3929, + "step": 27235 + }, + { + "epoch": 2.14, + "learning_rate": 5.6453063785505086e-05, + "loss": 1.4856, + "step": 27236 + }, + { + "epoch": 2.14, + "learning_rate": 5.644340243014378e-05, + "loss": 1.4374, + "step": 27237 + }, + { + "epoch": 2.14, + "learning_rate": 5.643374170998021e-05, + "loss": 1.46, + "step": 27238 + }, + { + "epoch": 2.14, + "learning_rate": 5.64240816250799e-05, + "loss": 1.4212, + "step": 27239 + }, + { + "epoch": 2.14, + "learning_rate": 5.641442217550837e-05, + "loss": 1.4714, + "step": 27240 + }, + { + "epoch": 2.14, + "learning_rate": 5.640476336133134e-05, + "loss": 1.4772, + "step": 27241 + }, + { + "epoch": 2.14, + "learning_rate": 5.639510518261431e-05, + "loss": 1.4966, + "step": 27242 + }, + { + "epoch": 2.14, + "learning_rate": 5.638544763942286e-05, + "loss": 1.4051, + "step": 27243 + }, + { + "epoch": 2.14, + "learning_rate": 5.637579073182245e-05, + "loss": 1.4229, + "step": 27244 + }, + { + "epoch": 2.14, + "learning_rate": 5.6366134459878855e-05, + "loss": 1.3949, + "step": 27245 + }, + { + "epoch": 2.14, + "learning_rate": 5.635647882365755e-05, + "loss": 1.4815, + "step": 27246 + }, + { + "epoch": 2.14, + "learning_rate": 5.634682382322406e-05, + "loss": 1.4897, + "step": 27247 + }, + { + "epoch": 2.14, + "learning_rate": 5.6337169458643914e-05, + "loss": 1.4694, + "step": 27248 + }, + { + "epoch": 2.14, + "learning_rate": 5.632751572998275e-05, + "loss": 1.4716, + "step": 27249 + }, + { + "epoch": 2.14, + "learning_rate": 5.631786263730607e-05, + "loss": 1.466, + "step": 27250 + }, + { + "epoch": 2.14, + "learning_rate": 5.6308210180679336e-05, + "loss": 1.4731, + "step": 27251 + }, + { + "epoch": 2.14, + "learning_rate": 5.629855836016821e-05, + "loss": 1.4193, + "step": 27252 + }, + { + "epoch": 2.14, + "learning_rate": 5.628890717583818e-05, + "loss": 1.4728, + "step": 27253 + }, + { + "epoch": 2.14, + "learning_rate": 5.627925662775468e-05, + "loss": 1.4568, + "step": 27254 + }, + { + "epoch": 2.14, + "learning_rate": 5.6269606715983375e-05, + "loss": 1.4518, + "step": 27255 + }, + { + "epoch": 2.14, + "learning_rate": 5.625995744058971e-05, + "loss": 1.42, + "step": 27256 + }, + { + "epoch": 2.14, + "learning_rate": 5.625030880163915e-05, + "loss": 1.4628, + "step": 27257 + }, + { + "epoch": 2.14, + "learning_rate": 5.6240660799197306e-05, + "loss": 1.454, + "step": 27258 + }, + { + "epoch": 2.14, + "learning_rate": 5.6231013433329655e-05, + "loss": 1.4587, + "step": 27259 + }, + { + "epoch": 2.14, + "learning_rate": 5.62213667041016e-05, + "loss": 1.437, + "step": 27260 + }, + { + "epoch": 2.14, + "learning_rate": 5.621172061157873e-05, + "loss": 1.5211, + "step": 27261 + }, + { + "epoch": 2.15, + "learning_rate": 5.620207515582656e-05, + "loss": 1.4807, + "step": 27262 + }, + { + "epoch": 2.15, + "learning_rate": 5.6192430336910556e-05, + "loss": 1.4691, + "step": 27263 + }, + { + "epoch": 2.15, + "learning_rate": 5.6182786154896165e-05, + "loss": 1.4273, + "step": 27264 + }, + { + "epoch": 2.15, + "learning_rate": 5.6173142609848835e-05, + "loss": 1.5012, + "step": 27265 + }, + { + "epoch": 2.15, + "learning_rate": 5.6163499701834135e-05, + "loss": 1.4546, + "step": 27266 + }, + { + "epoch": 2.15, + "learning_rate": 5.615385743091751e-05, + "loss": 1.4866, + "step": 27267 + }, + { + "epoch": 2.15, + "learning_rate": 5.614421579716434e-05, + "loss": 1.4893, + "step": 27268 + }, + { + "epoch": 2.15, + "learning_rate": 5.6134574800640206e-05, + "loss": 1.4457, + "step": 27269 + }, + { + "epoch": 2.15, + "learning_rate": 5.61249344414105e-05, + "loss": 1.4062, + "step": 27270 + }, + { + "epoch": 2.15, + "learning_rate": 5.611529471954063e-05, + "loss": 1.4384, + "step": 27271 + }, + { + "epoch": 2.15, + "learning_rate": 5.610565563509616e-05, + "loss": 1.4578, + "step": 27272 + }, + { + "epoch": 2.15, + "learning_rate": 5.6096017188142477e-05, + "loss": 1.4949, + "step": 27273 + }, + { + "epoch": 2.15, + "learning_rate": 5.6086379378744956e-05, + "loss": 1.4693, + "step": 27274 + }, + { + "epoch": 2.15, + "learning_rate": 5.607674220696915e-05, + "loss": 1.413, + "step": 27275 + }, + { + "epoch": 2.15, + "learning_rate": 5.606710567288039e-05, + "loss": 1.4653, + "step": 27276 + }, + { + "epoch": 2.15, + "learning_rate": 5.605746977654418e-05, + "loss": 1.5028, + "step": 27277 + }, + { + "epoch": 2.15, + "learning_rate": 5.6047834518025864e-05, + "loss": 1.4799, + "step": 27278 + }, + { + "epoch": 2.15, + "learning_rate": 5.603819989739096e-05, + "loss": 1.4582, + "step": 27279 + }, + { + "epoch": 2.15, + "learning_rate": 5.6028565914704834e-05, + "loss": 1.5207, + "step": 27280 + }, + { + "epoch": 2.15, + "learning_rate": 5.601893257003282e-05, + "loss": 1.442, + "step": 27281 + }, + { + "epoch": 2.15, + "learning_rate": 5.6009299863440446e-05, + "loss": 1.4587, + "step": 27282 + }, + { + "epoch": 2.15, + "learning_rate": 5.599966779499307e-05, + "loss": 1.4518, + "step": 27283 + }, + { + "epoch": 2.15, + "learning_rate": 5.5990036364756066e-05, + "loss": 1.4481, + "step": 27284 + }, + { + "epoch": 2.15, + "learning_rate": 5.598040557279477e-05, + "loss": 1.4499, + "step": 27285 + }, + { + "epoch": 2.15, + "learning_rate": 5.597077541917471e-05, + "loss": 1.4222, + "step": 27286 + }, + { + "epoch": 2.15, + "learning_rate": 5.5961145903961196e-05, + "loss": 1.4737, + "step": 27287 + }, + { + "epoch": 2.15, + "learning_rate": 5.595151702721954e-05, + "loss": 1.4929, + "step": 27288 + }, + { + "epoch": 2.15, + "learning_rate": 5.594188878901524e-05, + "loss": 1.4386, + "step": 27289 + }, + { + "epoch": 2.15, + "learning_rate": 5.593226118941361e-05, + "loss": 1.4781, + "step": 27290 + }, + { + "epoch": 2.15, + "learning_rate": 5.592263422847996e-05, + "loss": 1.4835, + "step": 27291 + }, + { + "epoch": 2.15, + "learning_rate": 5.5913007906279714e-05, + "loss": 1.4308, + "step": 27292 + }, + { + "epoch": 2.15, + "learning_rate": 5.5903382222878283e-05, + "loss": 1.4292, + "step": 27293 + }, + { + "epoch": 2.15, + "learning_rate": 5.589375717834095e-05, + "loss": 1.4788, + "step": 27294 + }, + { + "epoch": 2.15, + "learning_rate": 5.588413277273302e-05, + "loss": 1.4049, + "step": 27295 + }, + { + "epoch": 2.15, + "learning_rate": 5.5874509006119935e-05, + "loss": 1.4614, + "step": 27296 + }, + { + "epoch": 2.15, + "learning_rate": 5.5864885878567e-05, + "loss": 1.4551, + "step": 27297 + }, + { + "epoch": 2.15, + "learning_rate": 5.5855263390139485e-05, + "loss": 1.4577, + "step": 27298 + }, + { + "epoch": 2.15, + "learning_rate": 5.5845641540902845e-05, + "loss": 1.4628, + "step": 27299 + }, + { + "epoch": 2.15, + "learning_rate": 5.583602033092233e-05, + "loss": 1.4551, + "step": 27300 + }, + { + "epoch": 2.15, + "learning_rate": 5.5826399760263274e-05, + "loss": 1.4584, + "step": 27301 + }, + { + "epoch": 2.15, + "learning_rate": 5.581677982899095e-05, + "loss": 1.4782, + "step": 27302 + }, + { + "epoch": 2.15, + "learning_rate": 5.5807160537170745e-05, + "loss": 1.4218, + "step": 27303 + }, + { + "epoch": 2.15, + "learning_rate": 5.579754188486797e-05, + "loss": 1.4601, + "step": 27304 + }, + { + "epoch": 2.15, + "learning_rate": 5.5787923872147824e-05, + "loss": 1.4116, + "step": 27305 + }, + { + "epoch": 2.15, + "learning_rate": 5.5778306499075754e-05, + "loss": 1.4156, + "step": 27306 + }, + { + "epoch": 2.15, + "learning_rate": 5.576868976571693e-05, + "loss": 1.4388, + "step": 27307 + }, + { + "epoch": 2.15, + "learning_rate": 5.5759073672136736e-05, + "loss": 1.4491, + "step": 27308 + }, + { + "epoch": 2.15, + "learning_rate": 5.57494582184004e-05, + "loss": 1.4842, + "step": 27309 + }, + { + "epoch": 2.15, + "learning_rate": 5.573984340457326e-05, + "loss": 1.4153, + "step": 27310 + }, + { + "epoch": 2.15, + "learning_rate": 5.573022923072058e-05, + "loss": 1.4603, + "step": 27311 + }, + { + "epoch": 2.15, + "learning_rate": 5.572061569690756e-05, + "loss": 1.4564, + "step": 27312 + }, + { + "epoch": 2.15, + "learning_rate": 5.57110028031996e-05, + "loss": 1.4994, + "step": 27313 + }, + { + "epoch": 2.15, + "learning_rate": 5.5701390549661886e-05, + "loss": 1.5029, + "step": 27314 + }, + { + "epoch": 2.15, + "learning_rate": 5.569177893635965e-05, + "loss": 1.4399, + "step": 27315 + }, + { + "epoch": 2.15, + "learning_rate": 5.568216796335823e-05, + "loss": 1.4364, + "step": 27316 + }, + { + "epoch": 2.15, + "learning_rate": 5.567255763072284e-05, + "loss": 1.4718, + "step": 27317 + }, + { + "epoch": 2.15, + "learning_rate": 5.566294793851874e-05, + "loss": 1.462, + "step": 27318 + }, + { + "epoch": 2.15, + "learning_rate": 5.5653338886811114e-05, + "loss": 1.4397, + "step": 27319 + }, + { + "epoch": 2.15, + "learning_rate": 5.564373047566529e-05, + "loss": 1.4298, + "step": 27320 + }, + { + "epoch": 2.15, + "learning_rate": 5.563412270514647e-05, + "loss": 1.4713, + "step": 27321 + }, + { + "epoch": 2.15, + "learning_rate": 5.5624515575319825e-05, + "loss": 1.4292, + "step": 27322 + }, + { + "epoch": 2.15, + "learning_rate": 5.5614909086250654e-05, + "loss": 1.4375, + "step": 27323 + }, + { + "epoch": 2.15, + "learning_rate": 5.5605303238004206e-05, + "loss": 1.4472, + "step": 27324 + }, + { + "epoch": 2.15, + "learning_rate": 5.559569803064567e-05, + "loss": 1.4787, + "step": 27325 + }, + { + "epoch": 2.15, + "learning_rate": 5.558609346424019e-05, + "loss": 1.4614, + "step": 27326 + }, + { + "epoch": 2.15, + "learning_rate": 5.557648953885308e-05, + "loss": 1.4684, + "step": 27327 + }, + { + "epoch": 2.15, + "learning_rate": 5.5566886254549494e-05, + "loss": 1.4495, + "step": 27328 + }, + { + "epoch": 2.15, + "learning_rate": 5.5557283611394586e-05, + "loss": 1.4323, + "step": 27329 + }, + { + "epoch": 2.15, + "learning_rate": 5.554768160945367e-05, + "loss": 1.4648, + "step": 27330 + }, + { + "epoch": 2.15, + "learning_rate": 5.5538080248791874e-05, + "loss": 1.5077, + "step": 27331 + }, + { + "epoch": 2.15, + "learning_rate": 5.552847952947432e-05, + "loss": 1.4622, + "step": 27332 + }, + { + "epoch": 2.15, + "learning_rate": 5.551887945156632e-05, + "loss": 1.4462, + "step": 27333 + }, + { + "epoch": 2.15, + "learning_rate": 5.550928001513297e-05, + "loss": 1.4792, + "step": 27334 + }, + { + "epoch": 2.15, + "learning_rate": 5.549968122023942e-05, + "loss": 1.4569, + "step": 27335 + }, + { + "epoch": 2.15, + "learning_rate": 5.549008306695095e-05, + "loss": 1.4534, + "step": 27336 + }, + { + "epoch": 2.15, + "learning_rate": 5.548048555533265e-05, + "loss": 1.4526, + "step": 27337 + }, + { + "epoch": 2.15, + "learning_rate": 5.547088868544964e-05, + "loss": 1.4382, + "step": 27338 + }, + { + "epoch": 2.15, + "learning_rate": 5.5461292457367144e-05, + "loss": 1.48, + "step": 27339 + }, + { + "epoch": 2.15, + "learning_rate": 5.545169687115034e-05, + "loss": 1.4027, + "step": 27340 + }, + { + "epoch": 2.15, + "learning_rate": 5.5442101926864344e-05, + "loss": 1.4344, + "step": 27341 + }, + { + "epoch": 2.15, + "learning_rate": 5.543250762457429e-05, + "loss": 1.4515, + "step": 27342 + }, + { + "epoch": 2.15, + "learning_rate": 5.542291396434527e-05, + "loss": 1.431, + "step": 27343 + }, + { + "epoch": 2.15, + "learning_rate": 5.541332094624252e-05, + "loss": 1.4797, + "step": 27344 + }, + { + "epoch": 2.15, + "learning_rate": 5.540372857033114e-05, + "loss": 1.4685, + "step": 27345 + }, + { + "epoch": 2.15, + "learning_rate": 5.539413683667617e-05, + "loss": 1.4959, + "step": 27346 + }, + { + "epoch": 2.15, + "learning_rate": 5.538454574534287e-05, + "loss": 1.4794, + "step": 27347 + }, + { + "epoch": 2.15, + "learning_rate": 5.537495529639629e-05, + "loss": 1.4685, + "step": 27348 + }, + { + "epoch": 2.15, + "learning_rate": 5.536536548990149e-05, + "loss": 1.4376, + "step": 27349 + }, + { + "epoch": 2.15, + "learning_rate": 5.535577632592367e-05, + "loss": 1.4847, + "step": 27350 + }, + { + "epoch": 2.15, + "learning_rate": 5.534618780452793e-05, + "loss": 1.4189, + "step": 27351 + }, + { + "epoch": 2.15, + "learning_rate": 5.5336599925779275e-05, + "loss": 1.4838, + "step": 27352 + }, + { + "epoch": 2.15, + "learning_rate": 5.5327012689742914e-05, + "loss": 1.4547, + "step": 27353 + }, + { + "epoch": 2.15, + "learning_rate": 5.531742609648384e-05, + "loss": 1.4357, + "step": 27354 + }, + { + "epoch": 2.15, + "learning_rate": 5.530784014606724e-05, + "loss": 1.4615, + "step": 27355 + }, + { + "epoch": 2.15, + "learning_rate": 5.529825483855811e-05, + "loss": 1.4533, + "step": 27356 + }, + { + "epoch": 2.15, + "learning_rate": 5.5288670174021614e-05, + "loss": 1.4774, + "step": 27357 + }, + { + "epoch": 2.15, + "learning_rate": 5.5279086152522796e-05, + "loss": 1.4859, + "step": 27358 + }, + { + "epoch": 2.15, + "learning_rate": 5.5269502774126696e-05, + "loss": 1.5221, + "step": 27359 + }, + { + "epoch": 2.15, + "learning_rate": 5.5259920038898346e-05, + "loss": 1.428, + "step": 27360 + }, + { + "epoch": 2.15, + "learning_rate": 5.52503379469029e-05, + "loss": 1.491, + "step": 27361 + }, + { + "epoch": 2.15, + "learning_rate": 5.524075649820539e-05, + "loss": 1.4413, + "step": 27362 + }, + { + "epoch": 2.15, + "learning_rate": 5.52311756928708e-05, + "loss": 1.5091, + "step": 27363 + }, + { + "epoch": 2.15, + "learning_rate": 5.5221595530964256e-05, + "loss": 1.3943, + "step": 27364 + }, + { + "epoch": 2.15, + "learning_rate": 5.521201601255079e-05, + "loss": 1.4715, + "step": 27365 + }, + { + "epoch": 2.15, + "learning_rate": 5.520243713769538e-05, + "loss": 1.4315, + "step": 27366 + }, + { + "epoch": 2.15, + "learning_rate": 5.519285890646316e-05, + "loss": 1.467, + "step": 27367 + }, + { + "epoch": 2.15, + "learning_rate": 5.518328131891911e-05, + "loss": 1.4762, + "step": 27368 + }, + { + "epoch": 2.15, + "learning_rate": 5.5173704375128206e-05, + "loss": 1.4535, + "step": 27369 + }, + { + "epoch": 2.15, + "learning_rate": 5.5164128075155505e-05, + "loss": 1.4346, + "step": 27370 + }, + { + "epoch": 2.15, + "learning_rate": 5.51545524190661e-05, + "loss": 1.4603, + "step": 27371 + }, + { + "epoch": 2.15, + "learning_rate": 5.514497740692494e-05, + "loss": 1.4752, + "step": 27372 + }, + { + "epoch": 2.15, + "learning_rate": 5.5135403038797005e-05, + "loss": 1.4203, + "step": 27373 + }, + { + "epoch": 2.15, + "learning_rate": 5.512582931474736e-05, + "loss": 1.4906, + "step": 27374 + }, + { + "epoch": 2.15, + "learning_rate": 5.511625623484099e-05, + "loss": 1.4563, + "step": 27375 + }, + { + "epoch": 2.15, + "learning_rate": 5.510668379914289e-05, + "loss": 1.4425, + "step": 27376 + }, + { + "epoch": 2.15, + "learning_rate": 5.509711200771797e-05, + "loss": 1.4121, + "step": 27377 + }, + { + "epoch": 2.15, + "learning_rate": 5.5087540860631336e-05, + "loss": 1.4374, + "step": 27378 + }, + { + "epoch": 2.15, + "learning_rate": 5.507797035794793e-05, + "loss": 1.4718, + "step": 27379 + }, + { + "epoch": 2.15, + "learning_rate": 5.506840049973267e-05, + "loss": 1.4395, + "step": 27380 + }, + { + "epoch": 2.15, + "learning_rate": 5.505883128605064e-05, + "loss": 1.454, + "step": 27381 + }, + { + "epoch": 2.15, + "learning_rate": 5.504926271696675e-05, + "loss": 1.4069, + "step": 27382 + }, + { + "epoch": 2.15, + "learning_rate": 5.503969479254592e-05, + "loss": 1.4176, + "step": 27383 + }, + { + "epoch": 2.15, + "learning_rate": 5.503012751285321e-05, + "loss": 1.4284, + "step": 27384 + }, + { + "epoch": 2.15, + "learning_rate": 5.502056087795353e-05, + "loss": 1.4809, + "step": 27385 + }, + { + "epoch": 2.15, + "learning_rate": 5.501099488791177e-05, + "loss": 1.4386, + "step": 27386 + }, + { + "epoch": 2.15, + "learning_rate": 5.500142954279293e-05, + "loss": 1.4882, + "step": 27387 + }, + { + "epoch": 2.15, + "learning_rate": 5.4991864842662006e-05, + "loss": 1.4752, + "step": 27388 + }, + { + "epoch": 2.16, + "learning_rate": 5.49823007875839e-05, + "loss": 1.4109, + "step": 27389 + }, + { + "epoch": 2.16, + "learning_rate": 5.4972737377623494e-05, + "loss": 1.415, + "step": 27390 + }, + { + "epoch": 2.16, + "learning_rate": 5.4963174612845805e-05, + "loss": 1.4549, + "step": 27391 + }, + { + "epoch": 2.16, + "learning_rate": 5.495361249331571e-05, + "loss": 1.4512, + "step": 27392 + }, + { + "epoch": 2.16, + "learning_rate": 5.494405101909808e-05, + "loss": 1.4385, + "step": 27393 + }, + { + "epoch": 2.16, + "learning_rate": 5.493449019025795e-05, + "loss": 1.4561, + "step": 27394 + }, + { + "epoch": 2.16, + "learning_rate": 5.4924930006860156e-05, + "loss": 1.3984, + "step": 27395 + }, + { + "epoch": 2.16, + "learning_rate": 5.491537046896963e-05, + "loss": 1.4833, + "step": 27396 + }, + { + "epoch": 2.16, + "learning_rate": 5.490581157665121e-05, + "loss": 1.4905, + "step": 27397 + }, + { + "epoch": 2.16, + "learning_rate": 5.489625332996992e-05, + "loss": 1.4676, + "step": 27398 + }, + { + "epoch": 2.16, + "learning_rate": 5.488669572899057e-05, + "loss": 1.4485, + "step": 27399 + }, + { + "epoch": 2.16, + "learning_rate": 5.487713877377803e-05, + "loss": 1.4694, + "step": 27400 + }, + { + "epoch": 2.16, + "learning_rate": 5.486758246439721e-05, + "loss": 1.4613, + "step": 27401 + }, + { + "epoch": 2.16, + "learning_rate": 5.485802680091306e-05, + "loss": 1.4582, + "step": 27402 + }, + { + "epoch": 2.16, + "learning_rate": 5.4848471783390404e-05, + "loss": 1.4767, + "step": 27403 + }, + { + "epoch": 2.16, + "learning_rate": 5.483891741189407e-05, + "loss": 1.4578, + "step": 27404 + }, + { + "epoch": 2.16, + "learning_rate": 5.482936368648904e-05, + "loss": 1.5014, + "step": 27405 + }, + { + "epoch": 2.16, + "learning_rate": 5.4819810607240075e-05, + "loss": 1.4297, + "step": 27406 + }, + { + "epoch": 2.16, + "learning_rate": 5.481025817421205e-05, + "loss": 1.4921, + "step": 27407 + }, + { + "epoch": 2.16, + "learning_rate": 5.480070638746987e-05, + "loss": 1.505, + "step": 27408 + }, + { + "epoch": 2.16, + "learning_rate": 5.4791155247078374e-05, + "loss": 1.5074, + "step": 27409 + }, + { + "epoch": 2.16, + "learning_rate": 5.478160475310234e-05, + "loss": 1.4732, + "step": 27410 + }, + { + "epoch": 2.16, + "learning_rate": 5.477205490560672e-05, + "loss": 1.422, + "step": 27411 + }, + { + "epoch": 2.16, + "learning_rate": 5.476250570465629e-05, + "loss": 1.474, + "step": 27412 + }, + { + "epoch": 2.16, + "learning_rate": 5.475295715031588e-05, + "loss": 1.4626, + "step": 27413 + }, + { + "epoch": 2.16, + "learning_rate": 5.47434092426503e-05, + "loss": 1.3765, + "step": 27414 + }, + { + "epoch": 2.16, + "learning_rate": 5.473386198172443e-05, + "loss": 1.4467, + "step": 27415 + }, + { + "epoch": 2.16, + "learning_rate": 5.472431536760309e-05, + "loss": 1.4202, + "step": 27416 + }, + { + "epoch": 2.16, + "learning_rate": 5.4714769400351005e-05, + "loss": 1.4298, + "step": 27417 + }, + { + "epoch": 2.16, + "learning_rate": 5.470522408003306e-05, + "loss": 1.4242, + "step": 27418 + }, + { + "epoch": 2.16, + "learning_rate": 5.4695679406714086e-05, + "loss": 1.4702, + "step": 27419 + }, + { + "epoch": 2.16, + "learning_rate": 5.468613538045888e-05, + "loss": 1.4871, + "step": 27420 + }, + { + "epoch": 2.16, + "learning_rate": 5.467659200133216e-05, + "loss": 1.4621, + "step": 27421 + }, + { + "epoch": 2.16, + "learning_rate": 5.4667049269398826e-05, + "loss": 1.4593, + "step": 27422 + }, + { + "epoch": 2.16, + "learning_rate": 5.465750718472362e-05, + "loss": 1.49, + "step": 27423 + }, + { + "epoch": 2.16, + "learning_rate": 5.4647965747371274e-05, + "loss": 1.4442, + "step": 27424 + }, + { + "epoch": 2.16, + "learning_rate": 5.4638424957406654e-05, + "loss": 1.5056, + "step": 27425 + }, + { + "epoch": 2.16, + "learning_rate": 5.462888481489453e-05, + "loss": 1.4293, + "step": 27426 + }, + { + "epoch": 2.16, + "learning_rate": 5.4619345319899594e-05, + "loss": 1.4756, + "step": 27427 + }, + { + "epoch": 2.16, + "learning_rate": 5.460980647248671e-05, + "loss": 1.4764, + "step": 27428 + }, + { + "epoch": 2.16, + "learning_rate": 5.46002682727206e-05, + "loss": 1.4386, + "step": 27429 + }, + { + "epoch": 2.16, + "learning_rate": 5.459073072066602e-05, + "loss": 1.4322, + "step": 27430 + }, + { + "epoch": 2.16, + "learning_rate": 5.4581193816387674e-05, + "loss": 1.4925, + "step": 27431 + }, + { + "epoch": 2.16, + "learning_rate": 5.457165755995043e-05, + "loss": 1.4681, + "step": 27432 + }, + { + "epoch": 2.16, + "learning_rate": 5.456212195141891e-05, + "loss": 1.4558, + "step": 27433 + }, + { + "epoch": 2.16, + "learning_rate": 5.4552586990857914e-05, + "loss": 1.4504, + "step": 27434 + }, + { + "epoch": 2.16, + "learning_rate": 5.454305267833223e-05, + "loss": 1.4685, + "step": 27435 + }, + { + "epoch": 2.16, + "learning_rate": 5.453351901390654e-05, + "loss": 1.4634, + "step": 27436 + }, + { + "epoch": 2.16, + "learning_rate": 5.4523985997645584e-05, + "loss": 1.4212, + "step": 27437 + }, + { + "epoch": 2.16, + "learning_rate": 5.4514453629614016e-05, + "loss": 1.4925, + "step": 27438 + }, + { + "epoch": 2.16, + "learning_rate": 5.450492190987667e-05, + "loss": 1.5116, + "step": 27439 + }, + { + "epoch": 2.16, + "learning_rate": 5.44953908384982e-05, + "loss": 1.4875, + "step": 27440 + }, + { + "epoch": 2.16, + "learning_rate": 5.448586041554327e-05, + "loss": 1.3963, + "step": 27441 + }, + { + "epoch": 2.16, + "learning_rate": 5.44763306410767e-05, + "loss": 1.4292, + "step": 27442 + }, + { + "epoch": 2.16, + "learning_rate": 5.446680151516312e-05, + "loss": 1.445, + "step": 27443 + }, + { + "epoch": 2.16, + "learning_rate": 5.445727303786719e-05, + "loss": 1.4459, + "step": 27444 + }, + { + "epoch": 2.16, + "learning_rate": 5.4447745209253696e-05, + "loss": 1.4724, + "step": 27445 + }, + { + "epoch": 2.16, + "learning_rate": 5.443821802938729e-05, + "loss": 1.45, + "step": 27446 + }, + { + "epoch": 2.16, + "learning_rate": 5.442869149833261e-05, + "loss": 1.4881, + "step": 27447 + }, + { + "epoch": 2.16, + "learning_rate": 5.441916561615435e-05, + "loss": 1.4767, + "step": 27448 + }, + { + "epoch": 2.16, + "learning_rate": 5.440964038291727e-05, + "loss": 1.4391, + "step": 27449 + }, + { + "epoch": 2.16, + "learning_rate": 5.440011579868599e-05, + "loss": 1.4819, + "step": 27450 + }, + { + "epoch": 2.16, + "learning_rate": 5.439059186352511e-05, + "loss": 1.472, + "step": 27451 + }, + { + "epoch": 2.16, + "learning_rate": 5.4381068577499385e-05, + "loss": 1.4174, + "step": 27452 + }, + { + "epoch": 2.16, + "learning_rate": 5.437154594067346e-05, + "loss": 1.4235, + "step": 27453 + }, + { + "epoch": 2.16, + "learning_rate": 5.436202395311196e-05, + "loss": 1.4665, + "step": 27454 + }, + { + "epoch": 2.16, + "learning_rate": 5.435250261487948e-05, + "loss": 1.4331, + "step": 27455 + }, + { + "epoch": 2.16, + "learning_rate": 5.434298192604078e-05, + "loss": 1.4817, + "step": 27456 + }, + { + "epoch": 2.16, + "learning_rate": 5.4333461886660446e-05, + "loss": 1.4969, + "step": 27457 + }, + { + "epoch": 2.16, + "learning_rate": 5.4323942496803064e-05, + "loss": 1.4949, + "step": 27458 + }, + { + "epoch": 2.16, + "learning_rate": 5.4314423756533365e-05, + "loss": 1.4807, + "step": 27459 + }, + { + "epoch": 2.16, + "learning_rate": 5.430490566591591e-05, + "loss": 1.4365, + "step": 27460 + }, + { + "epoch": 2.16, + "learning_rate": 5.4295388225015315e-05, + "loss": 1.4274, + "step": 27461 + }, + { + "epoch": 2.16, + "learning_rate": 5.4285871433896255e-05, + "loss": 1.4686, + "step": 27462 + }, + { + "epoch": 2.16, + "learning_rate": 5.427635529262331e-05, + "loss": 1.5194, + "step": 27463 + }, + { + "epoch": 2.16, + "learning_rate": 5.4266839801261035e-05, + "loss": 1.4439, + "step": 27464 + }, + { + "epoch": 2.16, + "learning_rate": 5.4257324959874086e-05, + "loss": 1.4378, + "step": 27465 + }, + { + "epoch": 2.16, + "learning_rate": 5.424781076852711e-05, + "loss": 1.4533, + "step": 27466 + }, + { + "epoch": 2.16, + "learning_rate": 5.423829722728467e-05, + "loss": 1.503, + "step": 27467 + }, + { + "epoch": 2.16, + "learning_rate": 5.42287843362113e-05, + "loss": 1.4334, + "step": 27468 + }, + { + "epoch": 2.16, + "learning_rate": 5.421927209537166e-05, + "loss": 1.4586, + "step": 27469 + }, + { + "epoch": 2.16, + "learning_rate": 5.420976050483032e-05, + "loss": 1.5076, + "step": 27470 + }, + { + "epoch": 2.16, + "learning_rate": 5.4200249564651865e-05, + "loss": 1.4815, + "step": 27471 + }, + { + "epoch": 2.16, + "learning_rate": 5.419073927490077e-05, + "loss": 1.5408, + "step": 27472 + }, + { + "epoch": 2.16, + "learning_rate": 5.418122963564175e-05, + "loss": 1.4493, + "step": 27473 + }, + { + "epoch": 2.16, + "learning_rate": 5.4171720646939306e-05, + "loss": 1.5015, + "step": 27474 + }, + { + "epoch": 2.16, + "learning_rate": 5.4162212308857934e-05, + "loss": 1.4704, + "step": 27475 + }, + { + "epoch": 2.16, + "learning_rate": 5.41527046214623e-05, + "loss": 1.4095, + "step": 27476 + }, + { + "epoch": 2.16, + "learning_rate": 5.414319758481692e-05, + "loss": 1.4041, + "step": 27477 + }, + { + "epoch": 2.16, + "learning_rate": 5.4133691198986276e-05, + "loss": 1.5019, + "step": 27478 + }, + { + "epoch": 2.16, + "learning_rate": 5.412418546403502e-05, + "loss": 1.4777, + "step": 27479 + }, + { + "epoch": 2.16, + "learning_rate": 5.411468038002758e-05, + "loss": 1.4177, + "step": 27480 + }, + { + "epoch": 2.16, + "learning_rate": 5.41051759470286e-05, + "loss": 1.4639, + "step": 27481 + }, + { + "epoch": 2.16, + "learning_rate": 5.409567216510249e-05, + "loss": 1.3983, + "step": 27482 + }, + { + "epoch": 2.16, + "learning_rate": 5.40861690343139e-05, + "loss": 1.4174, + "step": 27483 + }, + { + "epoch": 2.16, + "learning_rate": 5.40766665547273e-05, + "loss": 1.4702, + "step": 27484 + }, + { + "epoch": 2.16, + "learning_rate": 5.4067164726407146e-05, + "loss": 1.4823, + "step": 27485 + }, + { + "epoch": 2.16, + "learning_rate": 5.405766354941806e-05, + "loss": 1.4728, + "step": 27486 + }, + { + "epoch": 2.16, + "learning_rate": 5.4048163023824496e-05, + "loss": 1.4661, + "step": 27487 + }, + { + "epoch": 2.16, + "learning_rate": 5.4038663149690936e-05, + "loss": 1.4242, + "step": 27488 + }, + { + "epoch": 2.16, + "learning_rate": 5.402916392708186e-05, + "loss": 1.4934, + "step": 27489 + }, + { + "epoch": 2.16, + "learning_rate": 5.4019665356061844e-05, + "loss": 1.4638, + "step": 27490 + }, + { + "epoch": 2.16, + "learning_rate": 5.4010167436695354e-05, + "loss": 1.443, + "step": 27491 + }, + { + "epoch": 2.16, + "learning_rate": 5.400067016904678e-05, + "loss": 1.4559, + "step": 27492 + }, + { + "epoch": 2.16, + "learning_rate": 5.399117355318073e-05, + "loss": 1.4414, + "step": 27493 + }, + { + "epoch": 2.16, + "learning_rate": 5.398167758916165e-05, + "loss": 1.4441, + "step": 27494 + }, + { + "epoch": 2.16, + "learning_rate": 5.397218227705393e-05, + "loss": 1.4193, + "step": 27495 + }, + { + "epoch": 2.16, + "learning_rate": 5.39626876169221e-05, + "loss": 1.3986, + "step": 27496 + }, + { + "epoch": 2.16, + "learning_rate": 5.395319360883067e-05, + "loss": 1.5084, + "step": 27497 + }, + { + "epoch": 2.16, + "learning_rate": 5.394370025284405e-05, + "loss": 1.4682, + "step": 27498 + }, + { + "epoch": 2.16, + "learning_rate": 5.393420754902664e-05, + "loss": 1.4535, + "step": 27499 + }, + { + "epoch": 2.16, + "learning_rate": 5.392471549744302e-05, + "loss": 1.4683, + "step": 27500 + }, + { + "epoch": 2.16, + "learning_rate": 5.391522409815755e-05, + "loss": 1.448, + "step": 27501 + }, + { + "epoch": 2.16, + "learning_rate": 5.3905733351234624e-05, + "loss": 1.4522, + "step": 27502 + }, + { + "epoch": 2.16, + "learning_rate": 5.3896243256738815e-05, + "loss": 1.4302, + "step": 27503 + }, + { + "epoch": 2.16, + "learning_rate": 5.388675381473446e-05, + "loss": 1.4711, + "step": 27504 + }, + { + "epoch": 2.16, + "learning_rate": 5.387726502528597e-05, + "loss": 1.5136, + "step": 27505 + }, + { + "epoch": 2.16, + "learning_rate": 5.386777688845785e-05, + "loss": 1.4327, + "step": 27506 + }, + { + "epoch": 2.16, + "learning_rate": 5.3858289404314476e-05, + "loss": 1.4249, + "step": 27507 + }, + { + "epoch": 2.16, + "learning_rate": 5.3848802572920255e-05, + "loss": 1.4532, + "step": 27508 + }, + { + "epoch": 2.16, + "learning_rate": 5.383931639433955e-05, + "loss": 1.4714, + "step": 27509 + }, + { + "epoch": 2.16, + "learning_rate": 5.382983086863688e-05, + "loss": 1.4858, + "step": 27510 + }, + { + "epoch": 2.16, + "learning_rate": 5.3820345995876545e-05, + "loss": 1.4591, + "step": 27511 + }, + { + "epoch": 2.16, + "learning_rate": 5.3810861776123025e-05, + "loss": 1.448, + "step": 27512 + }, + { + "epoch": 2.16, + "learning_rate": 5.380137820944062e-05, + "loss": 1.4594, + "step": 27513 + }, + { + "epoch": 2.16, + "learning_rate": 5.3791895295893825e-05, + "loss": 1.4655, + "step": 27514 + }, + { + "epoch": 2.16, + "learning_rate": 5.378241303554696e-05, + "loss": 1.4109, + "step": 27515 + }, + { + "epoch": 2.16, + "learning_rate": 5.377293142846437e-05, + "loss": 1.5096, + "step": 27516 + }, + { + "epoch": 2.17, + "learning_rate": 5.3763450474710526e-05, + "loss": 1.4883, + "step": 27517 + }, + { + "epoch": 2.17, + "learning_rate": 5.375397017434975e-05, + "loss": 1.4645, + "step": 27518 + }, + { + "epoch": 2.17, + "learning_rate": 5.3744490527446345e-05, + "loss": 1.4582, + "step": 27519 + }, + { + "epoch": 2.17, + "learning_rate": 5.373501153406477e-05, + "loss": 1.4413, + "step": 27520 + }, + { + "epoch": 2.17, + "learning_rate": 5.372553319426936e-05, + "loss": 1.4711, + "step": 27521 + }, + { + "epoch": 2.17, + "learning_rate": 5.3716055508124395e-05, + "loss": 1.4797, + "step": 27522 + }, + { + "epoch": 2.17, + "learning_rate": 5.370657847569433e-05, + "loss": 1.452, + "step": 27523 + }, + { + "epoch": 2.17, + "learning_rate": 5.369710209704346e-05, + "loss": 1.4673, + "step": 27524 + }, + { + "epoch": 2.17, + "learning_rate": 5.368762637223612e-05, + "loss": 1.4625, + "step": 27525 + }, + { + "epoch": 2.17, + "learning_rate": 5.367815130133661e-05, + "loss": 1.4701, + "step": 27526 + }, + { + "epoch": 2.17, + "learning_rate": 5.366867688440927e-05, + "loss": 1.4386, + "step": 27527 + }, + { + "epoch": 2.17, + "learning_rate": 5.365920312151853e-05, + "loss": 1.4863, + "step": 27528 + }, + { + "epoch": 2.17, + "learning_rate": 5.3649730012728626e-05, + "loss": 1.4436, + "step": 27529 + }, + { + "epoch": 2.17, + "learning_rate": 5.364025755810383e-05, + "loss": 1.4038, + "step": 27530 + }, + { + "epoch": 2.17, + "learning_rate": 5.3630785757708567e-05, + "loss": 1.521, + "step": 27531 + }, + { + "epoch": 2.17, + "learning_rate": 5.362131461160709e-05, + "loss": 1.5084, + "step": 27532 + }, + { + "epoch": 2.17, + "learning_rate": 5.361184411986363e-05, + "loss": 1.4888, + "step": 27533 + }, + { + "epoch": 2.17, + "learning_rate": 5.360237428254264e-05, + "loss": 1.4319, + "step": 27534 + }, + { + "epoch": 2.17, + "learning_rate": 5.3592905099708314e-05, + "loss": 1.4449, + "step": 27535 + }, + { + "epoch": 2.17, + "learning_rate": 5.3583436571424904e-05, + "loss": 1.4624, + "step": 27536 + }, + { + "epoch": 2.17, + "learning_rate": 5.357396869775682e-05, + "loss": 1.4153, + "step": 27537 + }, + { + "epoch": 2.17, + "learning_rate": 5.3564501478768265e-05, + "loss": 1.4584, + "step": 27538 + }, + { + "epoch": 2.17, + "learning_rate": 5.3555034914523466e-05, + "loss": 1.4667, + "step": 27539 + }, + { + "epoch": 2.17, + "learning_rate": 5.3545569005086825e-05, + "loss": 1.4451, + "step": 27540 + }, + { + "epoch": 2.17, + "learning_rate": 5.353610375052254e-05, + "loss": 1.4443, + "step": 27541 + }, + { + "epoch": 2.17, + "learning_rate": 5.352663915089488e-05, + "loss": 1.4587, + "step": 27542 + }, + { + "epoch": 2.17, + "learning_rate": 5.351717520626799e-05, + "loss": 1.4558, + "step": 27543 + }, + { + "epoch": 2.17, + "learning_rate": 5.3507711916706346e-05, + "loss": 1.4671, + "step": 27544 + }, + { + "epoch": 2.17, + "learning_rate": 5.349824928227408e-05, + "loss": 1.4792, + "step": 27545 + }, + { + "epoch": 2.17, + "learning_rate": 5.34887873030354e-05, + "loss": 1.4521, + "step": 27546 + }, + { + "epoch": 2.17, + "learning_rate": 5.347932597905466e-05, + "loss": 1.4865, + "step": 27547 + }, + { + "epoch": 2.17, + "learning_rate": 5.3469865310396015e-05, + "loss": 1.4095, + "step": 27548 + }, + { + "epoch": 2.17, + "learning_rate": 5.3460405297123716e-05, + "loss": 1.4546, + "step": 27549 + }, + { + "epoch": 2.17, + "learning_rate": 5.3450945939301944e-05, + "loss": 1.4733, + "step": 27550 + }, + { + "epoch": 2.17, + "learning_rate": 5.3441487236995025e-05, + "loss": 1.4205, + "step": 27551 + }, + { + "epoch": 2.17, + "learning_rate": 5.3432029190267126e-05, + "loss": 1.4632, + "step": 27552 + }, + { + "epoch": 2.17, + "learning_rate": 5.342257179918239e-05, + "loss": 1.458, + "step": 27553 + }, + { + "epoch": 2.17, + "learning_rate": 5.341311506380516e-05, + "loss": 1.5016, + "step": 27554 + }, + { + "epoch": 2.17, + "learning_rate": 5.340365898419957e-05, + "loss": 1.4691, + "step": 27555 + }, + { + "epoch": 2.17, + "learning_rate": 5.339420356042978e-05, + "loss": 1.5226, + "step": 27556 + }, + { + "epoch": 2.17, + "learning_rate": 5.338474879256008e-05, + "loss": 1.4528, + "step": 27557 + }, + { + "epoch": 2.17, + "learning_rate": 5.3375294680654576e-05, + "loss": 1.4736, + "step": 27558 + }, + { + "epoch": 2.17, + "learning_rate": 5.336584122477755e-05, + "loss": 1.4066, + "step": 27559 + }, + { + "epoch": 2.17, + "learning_rate": 5.335638842499309e-05, + "loss": 1.4075, + "step": 27560 + }, + { + "epoch": 2.17, + "learning_rate": 5.334693628136546e-05, + "loss": 1.5, + "step": 27561 + }, + { + "epoch": 2.17, + "learning_rate": 5.333748479395881e-05, + "loss": 1.4631, + "step": 27562 + }, + { + "epoch": 2.17, + "learning_rate": 5.332803396283723e-05, + "loss": 1.4353, + "step": 27563 + }, + { + "epoch": 2.17, + "learning_rate": 5.331858378806501e-05, + "loss": 1.4869, + "step": 27564 + }, + { + "epoch": 2.17, + "learning_rate": 5.330913426970625e-05, + "loss": 1.4251, + "step": 27565 + }, + { + "epoch": 2.17, + "learning_rate": 5.329968540782511e-05, + "loss": 1.434, + "step": 27566 + }, + { + "epoch": 2.17, + "learning_rate": 5.3290237202485694e-05, + "loss": 1.4219, + "step": 27567 + }, + { + "epoch": 2.17, + "learning_rate": 5.328078965375224e-05, + "loss": 1.4713, + "step": 27568 + }, + { + "epoch": 2.17, + "learning_rate": 5.327134276168886e-05, + "loss": 1.4157, + "step": 27569 + }, + { + "epoch": 2.17, + "learning_rate": 5.326189652635963e-05, + "loss": 1.3995, + "step": 27570 + }, + { + "epoch": 2.17, + "learning_rate": 5.3252450947828786e-05, + "loss": 1.4293, + "step": 27571 + }, + { + "epoch": 2.17, + "learning_rate": 5.324300602616042e-05, + "loss": 1.4555, + "step": 27572 + }, + { + "epoch": 2.17, + "learning_rate": 5.323356176141858e-05, + "loss": 1.418, + "step": 27573 + }, + { + "epoch": 2.17, + "learning_rate": 5.322411815366747e-05, + "loss": 1.4371, + "step": 27574 + }, + { + "epoch": 2.17, + "learning_rate": 5.321467520297124e-05, + "loss": 1.5066, + "step": 27575 + }, + { + "epoch": 2.17, + "learning_rate": 5.320523290939395e-05, + "loss": 1.4834, + "step": 27576 + }, + { + "epoch": 2.17, + "learning_rate": 5.319579127299967e-05, + "loss": 1.4922, + "step": 27577 + }, + { + "epoch": 2.17, + "learning_rate": 5.3186350293852595e-05, + "loss": 1.455, + "step": 27578 + }, + { + "epoch": 2.17, + "learning_rate": 5.317690997201678e-05, + "loss": 1.3756, + "step": 27579 + }, + { + "epoch": 2.17, + "learning_rate": 5.316747030755625e-05, + "loss": 1.4329, + "step": 27580 + }, + { + "epoch": 2.17, + "learning_rate": 5.315803130053522e-05, + "loss": 1.3656, + "step": 27581 + }, + { + "epoch": 2.17, + "learning_rate": 5.314859295101771e-05, + "loss": 1.467, + "step": 27582 + }, + { + "epoch": 2.17, + "learning_rate": 5.313915525906782e-05, + "loss": 1.4049, + "step": 27583 + }, + { + "epoch": 2.17, + "learning_rate": 5.3129718224749543e-05, + "loss": 1.44, + "step": 27584 + }, + { + "epoch": 2.17, + "learning_rate": 5.312028184812708e-05, + "loss": 1.4775, + "step": 27585 + }, + { + "epoch": 2.17, + "learning_rate": 5.3110846129264443e-05, + "loss": 1.3787, + "step": 27586 + }, + { + "epoch": 2.17, + "learning_rate": 5.310141106822564e-05, + "loss": 1.4553, + "step": 27587 + }, + { + "epoch": 2.17, + "learning_rate": 5.309197666507485e-05, + "loss": 1.4108, + "step": 27588 + }, + { + "epoch": 2.17, + "learning_rate": 5.3082542919876046e-05, + "loss": 1.3812, + "step": 27589 + }, + { + "epoch": 2.17, + "learning_rate": 5.307310983269324e-05, + "loss": 1.4989, + "step": 27590 + }, + { + "epoch": 2.17, + "learning_rate": 5.306367740359052e-05, + "loss": 1.4844, + "step": 27591 + }, + { + "epoch": 2.17, + "learning_rate": 5.305424563263201e-05, + "loss": 1.4619, + "step": 27592 + }, + { + "epoch": 2.17, + "learning_rate": 5.3044814519881666e-05, + "loss": 1.4231, + "step": 27593 + }, + { + "epoch": 2.17, + "learning_rate": 5.3035384065403466e-05, + "loss": 1.4489, + "step": 27594 + }, + { + "epoch": 2.17, + "learning_rate": 5.302595426926156e-05, + "loss": 1.4557, + "step": 27595 + }, + { + "epoch": 2.17, + "learning_rate": 5.3016525131519895e-05, + "loss": 1.4104, + "step": 27596 + }, + { + "epoch": 2.17, + "learning_rate": 5.300709665224247e-05, + "loss": 1.4368, + "step": 27597 + }, + { + "epoch": 2.17, + "learning_rate": 5.299766883149337e-05, + "loss": 1.5037, + "step": 27598 + }, + { + "epoch": 2.17, + "learning_rate": 5.298824166933658e-05, + "loss": 1.4026, + "step": 27599 + }, + { + "epoch": 2.17, + "learning_rate": 5.297881516583609e-05, + "loss": 1.4583, + "step": 27600 + }, + { + "epoch": 2.17, + "learning_rate": 5.296938932105586e-05, + "loss": 1.437, + "step": 27601 + }, + { + "epoch": 2.17, + "learning_rate": 5.2959964135059975e-05, + "loss": 1.4798, + "step": 27602 + }, + { + "epoch": 2.17, + "learning_rate": 5.2950539607912376e-05, + "loss": 1.4201, + "step": 27603 + }, + { + "epoch": 2.17, + "learning_rate": 5.2941115739677025e-05, + "loss": 1.4488, + "step": 27604 + }, + { + "epoch": 2.17, + "learning_rate": 5.2931692530417966e-05, + "loss": 1.4353, + "step": 27605 + }, + { + "epoch": 2.17, + "learning_rate": 5.2922269980199105e-05, + "loss": 1.4261, + "step": 27606 + }, + { + "epoch": 2.17, + "learning_rate": 5.291284808908452e-05, + "loss": 1.4965, + "step": 27607 + }, + { + "epoch": 2.17, + "learning_rate": 5.2903426857138054e-05, + "loss": 1.4453, + "step": 27608 + }, + { + "epoch": 2.17, + "learning_rate": 5.289400628442379e-05, + "loss": 1.4281, + "step": 27609 + }, + { + "epoch": 2.17, + "learning_rate": 5.288458637100564e-05, + "loss": 1.4662, + "step": 27610 + }, + { + "epoch": 2.17, + "learning_rate": 5.2875167116947516e-05, + "loss": 1.4321, + "step": 27611 + }, + { + "epoch": 2.17, + "learning_rate": 5.286574852231344e-05, + "loss": 1.4433, + "step": 27612 + }, + { + "epoch": 2.17, + "learning_rate": 5.285633058716733e-05, + "loss": 1.4317, + "step": 27613 + }, + { + "epoch": 2.17, + "learning_rate": 5.28469133115731e-05, + "loss": 1.4623, + "step": 27614 + }, + { + "epoch": 2.17, + "learning_rate": 5.283749669559474e-05, + "loss": 1.4589, + "step": 27615 + }, + { + "epoch": 2.17, + "learning_rate": 5.282808073929617e-05, + "loss": 1.5102, + "step": 27616 + }, + { + "epoch": 2.17, + "learning_rate": 5.2818665442741256e-05, + "loss": 1.4178, + "step": 27617 + }, + { + "epoch": 2.17, + "learning_rate": 5.2809250805994024e-05, + "loss": 1.407, + "step": 27618 + }, + { + "epoch": 2.17, + "learning_rate": 5.279983682911834e-05, + "loss": 1.4291, + "step": 27619 + }, + { + "epoch": 2.17, + "learning_rate": 5.2790423512178134e-05, + "loss": 1.4659, + "step": 27620 + }, + { + "epoch": 2.17, + "learning_rate": 5.2781010855237196e-05, + "loss": 1.4105, + "step": 27621 + }, + { + "epoch": 2.17, + "learning_rate": 5.277159885835965e-05, + "loss": 1.482, + "step": 27622 + }, + { + "epoch": 2.17, + "learning_rate": 5.27621875216093e-05, + "loss": 1.4794, + "step": 27623 + }, + { + "epoch": 2.17, + "learning_rate": 5.275277684505003e-05, + "loss": 1.4431, + "step": 27624 + }, + { + "epoch": 2.17, + "learning_rate": 5.274336682874568e-05, + "loss": 1.4757, + "step": 27625 + }, + { + "epoch": 2.17, + "learning_rate": 5.273395747276026e-05, + "loss": 1.4753, + "step": 27626 + }, + { + "epoch": 2.17, + "learning_rate": 5.272454877715759e-05, + "loss": 1.4287, + "step": 27627 + }, + { + "epoch": 2.17, + "learning_rate": 5.271514074200151e-05, + "loss": 1.4122, + "step": 27628 + }, + { + "epoch": 2.17, + "learning_rate": 5.2705733367355976e-05, + "loss": 1.4596, + "step": 27629 + }, + { + "epoch": 2.17, + "learning_rate": 5.269632665328483e-05, + "loss": 1.4581, + "step": 27630 + }, + { + "epoch": 2.17, + "learning_rate": 5.268692059985188e-05, + "loss": 1.4623, + "step": 27631 + }, + { + "epoch": 2.17, + "learning_rate": 5.267751520712108e-05, + "loss": 1.4574, + "step": 27632 + }, + { + "epoch": 2.17, + "learning_rate": 5.266811047515625e-05, + "loss": 1.4338, + "step": 27633 + }, + { + "epoch": 2.17, + "learning_rate": 5.265870640402119e-05, + "loss": 1.4219, + "step": 27634 + }, + { + "epoch": 2.17, + "learning_rate": 5.264930299377985e-05, + "loss": 1.5054, + "step": 27635 + }, + { + "epoch": 2.17, + "learning_rate": 5.2639900244496e-05, + "loss": 1.5123, + "step": 27636 + }, + { + "epoch": 2.17, + "learning_rate": 5.263049815623348e-05, + "loss": 1.4644, + "step": 27637 + }, + { + "epoch": 2.17, + "learning_rate": 5.262109672905612e-05, + "loss": 1.4973, + "step": 27638 + }, + { + "epoch": 2.17, + "learning_rate": 5.261169596302783e-05, + "loss": 1.4549, + "step": 27639 + }, + { + "epoch": 2.17, + "learning_rate": 5.260229585821239e-05, + "loss": 1.4811, + "step": 27640 + }, + { + "epoch": 2.17, + "learning_rate": 5.2592896414673604e-05, + "loss": 1.4159, + "step": 27641 + }, + { + "epoch": 2.17, + "learning_rate": 5.258349763247525e-05, + "loss": 1.4752, + "step": 27642 + }, + { + "epoch": 2.17, + "learning_rate": 5.257409951168124e-05, + "loss": 1.5128, + "step": 27643 + }, + { + "epoch": 2.18, + "learning_rate": 5.256470205235533e-05, + "loss": 1.3962, + "step": 27644 + }, + { + "epoch": 2.18, + "learning_rate": 5.2555305254561266e-05, + "loss": 1.4772, + "step": 27645 + }, + { + "epoch": 2.18, + "learning_rate": 5.254590911836296e-05, + "loss": 1.4691, + "step": 27646 + }, + { + "epoch": 2.18, + "learning_rate": 5.253651364382415e-05, + "loss": 1.5008, + "step": 27647 + }, + { + "epoch": 2.18, + "learning_rate": 5.2527118831008585e-05, + "loss": 1.4641, + "step": 27648 + }, + { + "epoch": 2.18, + "learning_rate": 5.2517724679980126e-05, + "loss": 1.4415, + "step": 27649 + }, + { + "epoch": 2.18, + "learning_rate": 5.2508331190802545e-05, + "loss": 1.4425, + "step": 27650 + }, + { + "epoch": 2.18, + "learning_rate": 5.249893836353953e-05, + "loss": 1.4503, + "step": 27651 + }, + { + "epoch": 2.18, + "learning_rate": 5.248954619825498e-05, + "loss": 1.4628, + "step": 27652 + }, + { + "epoch": 2.18, + "learning_rate": 5.248015469501253e-05, + "loss": 1.4062, + "step": 27653 + }, + { + "epoch": 2.18, + "learning_rate": 5.247076385387608e-05, + "loss": 1.4401, + "step": 27654 + }, + { + "epoch": 2.18, + "learning_rate": 5.246137367490927e-05, + "loss": 1.4362, + "step": 27655 + }, + { + "epoch": 2.18, + "learning_rate": 5.245198415817596e-05, + "loss": 1.4153, + "step": 27656 + }, + { + "epoch": 2.18, + "learning_rate": 5.244259530373983e-05, + "loss": 1.4375, + "step": 27657 + }, + { + "epoch": 2.18, + "learning_rate": 5.24332071116646e-05, + "loss": 1.4307, + "step": 27658 + }, + { + "epoch": 2.18, + "learning_rate": 5.242381958201411e-05, + "loss": 1.4616, + "step": 27659 + }, + { + "epoch": 2.18, + "learning_rate": 5.241443271485203e-05, + "loss": 1.48, + "step": 27660 + }, + { + "epoch": 2.18, + "learning_rate": 5.240504651024209e-05, + "loss": 1.4385, + "step": 27661 + }, + { + "epoch": 2.18, + "learning_rate": 5.2395660968248005e-05, + "loss": 1.451, + "step": 27662 + }, + { + "epoch": 2.18, + "learning_rate": 5.2386276088933545e-05, + "loss": 1.4887, + "step": 27663 + }, + { + "epoch": 2.18, + "learning_rate": 5.237689187236241e-05, + "loss": 1.4436, + "step": 27664 + }, + { + "epoch": 2.18, + "learning_rate": 5.236750831859825e-05, + "loss": 1.4729, + "step": 27665 + }, + { + "epoch": 2.18, + "learning_rate": 5.23581254277049e-05, + "loss": 1.4838, + "step": 27666 + }, + { + "epoch": 2.18, + "learning_rate": 5.2348743199745975e-05, + "loss": 1.513, + "step": 27667 + }, + { + "epoch": 2.18, + "learning_rate": 5.2339361634785155e-05, + "loss": 1.4655, + "step": 27668 + }, + { + "epoch": 2.18, + "learning_rate": 5.232998073288617e-05, + "loss": 1.4126, + "step": 27669 + }, + { + "epoch": 2.18, + "learning_rate": 5.232060049411278e-05, + "loss": 1.4288, + "step": 27670 + }, + { + "epoch": 2.18, + "learning_rate": 5.231122091852859e-05, + "loss": 1.4427, + "step": 27671 + }, + { + "epoch": 2.18, + "learning_rate": 5.230184200619727e-05, + "loss": 1.4581, + "step": 27672 + }, + { + "epoch": 2.18, + "learning_rate": 5.2292463757182565e-05, + "loss": 1.4542, + "step": 27673 + }, + { + "epoch": 2.18, + "learning_rate": 5.2283086171548115e-05, + "loss": 1.4963, + "step": 27674 + }, + { + "epoch": 2.18, + "learning_rate": 5.227370924935753e-05, + "loss": 1.4741, + "step": 27675 + }, + { + "epoch": 2.18, + "learning_rate": 5.226433299067458e-05, + "loss": 1.4762, + "step": 27676 + }, + { + "epoch": 2.18, + "learning_rate": 5.225495739556289e-05, + "loss": 1.4389, + "step": 27677 + }, + { + "epoch": 2.18, + "learning_rate": 5.224558246408608e-05, + "loss": 1.5038, + "step": 27678 + }, + { + "epoch": 2.18, + "learning_rate": 5.2236208196307775e-05, + "loss": 1.466, + "step": 27679 + }, + { + "epoch": 2.18, + "learning_rate": 5.2226834592291724e-05, + "loss": 1.4866, + "step": 27680 + }, + { + "epoch": 2.18, + "learning_rate": 5.22174616521015e-05, + "loss": 1.5459, + "step": 27681 + }, + { + "epoch": 2.18, + "learning_rate": 5.2208089375800705e-05, + "loss": 1.4999, + "step": 27682 + }, + { + "epoch": 2.18, + "learning_rate": 5.219871776345307e-05, + "loss": 1.4578, + "step": 27683 + }, + { + "epoch": 2.18, + "learning_rate": 5.2189346815122124e-05, + "loss": 1.4662, + "step": 27684 + }, + { + "epoch": 2.18, + "learning_rate": 5.217997653087157e-05, + "loss": 1.4823, + "step": 27685 + }, + { + "epoch": 2.18, + "learning_rate": 5.2170606910764954e-05, + "loss": 1.4267, + "step": 27686 + }, + { + "epoch": 2.18, + "learning_rate": 5.216123795486598e-05, + "loss": 1.4724, + "step": 27687 + }, + { + "epoch": 2.18, + "learning_rate": 5.215186966323821e-05, + "loss": 1.4899, + "step": 27688 + }, + { + "epoch": 2.18, + "learning_rate": 5.2142502035945195e-05, + "loss": 1.428, + "step": 27689 + }, + { + "epoch": 2.18, + "learning_rate": 5.213313507305065e-05, + "loss": 1.4193, + "step": 27690 + }, + { + "epoch": 2.18, + "learning_rate": 5.2123768774618105e-05, + "loss": 1.4726, + "step": 27691 + }, + { + "epoch": 2.18, + "learning_rate": 5.211440314071109e-05, + "loss": 1.451, + "step": 27692 + }, + { + "epoch": 2.18, + "learning_rate": 5.210503817139333e-05, + "loss": 1.4431, + "step": 27693 + }, + { + "epoch": 2.18, + "learning_rate": 5.2095673866728336e-05, + "loss": 1.4823, + "step": 27694 + }, + { + "epoch": 2.18, + "learning_rate": 5.208631022677968e-05, + "loss": 1.4634, + "step": 27695 + }, + { + "epoch": 2.18, + "learning_rate": 5.20769472516109e-05, + "loss": 1.4219, + "step": 27696 + }, + { + "epoch": 2.18, + "learning_rate": 5.206758494128566e-05, + "loss": 1.5075, + "step": 27697 + }, + { + "epoch": 2.18, + "learning_rate": 5.2058223295867475e-05, + "loss": 1.4414, + "step": 27698 + }, + { + "epoch": 2.18, + "learning_rate": 5.204886231541985e-05, + "loss": 1.4392, + "step": 27699 + }, + { + "epoch": 2.18, + "learning_rate": 5.20395020000064e-05, + "loss": 1.4694, + "step": 27700 + }, + { + "epoch": 2.18, + "learning_rate": 5.203014234969071e-05, + "loss": 1.4742, + "step": 27701 + }, + { + "epoch": 2.18, + "learning_rate": 5.20207833645363e-05, + "loss": 1.4623, + "step": 27702 + }, + { + "epoch": 2.18, + "learning_rate": 5.201142504460666e-05, + "loss": 1.4485, + "step": 27703 + }, + { + "epoch": 2.18, + "learning_rate": 5.20020673899654e-05, + "loss": 1.4727, + "step": 27704 + }, + { + "epoch": 2.18, + "learning_rate": 5.199271040067605e-05, + "loss": 1.4331, + "step": 27705 + }, + { + "epoch": 2.18, + "learning_rate": 5.198335407680203e-05, + "loss": 1.4327, + "step": 27706 + }, + { + "epoch": 2.18, + "learning_rate": 5.197399841840702e-05, + "loss": 1.4356, + "step": 27707 + }, + { + "epoch": 2.18, + "learning_rate": 5.1964643425554447e-05, + "loss": 1.4902, + "step": 27708 + }, + { + "epoch": 2.18, + "learning_rate": 5.195528909830781e-05, + "loss": 1.4518, + "step": 27709 + }, + { + "epoch": 2.18, + "learning_rate": 5.19459354367307e-05, + "loss": 1.5232, + "step": 27710 + }, + { + "epoch": 2.18, + "learning_rate": 5.193658244088658e-05, + "loss": 1.4425, + "step": 27711 + }, + { + "epoch": 2.18, + "learning_rate": 5.1927230110838884e-05, + "loss": 1.4312, + "step": 27712 + }, + { + "epoch": 2.18, + "learning_rate": 5.191787844665124e-05, + "loss": 1.4901, + "step": 27713 + }, + { + "epoch": 2.18, + "learning_rate": 5.1908527448387075e-05, + "loss": 1.4617, + "step": 27714 + }, + { + "epoch": 2.18, + "learning_rate": 5.189917711610988e-05, + "loss": 1.4726, + "step": 27715 + }, + { + "epoch": 2.18, + "learning_rate": 5.188982744988303e-05, + "loss": 1.452, + "step": 27716 + }, + { + "epoch": 2.18, + "learning_rate": 5.18804784497702e-05, + "loss": 1.4279, + "step": 27717 + }, + { + "epoch": 2.18, + "learning_rate": 5.187113011583479e-05, + "loss": 1.4469, + "step": 27718 + }, + { + "epoch": 2.18, + "learning_rate": 5.1861782448140246e-05, + "loss": 1.4399, + "step": 27719 + }, + { + "epoch": 2.18, + "learning_rate": 5.185243544675e-05, + "loss": 1.4738, + "step": 27720 + }, + { + "epoch": 2.18, + "learning_rate": 5.18430891117276e-05, + "loss": 1.4296, + "step": 27721 + }, + { + "epoch": 2.18, + "learning_rate": 5.1833743443136456e-05, + "loss": 1.4516, + "step": 27722 + }, + { + "epoch": 2.18, + "learning_rate": 5.182439844103997e-05, + "loss": 1.4424, + "step": 27723 + }, + { + "epoch": 2.18, + "learning_rate": 5.18150541055017e-05, + "loss": 1.4667, + "step": 27724 + }, + { + "epoch": 2.18, + "learning_rate": 5.180571043658501e-05, + "loss": 1.4443, + "step": 27725 + }, + { + "epoch": 2.18, + "learning_rate": 5.179636743435332e-05, + "loss": 1.4871, + "step": 27726 + }, + { + "epoch": 2.18, + "learning_rate": 5.1787025098870164e-05, + "loss": 1.5139, + "step": 27727 + }, + { + "epoch": 2.18, + "learning_rate": 5.177768343019888e-05, + "loss": 1.4379, + "step": 27728 + }, + { + "epoch": 2.18, + "learning_rate": 5.176834242840291e-05, + "loss": 1.4596, + "step": 27729 + }, + { + "epoch": 2.18, + "learning_rate": 5.1759002093545705e-05, + "loss": 1.4512, + "step": 27730 + }, + { + "epoch": 2.18, + "learning_rate": 5.174966242569062e-05, + "loss": 1.4246, + "step": 27731 + }, + { + "epoch": 2.18, + "learning_rate": 5.174032342490117e-05, + "loss": 1.4788, + "step": 27732 + }, + { + "epoch": 2.18, + "learning_rate": 5.173098509124064e-05, + "loss": 1.4471, + "step": 27733 + }, + { + "epoch": 2.18, + "learning_rate": 5.172164742477255e-05, + "loss": 1.4302, + "step": 27734 + }, + { + "epoch": 2.18, + "learning_rate": 5.171231042556023e-05, + "loss": 1.447, + "step": 27735 + }, + { + "epoch": 2.18, + "learning_rate": 5.170297409366709e-05, + "loss": 1.4785, + "step": 27736 + }, + { + "epoch": 2.18, + "learning_rate": 5.169363842915644e-05, + "loss": 1.4824, + "step": 27737 + }, + { + "epoch": 2.18, + "learning_rate": 5.168430343209181e-05, + "loss": 1.469, + "step": 27738 + }, + { + "epoch": 2.18, + "learning_rate": 5.1674969102536494e-05, + "loss": 1.4546, + "step": 27739 + }, + { + "epoch": 2.18, + "learning_rate": 5.166563544055383e-05, + "loss": 1.4133, + "step": 27740 + }, + { + "epoch": 2.18, + "learning_rate": 5.165630244620729e-05, + "loss": 1.4716, + "step": 27741 + }, + { + "epoch": 2.18, + "learning_rate": 5.164697011956018e-05, + "loss": 1.4701, + "step": 27742 + }, + { + "epoch": 2.18, + "learning_rate": 5.1637638460675815e-05, + "loss": 1.4541, + "step": 27743 + }, + { + "epoch": 2.18, + "learning_rate": 5.162830746961766e-05, + "loss": 1.4438, + "step": 27744 + }, + { + "epoch": 2.18, + "learning_rate": 5.1618977146449e-05, + "loss": 1.5184, + "step": 27745 + }, + { + "epoch": 2.18, + "learning_rate": 5.160964749123316e-05, + "loss": 1.4985, + "step": 27746 + }, + { + "epoch": 2.18, + "learning_rate": 5.1600318504033505e-05, + "loss": 1.3676, + "step": 27747 + }, + { + "epoch": 2.18, + "learning_rate": 5.159099018491344e-05, + "loss": 1.4896, + "step": 27748 + }, + { + "epoch": 2.18, + "learning_rate": 5.158166253393625e-05, + "loss": 1.4644, + "step": 27749 + }, + { + "epoch": 2.18, + "learning_rate": 5.157233555116521e-05, + "loss": 1.4595, + "step": 27750 + }, + { + "epoch": 2.18, + "learning_rate": 5.1563009236663735e-05, + "loss": 1.4255, + "step": 27751 + }, + { + "epoch": 2.18, + "learning_rate": 5.155368359049511e-05, + "loss": 1.4832, + "step": 27752 + }, + { + "epoch": 2.18, + "learning_rate": 5.154435861272264e-05, + "loss": 1.4875, + "step": 27753 + }, + { + "epoch": 2.18, + "learning_rate": 5.1535034303409614e-05, + "loss": 1.4609, + "step": 27754 + }, + { + "epoch": 2.18, + "learning_rate": 5.15257106626194e-05, + "loss": 1.4728, + "step": 27755 + }, + { + "epoch": 2.18, + "learning_rate": 5.151638769041526e-05, + "loss": 1.4643, + "step": 27756 + }, + { + "epoch": 2.18, + "learning_rate": 5.150706538686048e-05, + "loss": 1.4467, + "step": 27757 + }, + { + "epoch": 2.18, + "learning_rate": 5.1497743752018386e-05, + "loss": 1.4376, + "step": 27758 + }, + { + "epoch": 2.18, + "learning_rate": 5.148842278595229e-05, + "loss": 1.399, + "step": 27759 + }, + { + "epoch": 2.18, + "learning_rate": 5.147910248872535e-05, + "loss": 1.4039, + "step": 27760 + }, + { + "epoch": 2.18, + "learning_rate": 5.146978286040102e-05, + "loss": 1.4623, + "step": 27761 + }, + { + "epoch": 2.18, + "learning_rate": 5.1460463901042484e-05, + "loss": 1.4046, + "step": 27762 + }, + { + "epoch": 2.18, + "learning_rate": 5.145114561071295e-05, + "loss": 1.4393, + "step": 27763 + }, + { + "epoch": 2.18, + "learning_rate": 5.144182798947578e-05, + "loss": 1.5334, + "step": 27764 + }, + { + "epoch": 2.18, + "learning_rate": 5.1432511037394244e-05, + "loss": 1.4064, + "step": 27765 + }, + { + "epoch": 2.18, + "learning_rate": 5.1423194754531565e-05, + "loss": 1.4187, + "step": 27766 + }, + { + "epoch": 2.18, + "learning_rate": 5.141387914095095e-05, + "loss": 1.4536, + "step": 27767 + }, + { + "epoch": 2.18, + "learning_rate": 5.140456419671574e-05, + "loss": 1.4904, + "step": 27768 + }, + { + "epoch": 2.18, + "learning_rate": 5.139524992188913e-05, + "loss": 1.4809, + "step": 27769 + }, + { + "epoch": 2.18, + "learning_rate": 5.1385936316534305e-05, + "loss": 1.4276, + "step": 27770 + }, + { + "epoch": 2.19, + "learning_rate": 5.1376623380714606e-05, + "loss": 1.4188, + "step": 27771 + }, + { + "epoch": 2.19, + "learning_rate": 5.1367311114493195e-05, + "loss": 1.4623, + "step": 27772 + }, + { + "epoch": 2.19, + "learning_rate": 5.1357999517933335e-05, + "loss": 1.4744, + "step": 27773 + }, + { + "epoch": 2.19, + "learning_rate": 5.1348688591098147e-05, + "loss": 1.4458, + "step": 27774 + }, + { + "epoch": 2.19, + "learning_rate": 5.1339378334051e-05, + "loss": 1.4368, + "step": 27775 + }, + { + "epoch": 2.19, + "learning_rate": 5.1330068746855015e-05, + "loss": 1.4673, + "step": 27776 + }, + { + "epoch": 2.19, + "learning_rate": 5.132075982957337e-05, + "loss": 1.4096, + "step": 27777 + }, + { + "epoch": 2.19, + "learning_rate": 5.1311451582269344e-05, + "loss": 1.4511, + "step": 27778 + }, + { + "epoch": 2.19, + "learning_rate": 5.130214400500606e-05, + "loss": 1.4302, + "step": 27779 + }, + { + "epoch": 2.19, + "learning_rate": 5.129283709784681e-05, + "loss": 1.4507, + "step": 27780 + }, + { + "epoch": 2.19, + "learning_rate": 5.1283530860854655e-05, + "loss": 1.4633, + "step": 27781 + }, + { + "epoch": 2.19, + "learning_rate": 5.127422529409292e-05, + "loss": 1.4984, + "step": 27782 + }, + { + "epoch": 2.19, + "learning_rate": 5.12649203976247e-05, + "loss": 1.3867, + "step": 27783 + }, + { + "epoch": 2.19, + "learning_rate": 5.125561617151314e-05, + "loss": 1.507, + "step": 27784 + }, + { + "epoch": 2.19, + "learning_rate": 5.124631261582152e-05, + "loss": 1.494, + "step": 27785 + }, + { + "epoch": 2.19, + "learning_rate": 5.123700973061291e-05, + "loss": 1.4224, + "step": 27786 + }, + { + "epoch": 2.19, + "learning_rate": 5.122770751595047e-05, + "loss": 1.4046, + "step": 27787 + }, + { + "epoch": 2.19, + "learning_rate": 5.121840597189743e-05, + "loss": 1.4673, + "step": 27788 + }, + { + "epoch": 2.19, + "learning_rate": 5.1209105098516916e-05, + "loss": 1.4744, + "step": 27789 + }, + { + "epoch": 2.19, + "learning_rate": 5.119980489587205e-05, + "loss": 1.4598, + "step": 27790 + }, + { + "epoch": 2.19, + "learning_rate": 5.1190505364025946e-05, + "loss": 1.4553, + "step": 27791 + }, + { + "epoch": 2.19, + "learning_rate": 5.118120650304183e-05, + "loss": 1.5134, + "step": 27792 + }, + { + "epoch": 2.19, + "learning_rate": 5.117190831298277e-05, + "loss": 1.4295, + "step": 27793 + }, + { + "epoch": 2.19, + "learning_rate": 5.1162610793911884e-05, + "loss": 1.4362, + "step": 27794 + }, + { + "epoch": 2.19, + "learning_rate": 5.115331394589233e-05, + "loss": 1.4445, + "step": 27795 + }, + { + "epoch": 2.19, + "learning_rate": 5.114401776898727e-05, + "loss": 1.4254, + "step": 27796 + }, + { + "epoch": 2.19, + "learning_rate": 5.113472226325977e-05, + "loss": 1.4709, + "step": 27797 + }, + { + "epoch": 2.19, + "learning_rate": 5.11254274287729e-05, + "loss": 1.4383, + "step": 27798 + }, + { + "epoch": 2.19, + "learning_rate": 5.1116133265589864e-05, + "loss": 1.4875, + "step": 27799 + }, + { + "epoch": 2.19, + "learning_rate": 5.110683977377372e-05, + "loss": 1.4018, + "step": 27800 + }, + { + "epoch": 2.19, + "learning_rate": 5.109754695338751e-05, + "loss": 1.5055, + "step": 27801 + }, + { + "epoch": 2.19, + "learning_rate": 5.108825480449442e-05, + "loss": 1.4028, + "step": 27802 + }, + { + "epoch": 2.19, + "learning_rate": 5.107896332715751e-05, + "loss": 1.4849, + "step": 27803 + }, + { + "epoch": 2.19, + "learning_rate": 5.10696725214398e-05, + "loss": 1.4359, + "step": 27804 + }, + { + "epoch": 2.19, + "learning_rate": 5.106038238740446e-05, + "loss": 1.4408, + "step": 27805 + }, + { + "epoch": 2.19, + "learning_rate": 5.105109292511451e-05, + "loss": 1.464, + "step": 27806 + }, + { + "epoch": 2.19, + "learning_rate": 5.1041804134633055e-05, + "loss": 1.4176, + "step": 27807 + }, + { + "epoch": 2.19, + "learning_rate": 5.103251601602308e-05, + "loss": 1.489, + "step": 27808 + }, + { + "epoch": 2.19, + "learning_rate": 5.102322856934777e-05, + "loss": 1.4677, + "step": 27809 + }, + { + "epoch": 2.19, + "learning_rate": 5.1013941794670063e-05, + "loss": 1.4712, + "step": 27810 + }, + { + "epoch": 2.19, + "learning_rate": 5.100465569205306e-05, + "loss": 1.4269, + "step": 27811 + }, + { + "epoch": 2.19, + "learning_rate": 5.099537026155985e-05, + "loss": 1.418, + "step": 27812 + }, + { + "epoch": 2.19, + "learning_rate": 5.098608550325346e-05, + "loss": 1.472, + "step": 27813 + }, + { + "epoch": 2.19, + "learning_rate": 5.097680141719692e-05, + "loss": 1.4933, + "step": 27814 + }, + { + "epoch": 2.19, + "learning_rate": 5.096751800345319e-05, + "loss": 1.431, + "step": 27815 + }, + { + "epoch": 2.19, + "learning_rate": 5.095823526208541e-05, + "loss": 1.4859, + "step": 27816 + }, + { + "epoch": 2.19, + "learning_rate": 5.0948953193156554e-05, + "loss": 1.4167, + "step": 27817 + }, + { + "epoch": 2.19, + "learning_rate": 5.09396717967296e-05, + "loss": 1.4347, + "step": 27818 + }, + { + "epoch": 2.19, + "learning_rate": 5.0930391072867654e-05, + "loss": 1.4064, + "step": 27819 + }, + { + "epoch": 2.19, + "learning_rate": 5.0921111021633695e-05, + "loss": 1.4878, + "step": 27820 + }, + { + "epoch": 2.19, + "learning_rate": 5.091183164309065e-05, + "loss": 1.4083, + "step": 27821 + }, + { + "epoch": 2.19, + "learning_rate": 5.0902552937301646e-05, + "loss": 1.4486, + "step": 27822 + }, + { + "epoch": 2.19, + "learning_rate": 5.089327490432961e-05, + "loss": 1.4661, + "step": 27823 + }, + { + "epoch": 2.19, + "learning_rate": 5.08839975442375e-05, + "loss": 1.4436, + "step": 27824 + }, + { + "epoch": 2.19, + "learning_rate": 5.087472085708842e-05, + "loss": 1.4709, + "step": 27825 + }, + { + "epoch": 2.19, + "learning_rate": 5.08654448429452e-05, + "loss": 1.4499, + "step": 27826 + }, + { + "epoch": 2.19, + "learning_rate": 5.085616950187098e-05, + "loss": 1.4325, + "step": 27827 + }, + { + "epoch": 2.19, + "learning_rate": 5.08468948339286e-05, + "loss": 1.4007, + "step": 27828 + }, + { + "epoch": 2.19, + "learning_rate": 5.083762083918114e-05, + "loss": 1.4655, + "step": 27829 + }, + { + "epoch": 2.19, + "learning_rate": 5.0828347517691505e-05, + "loss": 1.4389, + "step": 27830 + }, + { + "epoch": 2.19, + "learning_rate": 5.081907486952265e-05, + "loss": 1.4688, + "step": 27831 + }, + { + "epoch": 2.19, + "learning_rate": 5.080980289473752e-05, + "loss": 1.4344, + "step": 27832 + }, + { + "epoch": 2.19, + "learning_rate": 5.080053159339911e-05, + "loss": 1.446, + "step": 27833 + }, + { + "epoch": 2.19, + "learning_rate": 5.079126096557038e-05, + "loss": 1.4709, + "step": 27834 + }, + { + "epoch": 2.19, + "learning_rate": 5.078199101131416e-05, + "loss": 1.4605, + "step": 27835 + }, + { + "epoch": 2.19, + "learning_rate": 5.0772721730693555e-05, + "loss": 1.4707, + "step": 27836 + }, + { + "epoch": 2.19, + "learning_rate": 5.0763453123771376e-05, + "loss": 1.5137, + "step": 27837 + }, + { + "epoch": 2.19, + "learning_rate": 5.075418519061056e-05, + "loss": 1.458, + "step": 27838 + }, + { + "epoch": 2.19, + "learning_rate": 5.07449179312741e-05, + "loss": 1.479, + "step": 27839 + }, + { + "epoch": 2.19, + "learning_rate": 5.073565134582488e-05, + "loss": 1.4208, + "step": 27840 + }, + { + "epoch": 2.19, + "learning_rate": 5.072638543432575e-05, + "loss": 1.4854, + "step": 27841 + }, + { + "epoch": 2.19, + "learning_rate": 5.071712019683969e-05, + "loss": 1.4285, + "step": 27842 + }, + { + "epoch": 2.19, + "learning_rate": 5.070785563342963e-05, + "loss": 1.435, + "step": 27843 + }, + { + "epoch": 2.19, + "learning_rate": 5.0698591744158436e-05, + "loss": 1.4455, + "step": 27844 + }, + { + "epoch": 2.19, + "learning_rate": 5.0689328529088965e-05, + "loss": 1.4568, + "step": 27845 + }, + { + "epoch": 2.19, + "learning_rate": 5.0680065988284196e-05, + "loss": 1.4387, + "step": 27846 + }, + { + "epoch": 2.19, + "learning_rate": 5.067080412180697e-05, + "loss": 1.4497, + "step": 27847 + }, + { + "epoch": 2.19, + "learning_rate": 5.0661542929720166e-05, + "loss": 1.4513, + "step": 27848 + }, + { + "epoch": 2.19, + "learning_rate": 5.0652282412086625e-05, + "loss": 1.4392, + "step": 27849 + }, + { + "epoch": 2.19, + "learning_rate": 5.064302256896929e-05, + "loss": 1.5183, + "step": 27850 + }, + { + "epoch": 2.19, + "learning_rate": 5.063376340043102e-05, + "loss": 1.3761, + "step": 27851 + }, + { + "epoch": 2.19, + "learning_rate": 5.062450490653463e-05, + "loss": 1.4755, + "step": 27852 + }, + { + "epoch": 2.19, + "learning_rate": 5.0615247087343034e-05, + "loss": 1.4388, + "step": 27853 + }, + { + "epoch": 2.19, + "learning_rate": 5.0605989942919075e-05, + "loss": 1.443, + "step": 27854 + }, + { + "epoch": 2.19, + "learning_rate": 5.0596733473325534e-05, + "loss": 1.4785, + "step": 27855 + }, + { + "epoch": 2.19, + "learning_rate": 5.058747767862537e-05, + "loss": 1.4355, + "step": 27856 + }, + { + "epoch": 2.19, + "learning_rate": 5.0578222558881334e-05, + "loss": 1.4392, + "step": 27857 + }, + { + "epoch": 2.19, + "learning_rate": 5.056896811415635e-05, + "loss": 1.4313, + "step": 27858 + }, + { + "epoch": 2.19, + "learning_rate": 5.055971434451314e-05, + "loss": 1.3836, + "step": 27859 + }, + { + "epoch": 2.19, + "learning_rate": 5.055046125001466e-05, + "loss": 1.4552, + "step": 27860 + }, + { + "epoch": 2.19, + "learning_rate": 5.0541208830723645e-05, + "loss": 1.4141, + "step": 27861 + }, + { + "epoch": 2.19, + "learning_rate": 5.053195708670291e-05, + "loss": 1.4257, + "step": 27862 + }, + { + "epoch": 2.19, + "learning_rate": 5.0522706018015327e-05, + "loss": 1.4328, + "step": 27863 + }, + { + "epoch": 2.19, + "learning_rate": 5.051345562472368e-05, + "loss": 1.3691, + "step": 27864 + }, + { + "epoch": 2.19, + "learning_rate": 5.050420590689078e-05, + "loss": 1.5239, + "step": 27865 + }, + { + "epoch": 2.19, + "learning_rate": 5.0494956864579346e-05, + "loss": 1.4071, + "step": 27866 + }, + { + "epoch": 2.19, + "learning_rate": 5.04857084978523e-05, + "loss": 1.4928, + "step": 27867 + }, + { + "epoch": 2.19, + "learning_rate": 5.0476460806772395e-05, + "loss": 1.4379, + "step": 27868 + }, + { + "epoch": 2.19, + "learning_rate": 5.046721379140233e-05, + "loss": 1.4247, + "step": 27869 + }, + { + "epoch": 2.19, + "learning_rate": 5.0457967451805016e-05, + "loss": 1.4525, + "step": 27870 + }, + { + "epoch": 2.19, + "learning_rate": 5.0448721788043155e-05, + "loss": 1.4298, + "step": 27871 + }, + { + "epoch": 2.19, + "learning_rate": 5.04394768001795e-05, + "loss": 1.4565, + "step": 27872 + }, + { + "epoch": 2.19, + "learning_rate": 5.043023248827685e-05, + "loss": 1.4714, + "step": 27873 + }, + { + "epoch": 2.19, + "learning_rate": 5.042098885239804e-05, + "loss": 1.4496, + "step": 27874 + }, + { + "epoch": 2.19, + "learning_rate": 5.0411745892605746e-05, + "loss": 1.4032, + "step": 27875 + }, + { + "epoch": 2.19, + "learning_rate": 5.040250360896269e-05, + "loss": 1.4723, + "step": 27876 + }, + { + "epoch": 2.19, + "learning_rate": 5.0393262001531734e-05, + "loss": 1.4765, + "step": 27877 + }, + { + "epoch": 2.19, + "learning_rate": 5.0384021070375544e-05, + "loss": 1.4756, + "step": 27878 + }, + { + "epoch": 2.19, + "learning_rate": 5.037478081555683e-05, + "loss": 1.4415, + "step": 27879 + }, + { + "epoch": 2.19, + "learning_rate": 5.036554123713844e-05, + "loss": 1.3896, + "step": 27880 + }, + { + "epoch": 2.19, + "learning_rate": 5.035630233518304e-05, + "loss": 1.4712, + "step": 27881 + }, + { + "epoch": 2.19, + "learning_rate": 5.03470641097533e-05, + "loss": 1.4, + "step": 27882 + }, + { + "epoch": 2.19, + "learning_rate": 5.033782656091206e-05, + "loss": 1.5031, + "step": 27883 + }, + { + "epoch": 2.19, + "learning_rate": 5.032858968872199e-05, + "loss": 1.4282, + "step": 27884 + }, + { + "epoch": 2.19, + "learning_rate": 5.031935349324577e-05, + "loss": 1.4457, + "step": 27885 + }, + { + "epoch": 2.19, + "learning_rate": 5.03101179745461e-05, + "loss": 1.4613, + "step": 27886 + }, + { + "epoch": 2.19, + "learning_rate": 5.030088313268575e-05, + "loss": 1.4634, + "step": 27887 + }, + { + "epoch": 2.19, + "learning_rate": 5.029164896772738e-05, + "loss": 1.4419, + "step": 27888 + }, + { + "epoch": 2.19, + "learning_rate": 5.028241547973367e-05, + "loss": 1.4775, + "step": 27889 + }, + { + "epoch": 2.19, + "learning_rate": 5.0273182668767304e-05, + "loss": 1.4336, + "step": 27890 + }, + { + "epoch": 2.19, + "learning_rate": 5.0263950534891055e-05, + "loss": 1.4292, + "step": 27891 + }, + { + "epoch": 2.19, + "learning_rate": 5.0254719078167545e-05, + "loss": 1.4602, + "step": 27892 + }, + { + "epoch": 2.19, + "learning_rate": 5.024548829865938e-05, + "loss": 1.373, + "step": 27893 + }, + { + "epoch": 2.19, + "learning_rate": 5.023625819642937e-05, + "loss": 1.4195, + "step": 27894 + }, + { + "epoch": 2.19, + "learning_rate": 5.022702877154011e-05, + "loss": 1.4833, + "step": 27895 + }, + { + "epoch": 2.19, + "learning_rate": 5.021780002405421e-05, + "loss": 1.4985, + "step": 27896 + }, + { + "epoch": 2.19, + "learning_rate": 5.020857195403443e-05, + "loss": 1.458, + "step": 27897 + }, + { + "epoch": 2.2, + "learning_rate": 5.0199344561543385e-05, + "loss": 1.4595, + "step": 27898 + }, + { + "epoch": 2.2, + "learning_rate": 5.019011784664366e-05, + "loss": 1.4585, + "step": 27899 + }, + { + "epoch": 2.2, + "learning_rate": 5.018089180939801e-05, + "loss": 1.4827, + "step": 27900 + }, + { + "epoch": 2.2, + "learning_rate": 5.017166644986902e-05, + "loss": 1.4556, + "step": 27901 + }, + { + "epoch": 2.2, + "learning_rate": 5.016244176811932e-05, + "loss": 1.4789, + "step": 27902 + }, + { + "epoch": 2.2, + "learning_rate": 5.01532177642115e-05, + "loss": 1.3989, + "step": 27903 + }, + { + "epoch": 2.2, + "learning_rate": 5.0143994438208236e-05, + "loss": 1.4385, + "step": 27904 + }, + { + "epoch": 2.2, + "learning_rate": 5.013477179017218e-05, + "loss": 1.4706, + "step": 27905 + }, + { + "epoch": 2.2, + "learning_rate": 5.0125549820165916e-05, + "loss": 1.4706, + "step": 27906 + }, + { + "epoch": 2.2, + "learning_rate": 5.011632852825201e-05, + "loss": 1.4772, + "step": 27907 + }, + { + "epoch": 2.2, + "learning_rate": 5.010710791449318e-05, + "loss": 1.4653, + "step": 27908 + }, + { + "epoch": 2.2, + "learning_rate": 5.009788797895194e-05, + "loss": 1.4883, + "step": 27909 + }, + { + "epoch": 2.2, + "learning_rate": 5.008866872169087e-05, + "loss": 1.4753, + "step": 27910 + }, + { + "epoch": 2.2, + "learning_rate": 5.0079450142772645e-05, + "loss": 1.4263, + "step": 27911 + }, + { + "epoch": 2.2, + "learning_rate": 5.00702322422598e-05, + "loss": 1.3759, + "step": 27912 + }, + { + "epoch": 2.2, + "learning_rate": 5.0061015020214904e-05, + "loss": 1.5047, + "step": 27913 + }, + { + "epoch": 2.2, + "learning_rate": 5.005179847670061e-05, + "loss": 1.4721, + "step": 27914 + }, + { + "epoch": 2.2, + "learning_rate": 5.0042582611779445e-05, + "loss": 1.477, + "step": 27915 + }, + { + "epoch": 2.2, + "learning_rate": 5.003336742551393e-05, + "loss": 1.457, + "step": 27916 + }, + { + "epoch": 2.2, + "learning_rate": 5.002415291796675e-05, + "loss": 1.4027, + "step": 27917 + }, + { + "epoch": 2.2, + "learning_rate": 5.00149390892004e-05, + "loss": 1.4846, + "step": 27918 + }, + { + "epoch": 2.2, + "learning_rate": 5.0005725939277407e-05, + "loss": 1.5141, + "step": 27919 + }, + { + "epoch": 2.2, + "learning_rate": 4.999651346826029e-05, + "loss": 1.4485, + "step": 27920 + }, + { + "epoch": 2.2, + "learning_rate": 4.998730167621173e-05, + "loss": 1.5029, + "step": 27921 + }, + { + "epoch": 2.2, + "learning_rate": 4.997809056319422e-05, + "loss": 1.4695, + "step": 27922 + }, + { + "epoch": 2.2, + "learning_rate": 4.9968880129270225e-05, + "loss": 1.4936, + "step": 27923 + }, + { + "epoch": 2.2, + "learning_rate": 4.995967037450238e-05, + "loss": 1.416, + "step": 27924 + }, + { + "epoch": 2.2, + "learning_rate": 4.995046129895316e-05, + "loss": 1.4916, + "step": 27925 + }, + { + "epoch": 2.2, + "learning_rate": 4.994125290268511e-05, + "loss": 1.515, + "step": 27926 + }, + { + "epoch": 2.2, + "learning_rate": 4.9932045185760673e-05, + "loss": 1.4071, + "step": 27927 + }, + { + "epoch": 2.2, + "learning_rate": 4.992283814824248e-05, + "loss": 1.4286, + "step": 27928 + }, + { + "epoch": 2.2, + "learning_rate": 4.991363179019299e-05, + "loss": 1.4352, + "step": 27929 + }, + { + "epoch": 2.2, + "learning_rate": 4.990442611167465e-05, + "loss": 1.5264, + "step": 27930 + }, + { + "epoch": 2.2, + "learning_rate": 4.989522111275009e-05, + "loss": 1.4908, + "step": 27931 + }, + { + "epoch": 2.2, + "learning_rate": 4.988601679348173e-05, + "loss": 1.4235, + "step": 27932 + }, + { + "epoch": 2.2, + "learning_rate": 4.9876813153931994e-05, + "loss": 1.4379, + "step": 27933 + }, + { + "epoch": 2.2, + "learning_rate": 4.9867610194163524e-05, + "loss": 1.5151, + "step": 27934 + }, + { + "epoch": 2.2, + "learning_rate": 4.9858407914238706e-05, + "loss": 1.4836, + "step": 27935 + }, + { + "epoch": 2.2, + "learning_rate": 4.9849206314219984e-05, + "loss": 1.4528, + "step": 27936 + }, + { + "epoch": 2.2, + "learning_rate": 4.9840005394169897e-05, + "loss": 1.461, + "step": 27937 + }, + { + "epoch": 2.2, + "learning_rate": 4.9830805154150955e-05, + "loss": 1.4215, + "step": 27938 + }, + { + "epoch": 2.2, + "learning_rate": 4.982160559422555e-05, + "loss": 1.47, + "step": 27939 + }, + { + "epoch": 2.2, + "learning_rate": 4.981240671445612e-05, + "loss": 1.4645, + "step": 27940 + }, + { + "epoch": 2.2, + "learning_rate": 4.98032085149052e-05, + "loss": 1.4642, + "step": 27941 + }, + { + "epoch": 2.2, + "learning_rate": 4.979401099563522e-05, + "loss": 1.4667, + "step": 27942 + }, + { + "epoch": 2.2, + "learning_rate": 4.9784814156708586e-05, + "loss": 1.4493, + "step": 27943 + }, + { + "epoch": 2.2, + "learning_rate": 4.9775617998187716e-05, + "loss": 1.4741, + "step": 27944 + }, + { + "epoch": 2.2, + "learning_rate": 4.976642252013515e-05, + "loss": 1.4536, + "step": 27945 + }, + { + "epoch": 2.2, + "learning_rate": 4.975722772261326e-05, + "loss": 1.4898, + "step": 27946 + }, + { + "epoch": 2.2, + "learning_rate": 4.9748033605684416e-05, + "loss": 1.3754, + "step": 27947 + }, + { + "epoch": 2.2, + "learning_rate": 4.973884016941116e-05, + "loss": 1.4409, + "step": 27948 + }, + { + "epoch": 2.2, + "learning_rate": 4.972964741385585e-05, + "loss": 1.4417, + "step": 27949 + }, + { + "epoch": 2.2, + "learning_rate": 4.972045533908086e-05, + "loss": 1.4638, + "step": 27950 + }, + { + "epoch": 2.2, + "learning_rate": 4.971126394514861e-05, + "loss": 1.4803, + "step": 27951 + }, + { + "epoch": 2.2, + "learning_rate": 4.970207323212161e-05, + "loss": 1.4429, + "step": 27952 + }, + { + "epoch": 2.2, + "learning_rate": 4.969288320006217e-05, + "loss": 1.5004, + "step": 27953 + }, + { + "epoch": 2.2, + "learning_rate": 4.968369384903265e-05, + "loss": 1.4608, + "step": 27954 + }, + { + "epoch": 2.2, + "learning_rate": 4.9674505179095556e-05, + "loss": 1.45, + "step": 27955 + }, + { + "epoch": 2.2, + "learning_rate": 4.9665317190313186e-05, + "loss": 1.4734, + "step": 27956 + }, + { + "epoch": 2.2, + "learning_rate": 4.96561298827479e-05, + "loss": 1.4909, + "step": 27957 + }, + { + "epoch": 2.2, + "learning_rate": 4.964694325646217e-05, + "loss": 1.4622, + "step": 27958 + }, + { + "epoch": 2.2, + "learning_rate": 4.963775731151832e-05, + "loss": 1.4851, + "step": 27959 + }, + { + "epoch": 2.2, + "learning_rate": 4.9628572047978715e-05, + "loss": 1.4281, + "step": 27960 + }, + { + "epoch": 2.2, + "learning_rate": 4.961938746590565e-05, + "loss": 1.4883, + "step": 27961 + }, + { + "epoch": 2.2, + "learning_rate": 4.961020356536161e-05, + "loss": 1.4298, + "step": 27962 + }, + { + "epoch": 2.2, + "learning_rate": 4.960102034640889e-05, + "loss": 1.4756, + "step": 27963 + }, + { + "epoch": 2.2, + "learning_rate": 4.9591837809109794e-05, + "loss": 1.5244, + "step": 27964 + }, + { + "epoch": 2.2, + "learning_rate": 4.958265595352674e-05, + "loss": 1.4688, + "step": 27965 + }, + { + "epoch": 2.2, + "learning_rate": 4.9573474779722056e-05, + "loss": 1.4641, + "step": 27966 + }, + { + "epoch": 2.2, + "learning_rate": 4.956429428775799e-05, + "loss": 1.4226, + "step": 27967 + }, + { + "epoch": 2.2, + "learning_rate": 4.955511447769696e-05, + "loss": 1.4619, + "step": 27968 + }, + { + "epoch": 2.2, + "learning_rate": 4.954593534960131e-05, + "loss": 1.4902, + "step": 27969 + }, + { + "epoch": 2.2, + "learning_rate": 4.953675690353333e-05, + "loss": 1.4607, + "step": 27970 + }, + { + "epoch": 2.2, + "learning_rate": 4.952757913955528e-05, + "loss": 1.4146, + "step": 27971 + }, + { + "epoch": 2.2, + "learning_rate": 4.951840205772957e-05, + "loss": 1.4271, + "step": 27972 + }, + { + "epoch": 2.2, + "learning_rate": 4.9509225658118456e-05, + "loss": 1.4947, + "step": 27973 + }, + { + "epoch": 2.2, + "learning_rate": 4.95000499407842e-05, + "loss": 1.4699, + "step": 27974 + }, + { + "epoch": 2.2, + "learning_rate": 4.949087490578919e-05, + "loss": 1.4431, + "step": 27975 + }, + { + "epoch": 2.2, + "learning_rate": 4.948170055319567e-05, + "loss": 1.4664, + "step": 27976 + }, + { + "epoch": 2.2, + "learning_rate": 4.947252688306595e-05, + "loss": 1.474, + "step": 27977 + }, + { + "epoch": 2.2, + "learning_rate": 4.9463353895462235e-05, + "loss": 1.4223, + "step": 27978 + }, + { + "epoch": 2.2, + "learning_rate": 4.9454181590446914e-05, + "loss": 1.5026, + "step": 27979 + }, + { + "epoch": 2.2, + "learning_rate": 4.944500996808222e-05, + "loss": 1.4591, + "step": 27980 + }, + { + "epoch": 2.2, + "learning_rate": 4.943583902843036e-05, + "loss": 1.4784, + "step": 27981 + }, + { + "epoch": 2.2, + "learning_rate": 4.9426668771553704e-05, + "loss": 1.4172, + "step": 27982 + }, + { + "epoch": 2.2, + "learning_rate": 4.941749919751444e-05, + "loss": 1.4211, + "step": 27983 + }, + { + "epoch": 2.2, + "learning_rate": 4.9408330306374874e-05, + "loss": 1.4409, + "step": 27984 + }, + { + "epoch": 2.2, + "learning_rate": 4.939916209819719e-05, + "loss": 1.4276, + "step": 27985 + }, + { + "epoch": 2.2, + "learning_rate": 4.938999457304375e-05, + "loss": 1.3878, + "step": 27986 + }, + { + "epoch": 2.2, + "learning_rate": 4.9380827730976695e-05, + "loss": 1.4321, + "step": 27987 + }, + { + "epoch": 2.2, + "learning_rate": 4.9371661572058263e-05, + "loss": 1.4748, + "step": 27988 + }, + { + "epoch": 2.2, + "learning_rate": 4.9362496096350766e-05, + "loss": 1.4177, + "step": 27989 + }, + { + "epoch": 2.2, + "learning_rate": 4.9353331303916376e-05, + "loss": 1.4492, + "step": 27990 + }, + { + "epoch": 2.2, + "learning_rate": 4.934416719481729e-05, + "loss": 1.4296, + "step": 27991 + }, + { + "epoch": 2.2, + "learning_rate": 4.933500376911579e-05, + "loss": 1.455, + "step": 27992 + }, + { + "epoch": 2.2, + "learning_rate": 4.9325841026874085e-05, + "loss": 1.4902, + "step": 27993 + }, + { + "epoch": 2.2, + "learning_rate": 4.9316678968154296e-05, + "loss": 1.4936, + "step": 27994 + }, + { + "epoch": 2.2, + "learning_rate": 4.930751759301875e-05, + "loss": 1.4709, + "step": 27995 + }, + { + "epoch": 2.2, + "learning_rate": 4.929835690152959e-05, + "loss": 1.4598, + "step": 27996 + }, + { + "epoch": 2.2, + "learning_rate": 4.928919689374903e-05, + "loss": 1.5004, + "step": 27997 + }, + { + "epoch": 2.2, + "learning_rate": 4.9280037569739186e-05, + "loss": 1.4492, + "step": 27998 + }, + { + "epoch": 2.2, + "learning_rate": 4.927087892956231e-05, + "loss": 1.4401, + "step": 27999 + }, + { + "epoch": 2.2, + "learning_rate": 4.926172097328062e-05, + "loss": 1.4432, + "step": 28000 + }, + { + "epoch": 2.2, + "learning_rate": 4.925256370095626e-05, + "loss": 1.4244, + "step": 28001 + }, + { + "epoch": 2.2, + "learning_rate": 4.9243407112651346e-05, + "loss": 1.4528, + "step": 28002 + }, + { + "epoch": 2.2, + "learning_rate": 4.923425120842814e-05, + "loss": 1.4602, + "step": 28003 + }, + { + "epoch": 2.2, + "learning_rate": 4.922509598834876e-05, + "loss": 1.4916, + "step": 28004 + }, + { + "epoch": 2.2, + "learning_rate": 4.9215941452475313e-05, + "loss": 1.4671, + "step": 28005 + }, + { + "epoch": 2.2, + "learning_rate": 4.920678760087007e-05, + "loss": 1.465, + "step": 28006 + }, + { + "epoch": 2.2, + "learning_rate": 4.919763443359511e-05, + "loss": 1.4664, + "step": 28007 + }, + { + "epoch": 2.2, + "learning_rate": 4.918848195071253e-05, + "loss": 1.482, + "step": 28008 + }, + { + "epoch": 2.2, + "learning_rate": 4.917933015228458e-05, + "loss": 1.4122, + "step": 28009 + }, + { + "epoch": 2.2, + "learning_rate": 4.917017903837334e-05, + "loss": 1.4794, + "step": 28010 + }, + { + "epoch": 2.2, + "learning_rate": 4.916102860904089e-05, + "loss": 1.4807, + "step": 28011 + }, + { + "epoch": 2.2, + "learning_rate": 4.9151878864349464e-05, + "loss": 1.4032, + "step": 28012 + }, + { + "epoch": 2.2, + "learning_rate": 4.914272980436112e-05, + "loss": 1.4704, + "step": 28013 + }, + { + "epoch": 2.2, + "learning_rate": 4.9133581429137935e-05, + "loss": 1.4318, + "step": 28014 + }, + { + "epoch": 2.2, + "learning_rate": 4.912443373874208e-05, + "loss": 1.4459, + "step": 28015 + }, + { + "epoch": 2.2, + "learning_rate": 4.9115286733235686e-05, + "loss": 1.5126, + "step": 28016 + }, + { + "epoch": 2.2, + "learning_rate": 4.910614041268084e-05, + "loss": 1.461, + "step": 28017 + }, + { + "epoch": 2.2, + "learning_rate": 4.90969947771396e-05, + "loss": 1.4801, + "step": 28018 + }, + { + "epoch": 2.2, + "learning_rate": 4.9087849826674045e-05, + "loss": 1.4356, + "step": 28019 + }, + { + "epoch": 2.2, + "learning_rate": 4.9078705561346354e-05, + "loss": 1.453, + "step": 28020 + }, + { + "epoch": 2.2, + "learning_rate": 4.906956198121856e-05, + "loss": 1.4619, + "step": 28021 + }, + { + "epoch": 2.2, + "learning_rate": 4.906041908635269e-05, + "loss": 1.4329, + "step": 28022 + }, + { + "epoch": 2.2, + "learning_rate": 4.905127687681092e-05, + "loss": 1.4675, + "step": 28023 + }, + { + "epoch": 2.2, + "learning_rate": 4.904213535265527e-05, + "loss": 1.5015, + "step": 28024 + }, + { + "epoch": 2.21, + "learning_rate": 4.9032994513947764e-05, + "loss": 1.4516, + "step": 28025 + }, + { + "epoch": 2.21, + "learning_rate": 4.902385436075056e-05, + "loss": 1.472, + "step": 28026 + }, + { + "epoch": 2.21, + "learning_rate": 4.901471489312565e-05, + "loss": 1.4907, + "step": 28027 + }, + { + "epoch": 2.21, + "learning_rate": 4.900557611113506e-05, + "loss": 1.4626, + "step": 28028 + }, + { + "epoch": 2.21, + "learning_rate": 4.899643801484091e-05, + "loss": 1.4465, + "step": 28029 + }, + { + "epoch": 2.21, + "learning_rate": 4.898730060430517e-05, + "loss": 1.4587, + "step": 28030 + }, + { + "epoch": 2.21, + "learning_rate": 4.897816387958995e-05, + "loss": 1.4285, + "step": 28031 + }, + { + "epoch": 2.21, + "learning_rate": 4.8969027840757225e-05, + "loss": 1.4247, + "step": 28032 + }, + { + "epoch": 2.21, + "learning_rate": 4.895989248786907e-05, + "loss": 1.4778, + "step": 28033 + }, + { + "epoch": 2.21, + "learning_rate": 4.89507578209875e-05, + "loss": 1.4282, + "step": 28034 + }, + { + "epoch": 2.21, + "learning_rate": 4.8941623840174476e-05, + "loss": 1.4524, + "step": 28035 + }, + { + "epoch": 2.21, + "learning_rate": 4.893249054549209e-05, + "loss": 1.4589, + "step": 28036 + }, + { + "epoch": 2.21, + "learning_rate": 4.892335793700233e-05, + "loss": 1.4198, + "step": 28037 + }, + { + "epoch": 2.21, + "learning_rate": 4.89142260147672e-05, + "loss": 1.5035, + "step": 28038 + }, + { + "epoch": 2.21, + "learning_rate": 4.890509477884862e-05, + "loss": 1.47, + "step": 28039 + }, + { + "epoch": 2.21, + "learning_rate": 4.8895964229308735e-05, + "loss": 1.4139, + "step": 28040 + }, + { + "epoch": 2.21, + "learning_rate": 4.888683436620944e-05, + "loss": 1.4564, + "step": 28041 + }, + { + "epoch": 2.21, + "learning_rate": 4.887770518961269e-05, + "loss": 1.4377, + "step": 28042 + }, + { + "epoch": 2.21, + "learning_rate": 4.886857669958057e-05, + "loss": 1.4134, + "step": 28043 + }, + { + "epoch": 2.21, + "learning_rate": 4.885944889617502e-05, + "loss": 1.4132, + "step": 28044 + }, + { + "epoch": 2.21, + "learning_rate": 4.8850321779457925e-05, + "loss": 1.4254, + "step": 28045 + }, + { + "epoch": 2.21, + "learning_rate": 4.884119534949135e-05, + "loss": 1.4565, + "step": 28046 + }, + { + "epoch": 2.21, + "learning_rate": 4.883206960633727e-05, + "loss": 1.4466, + "step": 28047 + }, + { + "epoch": 2.21, + "learning_rate": 4.8822944550057616e-05, + "loss": 1.4788, + "step": 28048 + }, + { + "epoch": 2.21, + "learning_rate": 4.881382018071426e-05, + "loss": 1.4722, + "step": 28049 + }, + { + "epoch": 2.21, + "learning_rate": 4.88046964983693e-05, + "loss": 1.4285, + "step": 28050 + }, + { + "epoch": 2.21, + "learning_rate": 4.8795573503084604e-05, + "loss": 1.4704, + "step": 28051 + }, + { + "epoch": 2.21, + "learning_rate": 4.8786451194922065e-05, + "loss": 1.4401, + "step": 28052 + }, + { + "epoch": 2.21, + "learning_rate": 4.877732957394372e-05, + "loss": 1.4305, + "step": 28053 + }, + { + "epoch": 2.21, + "learning_rate": 4.876820864021143e-05, + "loss": 1.4731, + "step": 28054 + }, + { + "epoch": 2.21, + "learning_rate": 4.8759088393787155e-05, + "loss": 1.439, + "step": 28055 + }, + { + "epoch": 2.21, + "learning_rate": 4.874996883473275e-05, + "loss": 1.4705, + "step": 28056 + }, + { + "epoch": 2.21, + "learning_rate": 4.8740849963110234e-05, + "loss": 1.4623, + "step": 28057 + }, + { + "epoch": 2.21, + "learning_rate": 4.873173177898146e-05, + "loss": 1.4883, + "step": 28058 + }, + { + "epoch": 2.21, + "learning_rate": 4.87226142824083e-05, + "loss": 1.4432, + "step": 28059 + }, + { + "epoch": 2.21, + "learning_rate": 4.8713497473452744e-05, + "loss": 1.4416, + "step": 28060 + }, + { + "epoch": 2.21, + "learning_rate": 4.870438135217659e-05, + "loss": 1.427, + "step": 28061 + }, + { + "epoch": 2.21, + "learning_rate": 4.869526591864185e-05, + "loss": 1.4412, + "step": 28062 + }, + { + "epoch": 2.21, + "learning_rate": 4.868615117291029e-05, + "loss": 1.459, + "step": 28063 + }, + { + "epoch": 2.21, + "learning_rate": 4.8677037115043916e-05, + "loss": 1.4599, + "step": 28064 + }, + { + "epoch": 2.21, + "learning_rate": 4.866792374510452e-05, + "loss": 1.475, + "step": 28065 + }, + { + "epoch": 2.21, + "learning_rate": 4.8658811063153976e-05, + "loss": 1.4477, + "step": 28066 + }, + { + "epoch": 2.21, + "learning_rate": 4.864969906925423e-05, + "loss": 1.4513, + "step": 28067 + }, + { + "epoch": 2.21, + "learning_rate": 4.864058776346708e-05, + "loss": 1.4903, + "step": 28068 + }, + { + "epoch": 2.21, + "learning_rate": 4.863147714585437e-05, + "loss": 1.5022, + "step": 28069 + }, + { + "epoch": 2.21, + "learning_rate": 4.862236721647804e-05, + "loss": 1.4449, + "step": 28070 + }, + { + "epoch": 2.21, + "learning_rate": 4.861325797539988e-05, + "loss": 1.4877, + "step": 28071 + }, + { + "epoch": 2.21, + "learning_rate": 4.860414942268176e-05, + "loss": 1.4994, + "step": 28072 + }, + { + "epoch": 2.21, + "learning_rate": 4.8595041558385454e-05, + "loss": 1.4703, + "step": 28073 + }, + { + "epoch": 2.21, + "learning_rate": 4.8585934382572905e-05, + "loss": 1.5322, + "step": 28074 + }, + { + "epoch": 2.21, + "learning_rate": 4.857682789530591e-05, + "loss": 1.4338, + "step": 28075 + }, + { + "epoch": 2.21, + "learning_rate": 4.8567722096646215e-05, + "loss": 1.4745, + "step": 28076 + }, + { + "epoch": 2.21, + "learning_rate": 4.855861698665573e-05, + "loss": 1.4234, + "step": 28077 + }, + { + "epoch": 2.21, + "learning_rate": 4.85495125653963e-05, + "loss": 1.4131, + "step": 28078 + }, + { + "epoch": 2.21, + "learning_rate": 4.854040883292969e-05, + "loss": 1.4713, + "step": 28079 + }, + { + "epoch": 2.21, + "learning_rate": 4.8531305789317655e-05, + "loss": 1.4615, + "step": 28080 + }, + { + "epoch": 2.21, + "learning_rate": 4.852220343462213e-05, + "loss": 1.4626, + "step": 28081 + }, + { + "epoch": 2.21, + "learning_rate": 4.851310176890482e-05, + "loss": 1.4903, + "step": 28082 + }, + { + "epoch": 2.21, + "learning_rate": 4.850400079222751e-05, + "loss": 1.4207, + "step": 28083 + }, + { + "epoch": 2.21, + "learning_rate": 4.8494900504652075e-05, + "loss": 1.4972, + "step": 28084 + }, + { + "epoch": 2.21, + "learning_rate": 4.848580090624025e-05, + "loss": 1.4636, + "step": 28085 + }, + { + "epoch": 2.21, + "learning_rate": 4.8476701997053764e-05, + "loss": 1.4347, + "step": 28086 + }, + { + "epoch": 2.21, + "learning_rate": 4.846760377715449e-05, + "loss": 1.449, + "step": 28087 + }, + { + "epoch": 2.21, + "learning_rate": 4.845850624660416e-05, + "loss": 1.4396, + "step": 28088 + }, + { + "epoch": 2.21, + "learning_rate": 4.8449409405464476e-05, + "loss": 1.4563, + "step": 28089 + }, + { + "epoch": 2.21, + "learning_rate": 4.844031325379734e-05, + "loss": 1.4345, + "step": 28090 + }, + { + "epoch": 2.21, + "learning_rate": 4.8431217791664414e-05, + "loss": 1.4713, + "step": 28091 + }, + { + "epoch": 2.21, + "learning_rate": 4.8422123019127476e-05, + "loss": 1.458, + "step": 28092 + }, + { + "epoch": 2.21, + "learning_rate": 4.841302893624816e-05, + "loss": 1.3999, + "step": 28093 + }, + { + "epoch": 2.21, + "learning_rate": 4.840393554308841e-05, + "loss": 1.471, + "step": 28094 + }, + { + "epoch": 2.21, + "learning_rate": 4.839484283970988e-05, + "loss": 1.459, + "step": 28095 + }, + { + "epoch": 2.21, + "learning_rate": 4.83857508261743e-05, + "loss": 1.4403, + "step": 28096 + }, + { + "epoch": 2.21, + "learning_rate": 4.837665950254335e-05, + "loss": 1.4374, + "step": 28097 + }, + { + "epoch": 2.21, + "learning_rate": 4.836756886887885e-05, + "loss": 1.5062, + "step": 28098 + }, + { + "epoch": 2.21, + "learning_rate": 4.835847892524247e-05, + "loss": 1.5252, + "step": 28099 + }, + { + "epoch": 2.21, + "learning_rate": 4.834938967169587e-05, + "loss": 1.4594, + "step": 28100 + }, + { + "epoch": 2.21, + "learning_rate": 4.834030110830088e-05, + "loss": 1.4875, + "step": 28101 + }, + { + "epoch": 2.21, + "learning_rate": 4.833121323511914e-05, + "loss": 1.4216, + "step": 28102 + }, + { + "epoch": 2.21, + "learning_rate": 4.8322126052212304e-05, + "loss": 1.4079, + "step": 28103 + }, + { + "epoch": 2.21, + "learning_rate": 4.8313039559642166e-05, + "loss": 1.4874, + "step": 28104 + }, + { + "epoch": 2.21, + "learning_rate": 4.8303953757470396e-05, + "loss": 1.4428, + "step": 28105 + }, + { + "epoch": 2.21, + "learning_rate": 4.829486864575859e-05, + "loss": 1.5167, + "step": 28106 + }, + { + "epoch": 2.21, + "learning_rate": 4.828578422456856e-05, + "loss": 1.4307, + "step": 28107 + }, + { + "epoch": 2.21, + "learning_rate": 4.827670049396192e-05, + "loss": 1.4553, + "step": 28108 + }, + { + "epoch": 2.21, + "learning_rate": 4.82676174540003e-05, + "loss": 1.4967, + "step": 28109 + }, + { + "epoch": 2.21, + "learning_rate": 4.825853510474541e-05, + "loss": 1.4575, + "step": 28110 + }, + { + "epoch": 2.21, + "learning_rate": 4.824945344625898e-05, + "loss": 1.4381, + "step": 28111 + }, + { + "epoch": 2.21, + "learning_rate": 4.824037247860261e-05, + "loss": 1.4504, + "step": 28112 + }, + { + "epoch": 2.21, + "learning_rate": 4.823129220183795e-05, + "loss": 1.4499, + "step": 28113 + }, + { + "epoch": 2.21, + "learning_rate": 4.822221261602661e-05, + "loss": 1.4823, + "step": 28114 + }, + { + "epoch": 2.21, + "learning_rate": 4.8213133721230324e-05, + "loss": 1.3937, + "step": 28115 + }, + { + "epoch": 2.21, + "learning_rate": 4.8204055517510695e-05, + "loss": 1.4539, + "step": 28116 + }, + { + "epoch": 2.21, + "learning_rate": 4.81949780049293e-05, + "loss": 1.4807, + "step": 28117 + }, + { + "epoch": 2.21, + "learning_rate": 4.8185901183547884e-05, + "loss": 1.4447, + "step": 28118 + }, + { + "epoch": 2.21, + "learning_rate": 4.8176825053428003e-05, + "loss": 1.4403, + "step": 28119 + }, + { + "epoch": 2.21, + "learning_rate": 4.8167749614631234e-05, + "loss": 1.4744, + "step": 28120 + }, + { + "epoch": 2.21, + "learning_rate": 4.8158674867219314e-05, + "loss": 1.4279, + "step": 28121 + }, + { + "epoch": 2.21, + "learning_rate": 4.814960081125378e-05, + "loss": 1.4417, + "step": 28122 + }, + { + "epoch": 2.21, + "learning_rate": 4.814052744679621e-05, + "loss": 1.4512, + "step": 28123 + }, + { + "epoch": 2.21, + "learning_rate": 4.8131454773908246e-05, + "loss": 1.4625, + "step": 28124 + }, + { + "epoch": 2.21, + "learning_rate": 4.812238279265153e-05, + "loss": 1.4908, + "step": 28125 + }, + { + "epoch": 2.21, + "learning_rate": 4.811331150308762e-05, + "loss": 1.4366, + "step": 28126 + }, + { + "epoch": 2.21, + "learning_rate": 4.8104240905278045e-05, + "loss": 1.4236, + "step": 28127 + }, + { + "epoch": 2.21, + "learning_rate": 4.8095170999284495e-05, + "loss": 1.4085, + "step": 28128 + }, + { + "epoch": 2.21, + "learning_rate": 4.808610178516851e-05, + "loss": 1.4572, + "step": 28129 + }, + { + "epoch": 2.21, + "learning_rate": 4.807703326299164e-05, + "loss": 1.4642, + "step": 28130 + }, + { + "epoch": 2.21, + "learning_rate": 4.806796543281542e-05, + "loss": 1.3985, + "step": 28131 + }, + { + "epoch": 2.21, + "learning_rate": 4.805889829470151e-05, + "loss": 1.4802, + "step": 28132 + }, + { + "epoch": 2.21, + "learning_rate": 4.804983184871144e-05, + "loss": 1.4869, + "step": 28133 + }, + { + "epoch": 2.21, + "learning_rate": 4.804076609490668e-05, + "loss": 1.5123, + "step": 28134 + }, + { + "epoch": 2.21, + "learning_rate": 4.803170103334891e-05, + "loss": 1.4677, + "step": 28135 + }, + { + "epoch": 2.21, + "learning_rate": 4.8022636664099636e-05, + "loss": 1.4601, + "step": 28136 + }, + { + "epoch": 2.21, + "learning_rate": 4.801357298722031e-05, + "loss": 1.4122, + "step": 28137 + }, + { + "epoch": 2.21, + "learning_rate": 4.800451000277261e-05, + "loss": 1.472, + "step": 28138 + }, + { + "epoch": 2.21, + "learning_rate": 4.7995447710817994e-05, + "loss": 1.5081, + "step": 28139 + }, + { + "epoch": 2.21, + "learning_rate": 4.798638611141795e-05, + "loss": 1.3878, + "step": 28140 + }, + { + "epoch": 2.21, + "learning_rate": 4.797732520463404e-05, + "loss": 1.4752, + "step": 28141 + }, + { + "epoch": 2.21, + "learning_rate": 4.796826499052785e-05, + "loss": 1.486, + "step": 28142 + }, + { + "epoch": 2.21, + "learning_rate": 4.7959205469160836e-05, + "loss": 1.4218, + "step": 28143 + }, + { + "epoch": 2.21, + "learning_rate": 4.795014664059444e-05, + "loss": 1.4388, + "step": 28144 + }, + { + "epoch": 2.21, + "learning_rate": 4.79410885048903e-05, + "loss": 1.4829, + "step": 28145 + }, + { + "epoch": 2.21, + "learning_rate": 4.793203106210984e-05, + "loss": 1.472, + "step": 28146 + }, + { + "epoch": 2.21, + "learning_rate": 4.792297431231452e-05, + "loss": 1.4028, + "step": 28147 + }, + { + "epoch": 2.21, + "learning_rate": 4.791391825556592e-05, + "loss": 1.4391, + "step": 28148 + }, + { + "epoch": 2.21, + "learning_rate": 4.790486289192549e-05, + "loss": 1.4302, + "step": 28149 + }, + { + "epoch": 2.21, + "learning_rate": 4.789580822145468e-05, + "loss": 1.4044, + "step": 28150 + }, + { + "epoch": 2.21, + "learning_rate": 4.788675424421496e-05, + "loss": 1.4639, + "step": 28151 + }, + { + "epoch": 2.22, + "learning_rate": 4.787770096026786e-05, + "loss": 1.4737, + "step": 28152 + }, + { + "epoch": 2.22, + "learning_rate": 4.7868648369674806e-05, + "loss": 1.478, + "step": 28153 + }, + { + "epoch": 2.22, + "learning_rate": 4.785959647249724e-05, + "loss": 1.5162, + "step": 28154 + }, + { + "epoch": 2.22, + "learning_rate": 4.7850545268796685e-05, + "loss": 1.4496, + "step": 28155 + }, + { + "epoch": 2.22, + "learning_rate": 4.7841494758634525e-05, + "loss": 1.4787, + "step": 28156 + }, + { + "epoch": 2.22, + "learning_rate": 4.783244494207227e-05, + "loss": 1.4657, + "step": 28157 + }, + { + "epoch": 2.22, + "learning_rate": 4.782339581917128e-05, + "loss": 1.4623, + "step": 28158 + }, + { + "epoch": 2.22, + "learning_rate": 4.781434738999311e-05, + "loss": 1.4421, + "step": 28159 + }, + { + "epoch": 2.22, + "learning_rate": 4.780529965459913e-05, + "loss": 1.4427, + "step": 28160 + }, + { + "epoch": 2.22, + "learning_rate": 4.779625261305071e-05, + "loss": 1.417, + "step": 28161 + }, + { + "epoch": 2.22, + "learning_rate": 4.77872062654094e-05, + "loss": 1.4254, + "step": 28162 + }, + { + "epoch": 2.22, + "learning_rate": 4.7778160611736546e-05, + "loss": 1.458, + "step": 28163 + }, + { + "epoch": 2.22, + "learning_rate": 4.776911565209351e-05, + "loss": 1.4348, + "step": 28164 + }, + { + "epoch": 2.22, + "learning_rate": 4.776007138654182e-05, + "loss": 1.4733, + "step": 28165 + }, + { + "epoch": 2.22, + "learning_rate": 4.7751027815142826e-05, + "loss": 1.4758, + "step": 28166 + }, + { + "epoch": 2.22, + "learning_rate": 4.774198493795793e-05, + "loss": 1.4679, + "step": 28167 + }, + { + "epoch": 2.22, + "learning_rate": 4.7732942755048476e-05, + "loss": 1.4292, + "step": 28168 + }, + { + "epoch": 2.22, + "learning_rate": 4.772390126647596e-05, + "loss": 1.4575, + "step": 28169 + }, + { + "epoch": 2.22, + "learning_rate": 4.7714860472301706e-05, + "loss": 1.4406, + "step": 28170 + }, + { + "epoch": 2.22, + "learning_rate": 4.7705820372587054e-05, + "loss": 1.4618, + "step": 28171 + }, + { + "epoch": 2.22, + "learning_rate": 4.7696780967393435e-05, + "loss": 1.4435, + "step": 28172 + }, + { + "epoch": 2.22, + "learning_rate": 4.7687742256782255e-05, + "loss": 1.4592, + "step": 28173 + }, + { + "epoch": 2.22, + "learning_rate": 4.767870424081486e-05, + "loss": 1.4858, + "step": 28174 + }, + { + "epoch": 2.22, + "learning_rate": 4.7669666919552536e-05, + "loss": 1.4763, + "step": 28175 + }, + { + "epoch": 2.22, + "learning_rate": 4.7660630293056755e-05, + "loss": 1.4314, + "step": 28176 + }, + { + "epoch": 2.22, + "learning_rate": 4.765159436138882e-05, + "loss": 1.4703, + "step": 28177 + }, + { + "epoch": 2.22, + "learning_rate": 4.764255912461004e-05, + "loss": 1.4412, + "step": 28178 + }, + { + "epoch": 2.22, + "learning_rate": 4.7633524582781845e-05, + "loss": 1.4124, + "step": 28179 + }, + { + "epoch": 2.22, + "learning_rate": 4.762449073596552e-05, + "loss": 1.4718, + "step": 28180 + }, + { + "epoch": 2.22, + "learning_rate": 4.761545758422236e-05, + "loss": 1.4103, + "step": 28181 + }, + { + "epoch": 2.22, + "learning_rate": 4.760642512761378e-05, + "loss": 1.5032, + "step": 28182 + }, + { + "epoch": 2.22, + "learning_rate": 4.7597393366201095e-05, + "loss": 1.4771, + "step": 28183 + }, + { + "epoch": 2.22, + "learning_rate": 4.758836230004557e-05, + "loss": 1.4684, + "step": 28184 + }, + { + "epoch": 2.22, + "learning_rate": 4.757933192920851e-05, + "loss": 1.4223, + "step": 28185 + }, + { + "epoch": 2.22, + "learning_rate": 4.757030225375133e-05, + "loss": 1.4694, + "step": 28186 + }, + { + "epoch": 2.22, + "learning_rate": 4.75612732737352e-05, + "loss": 1.4579, + "step": 28187 + }, + { + "epoch": 2.22, + "learning_rate": 4.755224498922151e-05, + "loss": 1.4281, + "step": 28188 + }, + { + "epoch": 2.22, + "learning_rate": 4.7543217400271595e-05, + "loss": 1.4439, + "step": 28189 + }, + { + "epoch": 2.22, + "learning_rate": 4.753419050694669e-05, + "loss": 1.4374, + "step": 28190 + }, + { + "epoch": 2.22, + "learning_rate": 4.7525164309308065e-05, + "loss": 1.4814, + "step": 28191 + }, + { + "epoch": 2.22, + "learning_rate": 4.7516138807416994e-05, + "loss": 1.4291, + "step": 28192 + }, + { + "epoch": 2.22, + "learning_rate": 4.7507114001334825e-05, + "loss": 1.4364, + "step": 28193 + }, + { + "epoch": 2.22, + "learning_rate": 4.749808989112281e-05, + "loss": 1.4392, + "step": 28194 + }, + { + "epoch": 2.22, + "learning_rate": 4.748906647684214e-05, + "loss": 1.4071, + "step": 28195 + }, + { + "epoch": 2.22, + "learning_rate": 4.748004375855417e-05, + "loss": 1.4755, + "step": 28196 + }, + { + "epoch": 2.22, + "learning_rate": 4.747102173632015e-05, + "loss": 1.4271, + "step": 28197 + }, + { + "epoch": 2.22, + "learning_rate": 4.746200041020125e-05, + "loss": 1.4094, + "step": 28198 + }, + { + "epoch": 2.22, + "learning_rate": 4.7452979780258837e-05, + "loss": 1.4892, + "step": 28199 + }, + { + "epoch": 2.22, + "learning_rate": 4.7443959846554106e-05, + "loss": 1.4553, + "step": 28200 + }, + { + "epoch": 2.22, + "learning_rate": 4.743494060914823e-05, + "loss": 1.4356, + "step": 28201 + }, + { + "epoch": 2.22, + "learning_rate": 4.742592206810257e-05, + "loss": 1.4639, + "step": 28202 + }, + { + "epoch": 2.22, + "learning_rate": 4.741690422347825e-05, + "loss": 1.4185, + "step": 28203 + }, + { + "epoch": 2.22, + "learning_rate": 4.740788707533657e-05, + "loss": 1.4367, + "step": 28204 + }, + { + "epoch": 2.22, + "learning_rate": 4.739887062373869e-05, + "loss": 1.4269, + "step": 28205 + }, + { + "epoch": 2.22, + "learning_rate": 4.738985486874589e-05, + "loss": 1.4804, + "step": 28206 + }, + { + "epoch": 2.22, + "learning_rate": 4.7380839810419364e-05, + "loss": 1.41, + "step": 28207 + }, + { + "epoch": 2.22, + "learning_rate": 4.737182544882031e-05, + "loss": 1.4949, + "step": 28208 + }, + { + "epoch": 2.22, + "learning_rate": 4.736281178400987e-05, + "loss": 1.4799, + "step": 28209 + }, + { + "epoch": 2.22, + "learning_rate": 4.735379881604934e-05, + "loss": 1.4951, + "step": 28210 + }, + { + "epoch": 2.22, + "learning_rate": 4.7344786544999887e-05, + "loss": 1.4699, + "step": 28211 + }, + { + "epoch": 2.22, + "learning_rate": 4.733577497092261e-05, + "loss": 1.4533, + "step": 28212 + }, + { + "epoch": 2.22, + "learning_rate": 4.732676409387884e-05, + "loss": 1.4946, + "step": 28213 + }, + { + "epoch": 2.22, + "learning_rate": 4.7317753913929666e-05, + "loss": 1.4598, + "step": 28214 + }, + { + "epoch": 2.22, + "learning_rate": 4.7308744431136237e-05, + "loss": 1.4549, + "step": 28215 + }, + { + "epoch": 2.22, + "learning_rate": 4.729973564555981e-05, + "loss": 1.4559, + "step": 28216 + }, + { + "epoch": 2.22, + "learning_rate": 4.7290727557261504e-05, + "loss": 1.4482, + "step": 28217 + }, + { + "epoch": 2.22, + "learning_rate": 4.728172016630244e-05, + "loss": 1.432, + "step": 28218 + }, + { + "epoch": 2.22, + "learning_rate": 4.727271347274379e-05, + "loss": 1.4569, + "step": 28219 + }, + { + "epoch": 2.22, + "learning_rate": 4.726370747664679e-05, + "loss": 1.4333, + "step": 28220 + }, + { + "epoch": 2.22, + "learning_rate": 4.7254702178072515e-05, + "loss": 1.4125, + "step": 28221 + }, + { + "epoch": 2.22, + "learning_rate": 4.724569757708207e-05, + "loss": 1.4014, + "step": 28222 + }, + { + "epoch": 2.22, + "learning_rate": 4.723669367373668e-05, + "loss": 1.449, + "step": 28223 + }, + { + "epoch": 2.22, + "learning_rate": 4.722769046809742e-05, + "loss": 1.4677, + "step": 28224 + }, + { + "epoch": 2.22, + "learning_rate": 4.721868796022545e-05, + "loss": 1.4633, + "step": 28225 + }, + { + "epoch": 2.22, + "learning_rate": 4.720968615018179e-05, + "loss": 1.4879, + "step": 28226 + }, + { + "epoch": 2.22, + "learning_rate": 4.7200685038027716e-05, + "loss": 1.4206, + "step": 28227 + }, + { + "epoch": 2.22, + "learning_rate": 4.719168462382425e-05, + "loss": 1.431, + "step": 28228 + }, + { + "epoch": 2.22, + "learning_rate": 4.718268490763245e-05, + "loss": 1.4964, + "step": 28229 + }, + { + "epoch": 2.22, + "learning_rate": 4.717368588951355e-05, + "loss": 1.3807, + "step": 28230 + }, + { + "epoch": 2.22, + "learning_rate": 4.716468756952857e-05, + "loss": 1.4299, + "step": 28231 + }, + { + "epoch": 2.22, + "learning_rate": 4.7155689947738554e-05, + "loss": 1.4689, + "step": 28232 + }, + { + "epoch": 2.22, + "learning_rate": 4.714669302420469e-05, + "loss": 1.5141, + "step": 28233 + }, + { + "epoch": 2.22, + "learning_rate": 4.713769679898801e-05, + "loss": 1.4765, + "step": 28234 + }, + { + "epoch": 2.22, + "learning_rate": 4.7128701272149624e-05, + "loss": 1.4767, + "step": 28235 + }, + { + "epoch": 2.22, + "learning_rate": 4.7119706443750544e-05, + "loss": 1.4782, + "step": 28236 + }, + { + "epoch": 2.22, + "learning_rate": 4.711071231385194e-05, + "loss": 1.4379, + "step": 28237 + }, + { + "epoch": 2.22, + "learning_rate": 4.710171888251481e-05, + "loss": 1.4801, + "step": 28238 + }, + { + "epoch": 2.22, + "learning_rate": 4.709272614980018e-05, + "loss": 1.4589, + "step": 28239 + }, + { + "epoch": 2.22, + "learning_rate": 4.70837341157692e-05, + "loss": 1.441, + "step": 28240 + }, + { + "epoch": 2.22, + "learning_rate": 4.707474278048287e-05, + "loss": 1.4694, + "step": 28241 + }, + { + "epoch": 2.22, + "learning_rate": 4.7065752144002236e-05, + "loss": 1.4902, + "step": 28242 + }, + { + "epoch": 2.22, + "learning_rate": 4.705676220638829e-05, + "loss": 1.4383, + "step": 28243 + }, + { + "epoch": 2.22, + "learning_rate": 4.7047772967702186e-05, + "loss": 1.4334, + "step": 28244 + }, + { + "epoch": 2.22, + "learning_rate": 4.7038784428004865e-05, + "loss": 1.4177, + "step": 28245 + }, + { + "epoch": 2.22, + "learning_rate": 4.702979658735735e-05, + "loss": 1.4819, + "step": 28246 + }, + { + "epoch": 2.22, + "learning_rate": 4.7020809445820735e-05, + "loss": 1.4113, + "step": 28247 + }, + { + "epoch": 2.22, + "learning_rate": 4.701182300345599e-05, + "loss": 1.4572, + "step": 28248 + }, + { + "epoch": 2.22, + "learning_rate": 4.700283726032408e-05, + "loss": 1.4888, + "step": 28249 + }, + { + "epoch": 2.22, + "learning_rate": 4.699385221648608e-05, + "loss": 1.4686, + "step": 28250 + }, + { + "epoch": 2.22, + "learning_rate": 4.6984867872003026e-05, + "loss": 1.4863, + "step": 28251 + }, + { + "epoch": 2.22, + "learning_rate": 4.697588422693587e-05, + "loss": 1.468, + "step": 28252 + }, + { + "epoch": 2.22, + "learning_rate": 4.6966901281345546e-05, + "loss": 1.4052, + "step": 28253 + }, + { + "epoch": 2.22, + "learning_rate": 4.695791903529317e-05, + "loss": 1.4812, + "step": 28254 + }, + { + "epoch": 2.22, + "learning_rate": 4.694893748883965e-05, + "loss": 1.4609, + "step": 28255 + }, + { + "epoch": 2.22, + "learning_rate": 4.6939956642045927e-05, + "loss": 1.4462, + "step": 28256 + }, + { + "epoch": 2.22, + "learning_rate": 4.693097649497309e-05, + "loss": 1.4539, + "step": 28257 + }, + { + "epoch": 2.22, + "learning_rate": 4.692199704768203e-05, + "loss": 1.4686, + "step": 28258 + }, + { + "epoch": 2.22, + "learning_rate": 4.691301830023367e-05, + "loss": 1.4878, + "step": 28259 + }, + { + "epoch": 2.22, + "learning_rate": 4.6904040252689105e-05, + "loss": 1.4441, + "step": 28260 + }, + { + "epoch": 2.22, + "learning_rate": 4.689506290510918e-05, + "loss": 1.5174, + "step": 28261 + }, + { + "epoch": 2.22, + "learning_rate": 4.68860862575549e-05, + "loss": 1.455, + "step": 28262 + }, + { + "epoch": 2.22, + "learning_rate": 4.687711031008714e-05, + "loss": 1.4162, + "step": 28263 + }, + { + "epoch": 2.22, + "learning_rate": 4.686813506276694e-05, + "loss": 1.5034, + "step": 28264 + }, + { + "epoch": 2.22, + "learning_rate": 4.685916051565519e-05, + "loss": 1.4631, + "step": 28265 + }, + { + "epoch": 2.22, + "learning_rate": 4.685018666881277e-05, + "loss": 1.4475, + "step": 28266 + }, + { + "epoch": 2.22, + "learning_rate": 4.6841213522300665e-05, + "loss": 1.4708, + "step": 28267 + }, + { + "epoch": 2.22, + "learning_rate": 4.683224107617983e-05, + "loss": 1.4307, + "step": 28268 + }, + { + "epoch": 2.22, + "learning_rate": 4.682326933051116e-05, + "loss": 1.4597, + "step": 28269 + }, + { + "epoch": 2.22, + "learning_rate": 4.68142982853555e-05, + "loss": 1.4647, + "step": 28270 + }, + { + "epoch": 2.22, + "learning_rate": 4.680532794077386e-05, + "loss": 1.4595, + "step": 28271 + }, + { + "epoch": 2.22, + "learning_rate": 4.67963582968271e-05, + "loss": 1.4496, + "step": 28272 + }, + { + "epoch": 2.22, + "learning_rate": 4.678738935357605e-05, + "loss": 1.4665, + "step": 28273 + }, + { + "epoch": 2.22, + "learning_rate": 4.6778421111081734e-05, + "loss": 1.4632, + "step": 28274 + }, + { + "epoch": 2.22, + "learning_rate": 4.676945356940497e-05, + "loss": 1.4272, + "step": 28275 + }, + { + "epoch": 2.22, + "learning_rate": 4.676048672860661e-05, + "loss": 1.476, + "step": 28276 + }, + { + "epoch": 2.22, + "learning_rate": 4.675152058874761e-05, + "loss": 1.4271, + "step": 28277 + }, + { + "epoch": 2.22, + "learning_rate": 4.6742555149888815e-05, + "loss": 1.4552, + "step": 28278 + }, + { + "epoch": 2.23, + "learning_rate": 4.6733590412091085e-05, + "loss": 1.4878, + "step": 28279 + }, + { + "epoch": 2.23, + "learning_rate": 4.672462637541524e-05, + "loss": 1.4773, + "step": 28280 + }, + { + "epoch": 2.23, + "learning_rate": 4.671566303992218e-05, + "loss": 1.4462, + "step": 28281 + }, + { + "epoch": 2.23, + "learning_rate": 4.670670040567283e-05, + "loss": 1.4342, + "step": 28282 + }, + { + "epoch": 2.23, + "learning_rate": 4.669773847272798e-05, + "loss": 1.4536, + "step": 28283 + }, + { + "epoch": 2.23, + "learning_rate": 4.668877724114845e-05, + "loss": 1.4631, + "step": 28284 + }, + { + "epoch": 2.23, + "learning_rate": 4.667981671099513e-05, + "loss": 1.46, + "step": 28285 + }, + { + "epoch": 2.23, + "learning_rate": 4.6670856882328844e-05, + "loss": 1.5063, + "step": 28286 + }, + { + "epoch": 2.23, + "learning_rate": 4.666189775521038e-05, + "loss": 1.47, + "step": 28287 + }, + { + "epoch": 2.23, + "learning_rate": 4.665293932970064e-05, + "loss": 1.486, + "step": 28288 + }, + { + "epoch": 2.23, + "learning_rate": 4.664398160586042e-05, + "loss": 1.4992, + "step": 28289 + }, + { + "epoch": 2.23, + "learning_rate": 4.663502458375047e-05, + "loss": 1.4631, + "step": 28290 + }, + { + "epoch": 2.23, + "learning_rate": 4.662606826343172e-05, + "loss": 1.4022, + "step": 28291 + }, + { + "epoch": 2.23, + "learning_rate": 4.661711264496493e-05, + "loss": 1.4407, + "step": 28292 + }, + { + "epoch": 2.23, + "learning_rate": 4.660815772841083e-05, + "loss": 1.4629, + "step": 28293 + }, + { + "epoch": 2.23, + "learning_rate": 4.6599203513830326e-05, + "loss": 1.49, + "step": 28294 + }, + { + "epoch": 2.23, + "learning_rate": 4.659025000128419e-05, + "loss": 1.4136, + "step": 28295 + }, + { + "epoch": 2.23, + "learning_rate": 4.658129719083316e-05, + "loss": 1.3973, + "step": 28296 + }, + { + "epoch": 2.23, + "learning_rate": 4.657234508253797e-05, + "loss": 1.379, + "step": 28297 + }, + { + "epoch": 2.23, + "learning_rate": 4.656339367645958e-05, + "loss": 1.4862, + "step": 28298 + }, + { + "epoch": 2.23, + "learning_rate": 4.6554442972658664e-05, + "loss": 1.4878, + "step": 28299 + }, + { + "epoch": 2.23, + "learning_rate": 4.6545492971195944e-05, + "loss": 1.4845, + "step": 28300 + }, + { + "epoch": 2.23, + "learning_rate": 4.653654367213229e-05, + "loss": 1.458, + "step": 28301 + }, + { + "epoch": 2.23, + "learning_rate": 4.65275950755284e-05, + "loss": 1.43, + "step": 28302 + }, + { + "epoch": 2.23, + "learning_rate": 4.6518647181445056e-05, + "loss": 1.4786, + "step": 28303 + }, + { + "epoch": 2.23, + "learning_rate": 4.650969998994292e-05, + "loss": 1.4723, + "step": 28304 + }, + { + "epoch": 2.23, + "learning_rate": 4.6500753501082884e-05, + "loss": 1.4525, + "step": 28305 + }, + { + "epoch": 2.23, + "learning_rate": 4.649180771492559e-05, + "loss": 1.4663, + "step": 28306 + }, + { + "epoch": 2.23, + "learning_rate": 4.648286263153178e-05, + "loss": 1.4229, + "step": 28307 + }, + { + "epoch": 2.23, + "learning_rate": 4.647391825096223e-05, + "loss": 1.4322, + "step": 28308 + }, + { + "epoch": 2.23, + "learning_rate": 4.6464974573277644e-05, + "loss": 1.4298, + "step": 28309 + }, + { + "epoch": 2.23, + "learning_rate": 4.645603159853872e-05, + "loss": 1.3811, + "step": 28310 + }, + { + "epoch": 2.23, + "learning_rate": 4.6447089326806244e-05, + "loss": 1.4798, + "step": 28311 + }, + { + "epoch": 2.23, + "learning_rate": 4.643814775814087e-05, + "loss": 1.4636, + "step": 28312 + }, + { + "epoch": 2.23, + "learning_rate": 4.642920689260329e-05, + "loss": 1.4672, + "step": 28313 + }, + { + "epoch": 2.23, + "learning_rate": 4.642026673025423e-05, + "loss": 1.4152, + "step": 28314 + }, + { + "epoch": 2.23, + "learning_rate": 4.6411327271154445e-05, + "loss": 1.4533, + "step": 28315 + }, + { + "epoch": 2.23, + "learning_rate": 4.640238851536459e-05, + "loss": 1.4946, + "step": 28316 + }, + { + "epoch": 2.23, + "learning_rate": 4.63934504629453e-05, + "loss": 1.4672, + "step": 28317 + }, + { + "epoch": 2.23, + "learning_rate": 4.638451311395735e-05, + "loss": 1.4656, + "step": 28318 + }, + { + "epoch": 2.23, + "learning_rate": 4.637557646846138e-05, + "loss": 1.4495, + "step": 28319 + }, + { + "epoch": 2.23, + "learning_rate": 4.6366640526518066e-05, + "loss": 1.4533, + "step": 28320 + }, + { + "epoch": 2.23, + "learning_rate": 4.635770528818802e-05, + "loss": 1.4737, + "step": 28321 + }, + { + "epoch": 2.23, + "learning_rate": 4.6348770753532006e-05, + "loss": 1.4532, + "step": 28322 + }, + { + "epoch": 2.23, + "learning_rate": 4.633983692261063e-05, + "loss": 1.4668, + "step": 28323 + }, + { + "epoch": 2.23, + "learning_rate": 4.633090379548452e-05, + "loss": 1.4581, + "step": 28324 + }, + { + "epoch": 2.23, + "learning_rate": 4.6321971372214414e-05, + "loss": 1.5157, + "step": 28325 + }, + { + "epoch": 2.23, + "learning_rate": 4.6313039652860905e-05, + "loss": 1.4561, + "step": 28326 + }, + { + "epoch": 2.23, + "learning_rate": 4.63041086374846e-05, + "loss": 1.4858, + "step": 28327 + }, + { + "epoch": 2.23, + "learning_rate": 4.629517832614621e-05, + "loss": 1.423, + "step": 28328 + }, + { + "epoch": 2.23, + "learning_rate": 4.6286248718906273e-05, + "loss": 1.4253, + "step": 28329 + }, + { + "epoch": 2.23, + "learning_rate": 4.627731981582553e-05, + "loss": 1.4553, + "step": 28330 + }, + { + "epoch": 2.23, + "learning_rate": 4.626839161696451e-05, + "loss": 1.451, + "step": 28331 + }, + { + "epoch": 2.23, + "learning_rate": 4.62594641223839e-05, + "loss": 1.4713, + "step": 28332 + }, + { + "epoch": 2.23, + "learning_rate": 4.6250537332144294e-05, + "loss": 1.4523, + "step": 28333 + }, + { + "epoch": 2.23, + "learning_rate": 4.624161124630623e-05, + "loss": 1.4012, + "step": 28334 + }, + { + "epoch": 2.23, + "learning_rate": 4.6232685864930416e-05, + "loss": 1.4932, + "step": 28335 + }, + { + "epoch": 2.23, + "learning_rate": 4.6223761188077394e-05, + "loss": 1.4987, + "step": 28336 + }, + { + "epoch": 2.23, + "learning_rate": 4.621483721580776e-05, + "loss": 1.427, + "step": 28337 + }, + { + "epoch": 2.23, + "learning_rate": 4.620591394818207e-05, + "loss": 1.5141, + "step": 28338 + }, + { + "epoch": 2.23, + "learning_rate": 4.6196991385261e-05, + "loss": 1.4289, + "step": 28339 + }, + { + "epoch": 2.23, + "learning_rate": 4.618806952710507e-05, + "loss": 1.4444, + "step": 28340 + }, + { + "epoch": 2.23, + "learning_rate": 4.6179148373774814e-05, + "loss": 1.419, + "step": 28341 + }, + { + "epoch": 2.23, + "learning_rate": 4.6170227925330885e-05, + "loss": 1.4368, + "step": 28342 + }, + { + "epoch": 2.23, + "learning_rate": 4.616130818183382e-05, + "loss": 1.4341, + "step": 28343 + }, + { + "epoch": 2.23, + "learning_rate": 4.615238914334412e-05, + "loss": 1.3862, + "step": 28344 + }, + { + "epoch": 2.23, + "learning_rate": 4.6143470809922395e-05, + "loss": 1.4791, + "step": 28345 + }, + { + "epoch": 2.23, + "learning_rate": 4.613455318162922e-05, + "loss": 1.46, + "step": 28346 + }, + { + "epoch": 2.23, + "learning_rate": 4.612563625852513e-05, + "loss": 1.4532, + "step": 28347 + }, + { + "epoch": 2.23, + "learning_rate": 4.611672004067059e-05, + "loss": 1.4082, + "step": 28348 + }, + { + "epoch": 2.23, + "learning_rate": 4.6107804528126246e-05, + "loss": 1.3987, + "step": 28349 + }, + { + "epoch": 2.23, + "learning_rate": 4.6098889720952584e-05, + "loss": 1.4466, + "step": 28350 + }, + { + "epoch": 2.23, + "learning_rate": 4.608997561921006e-05, + "loss": 1.4863, + "step": 28351 + }, + { + "epoch": 2.23, + "learning_rate": 4.6081062222959324e-05, + "loss": 1.4636, + "step": 28352 + }, + { + "epoch": 2.23, + "learning_rate": 4.607214953226082e-05, + "loss": 1.4973, + "step": 28353 + }, + { + "epoch": 2.23, + "learning_rate": 4.6063237547175055e-05, + "loss": 1.513, + "step": 28354 + }, + { + "epoch": 2.23, + "learning_rate": 4.605432626776252e-05, + "loss": 1.4668, + "step": 28355 + }, + { + "epoch": 2.23, + "learning_rate": 4.6045415694083794e-05, + "loss": 1.4563, + "step": 28356 + }, + { + "epoch": 2.23, + "learning_rate": 4.6036505826199324e-05, + "loss": 1.469, + "step": 28357 + }, + { + "epoch": 2.23, + "learning_rate": 4.602759666416956e-05, + "loss": 1.427, + "step": 28358 + }, + { + "epoch": 2.23, + "learning_rate": 4.601868820805509e-05, + "loss": 1.4696, + "step": 28359 + }, + { + "epoch": 2.23, + "learning_rate": 4.600978045791628e-05, + "loss": 1.4011, + "step": 28360 + }, + { + "epoch": 2.23, + "learning_rate": 4.600087341381373e-05, + "loss": 1.4544, + "step": 28361 + }, + { + "epoch": 2.23, + "learning_rate": 4.5991967075807835e-05, + "loss": 1.4352, + "step": 28362 + }, + { + "epoch": 2.23, + "learning_rate": 4.59830614439591e-05, + "loss": 1.4338, + "step": 28363 + }, + { + "epoch": 2.23, + "learning_rate": 4.5974156518328006e-05, + "loss": 1.4379, + "step": 28364 + }, + { + "epoch": 2.23, + "learning_rate": 4.596525229897491e-05, + "loss": 1.5218, + "step": 28365 + }, + { + "epoch": 2.23, + "learning_rate": 4.59563487859604e-05, + "loss": 1.5033, + "step": 28366 + }, + { + "epoch": 2.23, + "learning_rate": 4.5947445979344863e-05, + "loss": 1.4384, + "step": 28367 + }, + { + "epoch": 2.23, + "learning_rate": 4.593854387918871e-05, + "loss": 1.43, + "step": 28368 + }, + { + "epoch": 2.23, + "learning_rate": 4.592964248555245e-05, + "loss": 1.4761, + "step": 28369 + }, + { + "epoch": 2.23, + "learning_rate": 4.59207417984965e-05, + "loss": 1.4417, + "step": 28370 + }, + { + "epoch": 2.23, + "learning_rate": 4.591184181808122e-05, + "loss": 1.4783, + "step": 28371 + }, + { + "epoch": 2.23, + "learning_rate": 4.5902942544367135e-05, + "loss": 1.4676, + "step": 28372 + }, + { + "epoch": 2.23, + "learning_rate": 4.589404397741464e-05, + "loss": 1.4781, + "step": 28373 + }, + { + "epoch": 2.23, + "learning_rate": 4.588514611728413e-05, + "loss": 1.442, + "step": 28374 + }, + { + "epoch": 2.23, + "learning_rate": 4.5876248964035984e-05, + "loss": 1.4797, + "step": 28375 + }, + { + "epoch": 2.23, + "learning_rate": 4.586735251773063e-05, + "loss": 1.4057, + "step": 28376 + }, + { + "epoch": 2.23, + "learning_rate": 4.5858456778428545e-05, + "loss": 1.4842, + "step": 28377 + }, + { + "epoch": 2.23, + "learning_rate": 4.5849561746190065e-05, + "loss": 1.4569, + "step": 28378 + }, + { + "epoch": 2.23, + "learning_rate": 4.5840667421075534e-05, + "loss": 1.5276, + "step": 28379 + }, + { + "epoch": 2.23, + "learning_rate": 4.583177380314544e-05, + "loss": 1.4282, + "step": 28380 + }, + { + "epoch": 2.23, + "learning_rate": 4.5822880892460134e-05, + "loss": 1.4225, + "step": 28381 + }, + { + "epoch": 2.23, + "learning_rate": 4.581398868907992e-05, + "loss": 1.4316, + "step": 28382 + }, + { + "epoch": 2.23, + "learning_rate": 4.580509719306526e-05, + "loss": 1.4483, + "step": 28383 + }, + { + "epoch": 2.23, + "learning_rate": 4.579620640447652e-05, + "loss": 1.4515, + "step": 28384 + }, + { + "epoch": 2.23, + "learning_rate": 4.5787316323373955e-05, + "loss": 1.4474, + "step": 28385 + }, + { + "epoch": 2.23, + "learning_rate": 4.577842694981807e-05, + "loss": 1.4144, + "step": 28386 + }, + { + "epoch": 2.23, + "learning_rate": 4.5769538283869154e-05, + "loss": 1.4844, + "step": 28387 + }, + { + "epoch": 2.23, + "learning_rate": 4.57606503255875e-05, + "loss": 1.47, + "step": 28388 + }, + { + "epoch": 2.23, + "learning_rate": 4.5751763075033556e-05, + "loss": 1.38, + "step": 28389 + }, + { + "epoch": 2.23, + "learning_rate": 4.57428765322676e-05, + "loss": 1.4261, + "step": 28390 + }, + { + "epoch": 2.23, + "learning_rate": 4.5733990697349946e-05, + "loss": 1.4499, + "step": 28391 + }, + { + "epoch": 2.23, + "learning_rate": 4.572510557034094e-05, + "loss": 1.4635, + "step": 28392 + }, + { + "epoch": 2.23, + "learning_rate": 4.571622115130099e-05, + "loss": 1.41, + "step": 28393 + }, + { + "epoch": 2.23, + "learning_rate": 4.570733744029033e-05, + "loss": 1.4718, + "step": 28394 + }, + { + "epoch": 2.23, + "learning_rate": 4.5698454437369315e-05, + "loss": 1.437, + "step": 28395 + }, + { + "epoch": 2.23, + "learning_rate": 4.568957214259819e-05, + "loss": 1.4255, + "step": 28396 + }, + { + "epoch": 2.23, + "learning_rate": 4.568069055603733e-05, + "loss": 1.4297, + "step": 28397 + }, + { + "epoch": 2.23, + "learning_rate": 4.567180967774703e-05, + "loss": 1.4479, + "step": 28398 + }, + { + "epoch": 2.23, + "learning_rate": 4.5662929507787516e-05, + "loss": 1.4227, + "step": 28399 + }, + { + "epoch": 2.23, + "learning_rate": 4.565405004621919e-05, + "loss": 1.4289, + "step": 28400 + }, + { + "epoch": 2.23, + "learning_rate": 4.564517129310227e-05, + "loss": 1.4928, + "step": 28401 + }, + { + "epoch": 2.23, + "learning_rate": 4.5636293248497006e-05, + "loss": 1.4635, + "step": 28402 + }, + { + "epoch": 2.23, + "learning_rate": 4.5627415912463766e-05, + "loss": 1.4112, + "step": 28403 + }, + { + "epoch": 2.23, + "learning_rate": 4.5618539285062776e-05, + "loss": 1.4366, + "step": 28404 + }, + { + "epoch": 2.23, + "learning_rate": 4.560966336635426e-05, + "loss": 1.4367, + "step": 28405 + }, + { + "epoch": 2.24, + "learning_rate": 4.560078815639857e-05, + "loss": 1.4493, + "step": 28406 + }, + { + "epoch": 2.24, + "learning_rate": 4.559191365525585e-05, + "loss": 1.4677, + "step": 28407 + }, + { + "epoch": 2.24, + "learning_rate": 4.558303986298649e-05, + "loss": 1.4204, + "step": 28408 + }, + { + "epoch": 2.24, + "learning_rate": 4.5574166779650604e-05, + "loss": 1.4062, + "step": 28409 + }, + { + "epoch": 2.24, + "learning_rate": 4.556529440530854e-05, + "loss": 1.5089, + "step": 28410 + }, + { + "epoch": 2.24, + "learning_rate": 4.55564227400205e-05, + "loss": 1.4318, + "step": 28411 + }, + { + "epoch": 2.24, + "learning_rate": 4.5547551783846685e-05, + "loss": 1.3867, + "step": 28412 + }, + { + "epoch": 2.24, + "learning_rate": 4.553868153684739e-05, + "loss": 1.4398, + "step": 28413 + }, + { + "epoch": 2.24, + "learning_rate": 4.552981199908279e-05, + "loss": 1.46, + "step": 28414 + }, + { + "epoch": 2.24, + "learning_rate": 4.552094317061312e-05, + "loss": 1.5307, + "step": 28415 + }, + { + "epoch": 2.24, + "learning_rate": 4.5512075051498545e-05, + "loss": 1.4397, + "step": 28416 + }, + { + "epoch": 2.24, + "learning_rate": 4.550320764179935e-05, + "loss": 1.5078, + "step": 28417 + }, + { + "epoch": 2.24, + "learning_rate": 4.549434094157573e-05, + "loss": 1.4171, + "step": 28418 + }, + { + "epoch": 2.24, + "learning_rate": 4.548547495088782e-05, + "loss": 1.4541, + "step": 28419 + }, + { + "epoch": 2.24, + "learning_rate": 4.5476609669795886e-05, + "loss": 1.4681, + "step": 28420 + }, + { + "epoch": 2.24, + "learning_rate": 4.546774509836011e-05, + "loss": 1.4508, + "step": 28421 + }, + { + "epoch": 2.24, + "learning_rate": 4.5458881236640596e-05, + "loss": 1.3954, + "step": 28422 + }, + { + "epoch": 2.24, + "learning_rate": 4.545001808469759e-05, + "loss": 1.4582, + "step": 28423 + }, + { + "epoch": 2.24, + "learning_rate": 4.5441155642591325e-05, + "loss": 1.4295, + "step": 28424 + }, + { + "epoch": 2.24, + "learning_rate": 4.5432293910381914e-05, + "loss": 1.4496, + "step": 28425 + }, + { + "epoch": 2.24, + "learning_rate": 4.542343288812947e-05, + "loss": 1.4906, + "step": 28426 + }, + { + "epoch": 2.24, + "learning_rate": 4.5414572575894246e-05, + "loss": 1.4724, + "step": 28427 + }, + { + "epoch": 2.24, + "learning_rate": 4.5405712973736355e-05, + "loss": 1.4485, + "step": 28428 + }, + { + "epoch": 2.24, + "learning_rate": 4.539685408171592e-05, + "loss": 1.421, + "step": 28429 + }, + { + "epoch": 2.24, + "learning_rate": 4.5387995899893176e-05, + "loss": 1.4545, + "step": 28430 + }, + { + "epoch": 2.24, + "learning_rate": 4.537913842832819e-05, + "loss": 1.4834, + "step": 28431 + }, + { + "epoch": 2.24, + "learning_rate": 4.537028166708112e-05, + "loss": 1.4404, + "step": 28432 + }, + { + "epoch": 2.24, + "learning_rate": 4.536142561621206e-05, + "loss": 1.5158, + "step": 28433 + }, + { + "epoch": 2.24, + "learning_rate": 4.5352570275781224e-05, + "loss": 1.4012, + "step": 28434 + }, + { + "epoch": 2.24, + "learning_rate": 4.534371564584868e-05, + "loss": 1.4352, + "step": 28435 + }, + { + "epoch": 2.24, + "learning_rate": 4.533486172647452e-05, + "loss": 1.4213, + "step": 28436 + }, + { + "epoch": 2.24, + "learning_rate": 4.532600851771892e-05, + "loss": 1.4416, + "step": 28437 + }, + { + "epoch": 2.24, + "learning_rate": 4.531715601964197e-05, + "loss": 1.5285, + "step": 28438 + }, + { + "epoch": 2.24, + "learning_rate": 4.5308304232303704e-05, + "loss": 1.4668, + "step": 28439 + }, + { + "epoch": 2.24, + "learning_rate": 4.529945315576429e-05, + "loss": 1.4692, + "step": 28440 + }, + { + "epoch": 2.24, + "learning_rate": 4.5290602790083854e-05, + "loss": 1.5, + "step": 28441 + }, + { + "epoch": 2.24, + "learning_rate": 4.528175313532243e-05, + "loss": 1.4146, + "step": 28442 + }, + { + "epoch": 2.24, + "learning_rate": 4.527290419154008e-05, + "loss": 1.467, + "step": 28443 + }, + { + "epoch": 2.24, + "learning_rate": 4.526405595879696e-05, + "loss": 1.4488, + "step": 28444 + }, + { + "epoch": 2.24, + "learning_rate": 4.5255208437153096e-05, + "loss": 1.4344, + "step": 28445 + }, + { + "epoch": 2.24, + "learning_rate": 4.5246361626668525e-05, + "loss": 1.4442, + "step": 28446 + }, + { + "epoch": 2.24, + "learning_rate": 4.523751552740341e-05, + "loss": 1.4411, + "step": 28447 + }, + { + "epoch": 2.24, + "learning_rate": 4.522867013941772e-05, + "loss": 1.4355, + "step": 28448 + }, + { + "epoch": 2.24, + "learning_rate": 4.521982546277156e-05, + "loss": 1.5204, + "step": 28449 + }, + { + "epoch": 2.24, + "learning_rate": 4.521098149752492e-05, + "loss": 1.4609, + "step": 28450 + }, + { + "epoch": 2.24, + "learning_rate": 4.5202138243737935e-05, + "loss": 1.4562, + "step": 28451 + }, + { + "epoch": 2.24, + "learning_rate": 4.519329570147059e-05, + "loss": 1.4943, + "step": 28452 + }, + { + "epoch": 2.24, + "learning_rate": 4.518445387078288e-05, + "loss": 1.4869, + "step": 28453 + }, + { + "epoch": 2.24, + "learning_rate": 4.5175612751734905e-05, + "loss": 1.408, + "step": 28454 + }, + { + "epoch": 2.24, + "learning_rate": 4.51667723443867e-05, + "loss": 1.4806, + "step": 28455 + }, + { + "epoch": 2.24, + "learning_rate": 4.5157932648798273e-05, + "loss": 1.4237, + "step": 28456 + }, + { + "epoch": 2.24, + "learning_rate": 4.514909366502958e-05, + "loss": 1.4469, + "step": 28457 + }, + { + "epoch": 2.24, + "learning_rate": 4.514025539314072e-05, + "loss": 1.4576, + "step": 28458 + }, + { + "epoch": 2.24, + "learning_rate": 4.5131417833191656e-05, + "loss": 1.4918, + "step": 28459 + }, + { + "epoch": 2.24, + "learning_rate": 4.512258098524235e-05, + "loss": 1.4161, + "step": 28460 + }, + { + "epoch": 2.24, + "learning_rate": 4.511374484935289e-05, + "loss": 1.4483, + "step": 28461 + }, + { + "epoch": 2.24, + "learning_rate": 4.510490942558323e-05, + "loss": 1.4597, + "step": 28462 + }, + { + "epoch": 2.24, + "learning_rate": 4.509607471399329e-05, + "loss": 1.4645, + "step": 28463 + }, + { + "epoch": 2.24, + "learning_rate": 4.5087240714643155e-05, + "loss": 1.4786, + "step": 28464 + }, + { + "epoch": 2.24, + "learning_rate": 4.507840742759278e-05, + "loss": 1.4345, + "step": 28465 + }, + { + "epoch": 2.24, + "learning_rate": 4.5069574852902054e-05, + "loss": 1.4427, + "step": 28466 + }, + { + "epoch": 2.24, + "learning_rate": 4.506074299063107e-05, + "loss": 1.4398, + "step": 28467 + }, + { + "epoch": 2.24, + "learning_rate": 4.5051911840839725e-05, + "loss": 1.5267, + "step": 28468 + }, + { + "epoch": 2.24, + "learning_rate": 4.5043081403587974e-05, + "loss": 1.4556, + "step": 28469 + }, + { + "epoch": 2.24, + "learning_rate": 4.5034251678935684e-05, + "loss": 1.4238, + "step": 28470 + }, + { + "epoch": 2.24, + "learning_rate": 4.5025422666943014e-05, + "loss": 1.4825, + "step": 28471 + }, + { + "epoch": 2.24, + "learning_rate": 4.501659436766977e-05, + "loss": 1.4288, + "step": 28472 + }, + { + "epoch": 2.24, + "learning_rate": 4.500776678117594e-05, + "loss": 1.4337, + "step": 28473 + }, + { + "epoch": 2.24, + "learning_rate": 4.499893990752137e-05, + "loss": 1.4374, + "step": 28474 + }, + { + "epoch": 2.24, + "learning_rate": 4.499011374676611e-05, + "loss": 1.4374, + "step": 28475 + }, + { + "epoch": 2.24, + "learning_rate": 4.4981288298970026e-05, + "loss": 1.4415, + "step": 28476 + }, + { + "epoch": 2.24, + "learning_rate": 4.4972463564193e-05, + "loss": 1.4477, + "step": 28477 + }, + { + "epoch": 2.24, + "learning_rate": 4.496363954249502e-05, + "loss": 1.4076, + "step": 28478 + }, + { + "epoch": 2.24, + "learning_rate": 4.4954816233935974e-05, + "loss": 1.4573, + "step": 28479 + }, + { + "epoch": 2.24, + "learning_rate": 4.4945993638575714e-05, + "loss": 1.4691, + "step": 28480 + }, + { + "epoch": 2.24, + "learning_rate": 4.493717175647422e-05, + "loss": 1.4502, + "step": 28481 + }, + { + "epoch": 2.24, + "learning_rate": 4.492835058769134e-05, + "loss": 1.5082, + "step": 28482 + }, + { + "epoch": 2.24, + "learning_rate": 4.4919530132286954e-05, + "loss": 1.4402, + "step": 28483 + }, + { + "epoch": 2.24, + "learning_rate": 4.491071039032101e-05, + "loss": 1.4255, + "step": 28484 + }, + { + "epoch": 2.24, + "learning_rate": 4.490189136185335e-05, + "loss": 1.5001, + "step": 28485 + }, + { + "epoch": 2.24, + "learning_rate": 4.48930730469438e-05, + "loss": 1.424, + "step": 28486 + }, + { + "epoch": 2.24, + "learning_rate": 4.4884255445652274e-05, + "loss": 1.5139, + "step": 28487 + }, + { + "epoch": 2.24, + "learning_rate": 4.48754385580387e-05, + "loss": 1.4758, + "step": 28488 + }, + { + "epoch": 2.24, + "learning_rate": 4.4866622384162884e-05, + "loss": 1.4511, + "step": 28489 + }, + { + "epoch": 2.24, + "learning_rate": 4.485780692408468e-05, + "loss": 1.4652, + "step": 28490 + }, + { + "epoch": 2.24, + "learning_rate": 4.484899217786391e-05, + "loss": 1.4513, + "step": 28491 + }, + { + "epoch": 2.24, + "learning_rate": 4.484017814556049e-05, + "loss": 1.4187, + "step": 28492 + }, + { + "epoch": 2.24, + "learning_rate": 4.483136482723424e-05, + "loss": 1.402, + "step": 28493 + }, + { + "epoch": 2.24, + "learning_rate": 4.482255222294494e-05, + "loss": 1.4142, + "step": 28494 + }, + { + "epoch": 2.24, + "learning_rate": 4.481374033275249e-05, + "loss": 1.4221, + "step": 28495 + }, + { + "epoch": 2.24, + "learning_rate": 4.4804929156716736e-05, + "loss": 1.4689, + "step": 28496 + }, + { + "epoch": 2.24, + "learning_rate": 4.479611869489739e-05, + "loss": 1.443, + "step": 28497 + }, + { + "epoch": 2.24, + "learning_rate": 4.478730894735439e-05, + "loss": 1.4371, + "step": 28498 + }, + { + "epoch": 2.24, + "learning_rate": 4.477849991414751e-05, + "loss": 1.4445, + "step": 28499 + }, + { + "epoch": 2.24, + "learning_rate": 4.4769691595336485e-05, + "loss": 1.4652, + "step": 28500 + }, + { + "epoch": 2.24, + "learning_rate": 4.4760883990981196e-05, + "loss": 1.4546, + "step": 28501 + }, + { + "epoch": 2.24, + "learning_rate": 4.475207710114148e-05, + "loss": 1.3867, + "step": 28502 + }, + { + "epoch": 2.24, + "learning_rate": 4.4743270925877085e-05, + "loss": 1.4357, + "step": 28503 + }, + { + "epoch": 2.24, + "learning_rate": 4.473446546524772e-05, + "loss": 1.4606, + "step": 28504 + }, + { + "epoch": 2.24, + "learning_rate": 4.472566071931331e-05, + "loss": 1.4876, + "step": 28505 + }, + { + "epoch": 2.24, + "learning_rate": 4.4716856688133576e-05, + "loss": 1.4386, + "step": 28506 + }, + { + "epoch": 2.24, + "learning_rate": 4.4708053371768274e-05, + "loss": 1.4568, + "step": 28507 + }, + { + "epoch": 2.24, + "learning_rate": 4.4699250770277136e-05, + "loss": 1.4598, + "step": 28508 + }, + { + "epoch": 2.24, + "learning_rate": 4.469044888372003e-05, + "loss": 1.4602, + "step": 28509 + }, + { + "epoch": 2.24, + "learning_rate": 4.4681647712156657e-05, + "loss": 1.4554, + "step": 28510 + }, + { + "epoch": 2.24, + "learning_rate": 4.4672847255646746e-05, + "loss": 1.3991, + "step": 28511 + }, + { + "epoch": 2.24, + "learning_rate": 4.46640475142501e-05, + "loss": 1.4266, + "step": 28512 + }, + { + "epoch": 2.24, + "learning_rate": 4.4655248488026446e-05, + "loss": 1.4371, + "step": 28513 + }, + { + "epoch": 2.24, + "learning_rate": 4.464645017703548e-05, + "loss": 1.4741, + "step": 28514 + }, + { + "epoch": 2.24, + "learning_rate": 4.4637652581337024e-05, + "loss": 1.433, + "step": 28515 + }, + { + "epoch": 2.24, + "learning_rate": 4.4628855700990765e-05, + "loss": 1.4857, + "step": 28516 + }, + { + "epoch": 2.24, + "learning_rate": 4.462005953605638e-05, + "loss": 1.4137, + "step": 28517 + }, + { + "epoch": 2.24, + "learning_rate": 4.461126408659365e-05, + "loss": 1.4699, + "step": 28518 + }, + { + "epoch": 2.24, + "learning_rate": 4.46024693526623e-05, + "loss": 1.5006, + "step": 28519 + }, + { + "epoch": 2.24, + "learning_rate": 4.459367533432203e-05, + "loss": 1.4462, + "step": 28520 + }, + { + "epoch": 2.24, + "learning_rate": 4.458488203163249e-05, + "loss": 1.5194, + "step": 28521 + }, + { + "epoch": 2.24, + "learning_rate": 4.457608944465349e-05, + "loss": 1.4625, + "step": 28522 + }, + { + "epoch": 2.24, + "learning_rate": 4.456729757344465e-05, + "loss": 1.4502, + "step": 28523 + }, + { + "epoch": 2.24, + "learning_rate": 4.455850641806562e-05, + "loss": 1.4689, + "step": 28524 + }, + { + "epoch": 2.24, + "learning_rate": 4.454971597857621e-05, + "loss": 1.4075, + "step": 28525 + }, + { + "epoch": 2.24, + "learning_rate": 4.454092625503603e-05, + "loss": 1.4822, + "step": 28526 + }, + { + "epoch": 2.24, + "learning_rate": 4.453213724750476e-05, + "loss": 1.4483, + "step": 28527 + }, + { + "epoch": 2.24, + "learning_rate": 4.4523348956042034e-05, + "loss": 1.4274, + "step": 28528 + }, + { + "epoch": 2.24, + "learning_rate": 4.45145613807076e-05, + "loss": 1.4746, + "step": 28529 + }, + { + "epoch": 2.24, + "learning_rate": 4.450577452156109e-05, + "loss": 1.462, + "step": 28530 + }, + { + "epoch": 2.24, + "learning_rate": 4.449698837866211e-05, + "loss": 1.4588, + "step": 28531 + }, + { + "epoch": 2.24, + "learning_rate": 4.44882029520704e-05, + "loss": 1.4696, + "step": 28532 + }, + { + "epoch": 2.25, + "learning_rate": 4.447941824184553e-05, + "loss": 1.4863, + "step": 28533 + }, + { + "epoch": 2.25, + "learning_rate": 4.447063424804721e-05, + "loss": 1.4783, + "step": 28534 + }, + { + "epoch": 2.25, + "learning_rate": 4.4461850970735e-05, + "loss": 1.4743, + "step": 28535 + }, + { + "epoch": 2.25, + "learning_rate": 4.445306840996864e-05, + "loss": 1.4006, + "step": 28536 + }, + { + "epoch": 2.25, + "learning_rate": 4.444428656580769e-05, + "loss": 1.4944, + "step": 28537 + }, + { + "epoch": 2.25, + "learning_rate": 4.443550543831174e-05, + "loss": 1.4806, + "step": 28538 + }, + { + "epoch": 2.25, + "learning_rate": 4.442672502754051e-05, + "loss": 1.4818, + "step": 28539 + }, + { + "epoch": 2.25, + "learning_rate": 4.4417945333553535e-05, + "loss": 1.4433, + "step": 28540 + }, + { + "epoch": 2.25, + "learning_rate": 4.4409166356410426e-05, + "loss": 1.4757, + "step": 28541 + }, + { + "epoch": 2.25, + "learning_rate": 4.4400388096170837e-05, + "loss": 1.4301, + "step": 28542 + }, + { + "epoch": 2.25, + "learning_rate": 4.439161055289434e-05, + "loss": 1.4114, + "step": 28543 + }, + { + "epoch": 2.25, + "learning_rate": 4.4382833726640524e-05, + "loss": 1.4688, + "step": 28544 + }, + { + "epoch": 2.25, + "learning_rate": 4.437405761746894e-05, + "loss": 1.4308, + "step": 28545 + }, + { + "epoch": 2.25, + "learning_rate": 4.4365282225439273e-05, + "loss": 1.429, + "step": 28546 + }, + { + "epoch": 2.25, + "learning_rate": 4.435650755061104e-05, + "loss": 1.4461, + "step": 28547 + }, + { + "epoch": 2.25, + "learning_rate": 4.434773359304377e-05, + "loss": 1.5199, + "step": 28548 + }, + { + "epoch": 2.25, + "learning_rate": 4.4338960352797084e-05, + "loss": 1.4821, + "step": 28549 + }, + { + "epoch": 2.25, + "learning_rate": 4.433018782993059e-05, + "loss": 1.492, + "step": 28550 + }, + { + "epoch": 2.25, + "learning_rate": 4.432141602450381e-05, + "loss": 1.4527, + "step": 28551 + }, + { + "epoch": 2.25, + "learning_rate": 4.431264493657627e-05, + "loss": 1.4182, + "step": 28552 + }, + { + "epoch": 2.25, + "learning_rate": 4.430387456620757e-05, + "loss": 1.4218, + "step": 28553 + }, + { + "epoch": 2.25, + "learning_rate": 4.429510491345725e-05, + "loss": 1.4231, + "step": 28554 + }, + { + "epoch": 2.25, + "learning_rate": 4.428633597838477e-05, + "loss": 1.5022, + "step": 28555 + }, + { + "epoch": 2.25, + "learning_rate": 4.427756776104981e-05, + "loss": 1.4118, + "step": 28556 + }, + { + "epoch": 2.25, + "learning_rate": 4.426880026151179e-05, + "loss": 1.4121, + "step": 28557 + }, + { + "epoch": 2.25, + "learning_rate": 4.426003347983022e-05, + "loss": 1.4841, + "step": 28558 + }, + { + "epoch": 2.25, + "learning_rate": 4.425126741606475e-05, + "loss": 1.4661, + "step": 28559 + }, + { + "epoch": 2.25, + "learning_rate": 4.424250207027479e-05, + "loss": 1.4765, + "step": 28560 + }, + { + "epoch": 2.25, + "learning_rate": 4.423373744251989e-05, + "loss": 1.4469, + "step": 28561 + }, + { + "epoch": 2.25, + "learning_rate": 4.422497353285949e-05, + "loss": 1.4572, + "step": 28562 + }, + { + "epoch": 2.25, + "learning_rate": 4.421621034135321e-05, + "loss": 1.439, + "step": 28563 + }, + { + "epoch": 2.25, + "learning_rate": 4.4207447868060427e-05, + "loss": 1.4443, + "step": 28564 + }, + { + "epoch": 2.25, + "learning_rate": 4.4198686113040696e-05, + "loss": 1.4489, + "step": 28565 + }, + { + "epoch": 2.25, + "learning_rate": 4.418992507635355e-05, + "loss": 1.4153, + "step": 28566 + }, + { + "epoch": 2.25, + "learning_rate": 4.4181164758058416e-05, + "loss": 1.3983, + "step": 28567 + }, + { + "epoch": 2.25, + "learning_rate": 4.417240515821479e-05, + "loss": 1.4916, + "step": 28568 + }, + { + "epoch": 2.25, + "learning_rate": 4.416364627688206e-05, + "loss": 1.4732, + "step": 28569 + }, + { + "epoch": 2.25, + "learning_rate": 4.4154888114119834e-05, + "loss": 1.4626, + "step": 28570 + }, + { + "epoch": 2.25, + "learning_rate": 4.41461306699875e-05, + "loss": 1.4288, + "step": 28571 + }, + { + "epoch": 2.25, + "learning_rate": 4.413737394454449e-05, + "loss": 1.478, + "step": 28572 + }, + { + "epoch": 2.25, + "learning_rate": 4.4128617937850325e-05, + "loss": 1.4738, + "step": 28573 + }, + { + "epoch": 2.25, + "learning_rate": 4.4119862649964424e-05, + "loss": 1.4748, + "step": 28574 + }, + { + "epoch": 2.25, + "learning_rate": 4.411110808094617e-05, + "loss": 1.4436, + "step": 28575 + }, + { + "epoch": 2.25, + "learning_rate": 4.410235423085512e-05, + "loss": 1.4667, + "step": 28576 + }, + { + "epoch": 2.25, + "learning_rate": 4.409360109975063e-05, + "loss": 1.4678, + "step": 28577 + }, + { + "epoch": 2.25, + "learning_rate": 4.4084848687692104e-05, + "loss": 1.4732, + "step": 28578 + }, + { + "epoch": 2.25, + "learning_rate": 4.407609699473905e-05, + "loss": 1.4678, + "step": 28579 + }, + { + "epoch": 2.25, + "learning_rate": 4.4067346020950814e-05, + "loss": 1.4729, + "step": 28580 + }, + { + "epoch": 2.25, + "learning_rate": 4.4058595766386864e-05, + "loss": 1.4694, + "step": 28581 + }, + { + "epoch": 2.25, + "learning_rate": 4.4049846231106555e-05, + "loss": 1.4563, + "step": 28582 + }, + { + "epoch": 2.25, + "learning_rate": 4.404109741516936e-05, + "loss": 1.4296, + "step": 28583 + }, + { + "epoch": 2.25, + "learning_rate": 4.403234931863464e-05, + "loss": 1.5036, + "step": 28584 + }, + { + "epoch": 2.25, + "learning_rate": 4.402360194156179e-05, + "loss": 1.4671, + "step": 28585 + }, + { + "epoch": 2.25, + "learning_rate": 4.401485528401017e-05, + "loss": 1.4636, + "step": 28586 + }, + { + "epoch": 2.25, + "learning_rate": 4.400610934603923e-05, + "loss": 1.4846, + "step": 28587 + }, + { + "epoch": 2.25, + "learning_rate": 4.399736412770831e-05, + "loss": 1.4734, + "step": 28588 + }, + { + "epoch": 2.25, + "learning_rate": 4.3988619629076746e-05, + "loss": 1.4287, + "step": 28589 + }, + { + "epoch": 2.25, + "learning_rate": 4.3979875850204e-05, + "loss": 1.4489, + "step": 28590 + }, + { + "epoch": 2.25, + "learning_rate": 4.39711327911494e-05, + "loss": 1.4508, + "step": 28591 + }, + { + "epoch": 2.25, + "learning_rate": 4.396239045197224e-05, + "loss": 1.4602, + "step": 28592 + }, + { + "epoch": 2.25, + "learning_rate": 4.395364883273198e-05, + "loss": 1.4415, + "step": 28593 + }, + { + "epoch": 2.25, + "learning_rate": 4.394490793348792e-05, + "loss": 1.5127, + "step": 28594 + }, + { + "epoch": 2.25, + "learning_rate": 4.393616775429938e-05, + "loss": 1.4478, + "step": 28595 + }, + { + "epoch": 2.25, + "learning_rate": 4.39274282952257e-05, + "loss": 1.4065, + "step": 28596 + }, + { + "epoch": 2.25, + "learning_rate": 4.3918689556326313e-05, + "loss": 1.4858, + "step": 28597 + }, + { + "epoch": 2.25, + "learning_rate": 4.390995153766048e-05, + "loss": 1.4991, + "step": 28598 + }, + { + "epoch": 2.25, + "learning_rate": 4.390121423928749e-05, + "loss": 1.4251, + "step": 28599 + }, + { + "epoch": 2.25, + "learning_rate": 4.389247766126675e-05, + "loss": 1.3911, + "step": 28600 + }, + { + "epoch": 2.25, + "learning_rate": 4.388374180365753e-05, + "loss": 1.4777, + "step": 28601 + }, + { + "epoch": 2.25, + "learning_rate": 4.387500666651913e-05, + "loss": 1.5011, + "step": 28602 + }, + { + "epoch": 2.25, + "learning_rate": 4.386627224991083e-05, + "loss": 1.435, + "step": 28603 + }, + { + "epoch": 2.25, + "learning_rate": 4.3857538553892024e-05, + "loss": 1.4651, + "step": 28604 + }, + { + "epoch": 2.25, + "learning_rate": 4.384880557852196e-05, + "loss": 1.463, + "step": 28605 + }, + { + "epoch": 2.25, + "learning_rate": 4.384007332385988e-05, + "loss": 1.494, + "step": 28606 + }, + { + "epoch": 2.25, + "learning_rate": 4.383134178996517e-05, + "loss": 1.4852, + "step": 28607 + }, + { + "epoch": 2.25, + "learning_rate": 4.382261097689704e-05, + "loss": 1.438, + "step": 28608 + }, + { + "epoch": 2.25, + "learning_rate": 4.3813880884714756e-05, + "loss": 1.4736, + "step": 28609 + }, + { + "epoch": 2.25, + "learning_rate": 4.3805151513477666e-05, + "loss": 1.4553, + "step": 28610 + }, + { + "epoch": 2.25, + "learning_rate": 4.379642286324495e-05, + "loss": 1.4519, + "step": 28611 + }, + { + "epoch": 2.25, + "learning_rate": 4.378769493407595e-05, + "loss": 1.4503, + "step": 28612 + }, + { + "epoch": 2.25, + "learning_rate": 4.377896772602985e-05, + "loss": 1.4669, + "step": 28613 + }, + { + "epoch": 2.25, + "learning_rate": 4.3770241239165996e-05, + "loss": 1.429, + "step": 28614 + }, + { + "epoch": 2.25, + "learning_rate": 4.376151547354358e-05, + "loss": 1.4193, + "step": 28615 + }, + { + "epoch": 2.25, + "learning_rate": 4.3752790429221794e-05, + "loss": 1.4426, + "step": 28616 + }, + { + "epoch": 2.25, + "learning_rate": 4.3744066106259965e-05, + "loss": 1.4631, + "step": 28617 + }, + { + "epoch": 2.25, + "learning_rate": 4.373534250471731e-05, + "loss": 1.45, + "step": 28618 + }, + { + "epoch": 2.25, + "learning_rate": 4.3726619624653034e-05, + "loss": 1.5317, + "step": 28619 + }, + { + "epoch": 2.25, + "learning_rate": 4.3717897466126306e-05, + "loss": 1.4457, + "step": 28620 + }, + { + "epoch": 2.25, + "learning_rate": 4.370917602919646e-05, + "loss": 1.4582, + "step": 28621 + }, + { + "epoch": 2.25, + "learning_rate": 4.3700455313922644e-05, + "loss": 1.4589, + "step": 28622 + }, + { + "epoch": 2.25, + "learning_rate": 4.369173532036404e-05, + "loss": 1.4644, + "step": 28623 + }, + { + "epoch": 2.25, + "learning_rate": 4.3683016048579934e-05, + "loss": 1.4575, + "step": 28624 + }, + { + "epoch": 2.25, + "learning_rate": 4.367429749862947e-05, + "loss": 1.424, + "step": 28625 + }, + { + "epoch": 2.25, + "learning_rate": 4.366557967057181e-05, + "loss": 1.4411, + "step": 28626 + }, + { + "epoch": 2.25, + "learning_rate": 4.365686256446618e-05, + "loss": 1.4268, + "step": 28627 + }, + { + "epoch": 2.25, + "learning_rate": 4.364814618037181e-05, + "loss": 1.4415, + "step": 28628 + }, + { + "epoch": 2.25, + "learning_rate": 4.363943051834785e-05, + "loss": 1.4372, + "step": 28629 + }, + { + "epoch": 2.25, + "learning_rate": 4.36307155784534e-05, + "loss": 1.4728, + "step": 28630 + }, + { + "epoch": 2.25, + "learning_rate": 4.362200136074775e-05, + "loss": 1.4236, + "step": 28631 + }, + { + "epoch": 2.25, + "learning_rate": 4.361328786529e-05, + "loss": 1.4548, + "step": 28632 + }, + { + "epoch": 2.25, + "learning_rate": 4.360457509213928e-05, + "loss": 1.4114, + "step": 28633 + }, + { + "epoch": 2.25, + "learning_rate": 4.3595863041354824e-05, + "loss": 1.4615, + "step": 28634 + }, + { + "epoch": 2.25, + "learning_rate": 4.3587151712995724e-05, + "loss": 1.4048, + "step": 28635 + }, + { + "epoch": 2.25, + "learning_rate": 4.357844110712111e-05, + "loss": 1.4113, + "step": 28636 + }, + { + "epoch": 2.25, + "learning_rate": 4.3569731223790186e-05, + "loss": 1.485, + "step": 28637 + }, + { + "epoch": 2.25, + "learning_rate": 4.3561022063062076e-05, + "loss": 1.4513, + "step": 28638 + }, + { + "epoch": 2.25, + "learning_rate": 4.3552313624995866e-05, + "loss": 1.4277, + "step": 28639 + }, + { + "epoch": 2.25, + "learning_rate": 4.354360590965067e-05, + "loss": 1.4951, + "step": 28640 + }, + { + "epoch": 2.25, + "learning_rate": 4.353489891708569e-05, + "loss": 1.4499, + "step": 28641 + }, + { + "epoch": 2.25, + "learning_rate": 4.352619264735999e-05, + "loss": 1.4058, + "step": 28642 + }, + { + "epoch": 2.25, + "learning_rate": 4.3517487100532635e-05, + "loss": 1.482, + "step": 28643 + }, + { + "epoch": 2.25, + "learning_rate": 4.3508782276662784e-05, + "loss": 1.4801, + "step": 28644 + }, + { + "epoch": 2.25, + "learning_rate": 4.3500078175809576e-05, + "loss": 1.4593, + "step": 28645 + }, + { + "epoch": 2.25, + "learning_rate": 4.349137479803207e-05, + "loss": 1.4485, + "step": 28646 + }, + { + "epoch": 2.25, + "learning_rate": 4.3482672143389315e-05, + "loss": 1.4241, + "step": 28647 + }, + { + "epoch": 2.25, + "learning_rate": 4.347397021194048e-05, + "loss": 1.4908, + "step": 28648 + }, + { + "epoch": 2.25, + "learning_rate": 4.3465269003744584e-05, + "loss": 1.4179, + "step": 28649 + }, + { + "epoch": 2.25, + "learning_rate": 4.345656851886068e-05, + "loss": 1.4824, + "step": 28650 + }, + { + "epoch": 2.25, + "learning_rate": 4.344786875734795e-05, + "loss": 1.3816, + "step": 28651 + }, + { + "epoch": 2.25, + "learning_rate": 4.343916971926536e-05, + "loss": 1.4961, + "step": 28652 + }, + { + "epoch": 2.25, + "learning_rate": 4.3430471404671974e-05, + "loss": 1.509, + "step": 28653 + }, + { + "epoch": 2.25, + "learning_rate": 4.342177381362691e-05, + "loss": 1.4366, + "step": 28654 + }, + { + "epoch": 2.25, + "learning_rate": 4.34130769461892e-05, + "loss": 1.4673, + "step": 28655 + }, + { + "epoch": 2.25, + "learning_rate": 4.340438080241787e-05, + "loss": 1.4188, + "step": 28656 + }, + { + "epoch": 2.25, + "learning_rate": 4.339568538237194e-05, + "loss": 1.4526, + "step": 28657 + }, + { + "epoch": 2.25, + "learning_rate": 4.33869906861105e-05, + "loss": 1.5003, + "step": 28658 + }, + { + "epoch": 2.25, + "learning_rate": 4.337829671369252e-05, + "loss": 1.4273, + "step": 28659 + }, + { + "epoch": 2.26, + "learning_rate": 4.336960346517712e-05, + "loss": 1.3953, + "step": 28660 + }, + { + "epoch": 2.26, + "learning_rate": 4.336091094062322e-05, + "loss": 1.4172, + "step": 28661 + }, + { + "epoch": 2.26, + "learning_rate": 4.335221914008994e-05, + "loss": 1.4352, + "step": 28662 + }, + { + "epoch": 2.26, + "learning_rate": 4.334352806363622e-05, + "loss": 1.4738, + "step": 28663 + }, + { + "epoch": 2.26, + "learning_rate": 4.3334837711321056e-05, + "loss": 1.4071, + "step": 28664 + }, + { + "epoch": 2.26, + "learning_rate": 4.332614808320353e-05, + "loss": 1.4781, + "step": 28665 + }, + { + "epoch": 2.26, + "learning_rate": 4.3317459179342565e-05, + "loss": 1.4725, + "step": 28666 + }, + { + "epoch": 2.26, + "learning_rate": 4.330877099979717e-05, + "loss": 1.4513, + "step": 28667 + }, + { + "epoch": 2.26, + "learning_rate": 4.330008354462636e-05, + "loss": 1.4043, + "step": 28668 + }, + { + "epoch": 2.26, + "learning_rate": 4.329139681388911e-05, + "loss": 1.4435, + "step": 28669 + }, + { + "epoch": 2.26, + "learning_rate": 4.328271080764435e-05, + "loss": 1.4616, + "step": 28670 + }, + { + "epoch": 2.26, + "learning_rate": 4.3274025525951124e-05, + "loss": 1.4431, + "step": 28671 + }, + { + "epoch": 2.26, + "learning_rate": 4.326534096886838e-05, + "loss": 1.4366, + "step": 28672 + }, + { + "epoch": 2.26, + "learning_rate": 4.325665713645507e-05, + "loss": 1.4997, + "step": 28673 + }, + { + "epoch": 2.26, + "learning_rate": 4.324797402877005e-05, + "loss": 1.4523, + "step": 28674 + }, + { + "epoch": 2.26, + "learning_rate": 4.3239291645872475e-05, + "loss": 1.4331, + "step": 28675 + }, + { + "epoch": 2.26, + "learning_rate": 4.3230609987821204e-05, + "loss": 1.4735, + "step": 28676 + }, + { + "epoch": 2.26, + "learning_rate": 4.3221929054675116e-05, + "loss": 1.4207, + "step": 28677 + }, + { + "epoch": 2.26, + "learning_rate": 4.321324884649325e-05, + "loss": 1.5048, + "step": 28678 + }, + { + "epoch": 2.26, + "learning_rate": 4.320456936333449e-05, + "loss": 1.461, + "step": 28679 + }, + { + "epoch": 2.26, + "learning_rate": 4.319589060525778e-05, + "loss": 1.4681, + "step": 28680 + }, + { + "epoch": 2.26, + "learning_rate": 4.318721257232198e-05, + "loss": 1.4263, + "step": 28681 + }, + { + "epoch": 2.26, + "learning_rate": 4.317853526458611e-05, + "loss": 1.3856, + "step": 28682 + }, + { + "epoch": 2.26, + "learning_rate": 4.316985868210903e-05, + "loss": 1.423, + "step": 28683 + }, + { + "epoch": 2.26, + "learning_rate": 4.3161182824949626e-05, + "loss": 1.4764, + "step": 28684 + }, + { + "epoch": 2.26, + "learning_rate": 4.315250769316686e-05, + "loss": 1.4807, + "step": 28685 + }, + { + "epoch": 2.26, + "learning_rate": 4.314383328681961e-05, + "loss": 1.4266, + "step": 28686 + }, + { + "epoch": 2.26, + "learning_rate": 4.313515960596672e-05, + "loss": 1.4361, + "step": 28687 + }, + { + "epoch": 2.26, + "learning_rate": 4.3126486650667166e-05, + "loss": 1.4678, + "step": 28688 + }, + { + "epoch": 2.26, + "learning_rate": 4.3117814420979794e-05, + "loss": 1.4269, + "step": 28689 + }, + { + "epoch": 2.26, + "learning_rate": 4.310914291696344e-05, + "loss": 1.4314, + "step": 28690 + }, + { + "epoch": 2.26, + "learning_rate": 4.3100472138677e-05, + "loss": 1.4473, + "step": 28691 + }, + { + "epoch": 2.26, + "learning_rate": 4.309180208617943e-05, + "loss": 1.4964, + "step": 28692 + }, + { + "epoch": 2.26, + "learning_rate": 4.308313275952952e-05, + "loss": 1.4577, + "step": 28693 + }, + { + "epoch": 2.26, + "learning_rate": 4.307446415878608e-05, + "loss": 1.4525, + "step": 28694 + }, + { + "epoch": 2.26, + "learning_rate": 4.306579628400808e-05, + "loss": 1.4229, + "step": 28695 + }, + { + "epoch": 2.26, + "learning_rate": 4.3057129135254307e-05, + "loss": 1.4127, + "step": 28696 + }, + { + "epoch": 2.26, + "learning_rate": 4.3048462712583606e-05, + "loss": 1.4211, + "step": 28697 + }, + { + "epoch": 2.26, + "learning_rate": 4.3039797016054784e-05, + "loss": 1.3967, + "step": 28698 + }, + { + "epoch": 2.26, + "learning_rate": 4.3031132045726765e-05, + "loss": 1.4588, + "step": 28699 + }, + { + "epoch": 2.26, + "learning_rate": 4.3022467801658314e-05, + "loss": 1.4497, + "step": 28700 + }, + { + "epoch": 2.26, + "learning_rate": 4.3013804283908235e-05, + "loss": 1.479, + "step": 28701 + }, + { + "epoch": 2.26, + "learning_rate": 4.300514149253543e-05, + "loss": 1.4408, + "step": 28702 + }, + { + "epoch": 2.26, + "learning_rate": 4.299647942759867e-05, + "loss": 1.4354, + "step": 28703 + }, + { + "epoch": 2.26, + "learning_rate": 4.298781808915672e-05, + "loss": 1.4438, + "step": 28704 + }, + { + "epoch": 2.26, + "learning_rate": 4.297915747726848e-05, + "loss": 1.469, + "step": 28705 + }, + { + "epoch": 2.26, + "learning_rate": 4.297049759199265e-05, + "loss": 1.4073, + "step": 28706 + }, + { + "epoch": 2.26, + "learning_rate": 4.296183843338812e-05, + "loss": 1.4703, + "step": 28707 + }, + { + "epoch": 2.26, + "learning_rate": 4.295318000151359e-05, + "loss": 1.4952, + "step": 28708 + }, + { + "epoch": 2.26, + "learning_rate": 4.2944522296427964e-05, + "loss": 1.4241, + "step": 28709 + }, + { + "epoch": 2.26, + "learning_rate": 4.293586531818993e-05, + "loss": 1.5281, + "step": 28710 + }, + { + "epoch": 2.26, + "learning_rate": 4.292720906685825e-05, + "loss": 1.4347, + "step": 28711 + }, + { + "epoch": 2.26, + "learning_rate": 4.2918553542491776e-05, + "loss": 1.4917, + "step": 28712 + }, + { + "epoch": 2.26, + "learning_rate": 4.290989874514923e-05, + "loss": 1.4647, + "step": 28713 + }, + { + "epoch": 2.26, + "learning_rate": 4.290124467488939e-05, + "loss": 1.3839, + "step": 28714 + }, + { + "epoch": 2.26, + "learning_rate": 4.289259133177093e-05, + "loss": 1.4515, + "step": 28715 + }, + { + "epoch": 2.26, + "learning_rate": 4.288393871585272e-05, + "loss": 1.4461, + "step": 28716 + }, + { + "epoch": 2.26, + "learning_rate": 4.2875286827193465e-05, + "loss": 1.4652, + "step": 28717 + }, + { + "epoch": 2.26, + "learning_rate": 4.286663566585184e-05, + "loss": 1.4607, + "step": 28718 + }, + { + "epoch": 2.26, + "learning_rate": 4.2857985231886675e-05, + "loss": 1.4744, + "step": 28719 + }, + { + "epoch": 2.26, + "learning_rate": 4.284933552535668e-05, + "loss": 1.4487, + "step": 28720 + }, + { + "epoch": 2.26, + "learning_rate": 4.2840686546320516e-05, + "loss": 1.5305, + "step": 28721 + }, + { + "epoch": 2.26, + "learning_rate": 4.283203829483696e-05, + "loss": 1.4187, + "step": 28722 + }, + { + "epoch": 2.26, + "learning_rate": 4.282339077096477e-05, + "loss": 1.505, + "step": 28723 + }, + { + "epoch": 2.26, + "learning_rate": 4.28147439747626e-05, + "loss": 1.4275, + "step": 28724 + }, + { + "epoch": 2.26, + "learning_rate": 4.2806097906289124e-05, + "loss": 1.4316, + "step": 28725 + }, + { + "epoch": 2.26, + "learning_rate": 4.2797452565603134e-05, + "loss": 1.4751, + "step": 28726 + }, + { + "epoch": 2.26, + "learning_rate": 4.278880795276329e-05, + "loss": 1.4567, + "step": 28727 + }, + { + "epoch": 2.26, + "learning_rate": 4.278016406782824e-05, + "loss": 1.475, + "step": 28728 + }, + { + "epoch": 2.26, + "learning_rate": 4.277152091085674e-05, + "loss": 1.462, + "step": 28729 + }, + { + "epoch": 2.26, + "learning_rate": 4.276287848190743e-05, + "loss": 1.4791, + "step": 28730 + }, + { + "epoch": 2.26, + "learning_rate": 4.2754236781039e-05, + "loss": 1.5469, + "step": 28731 + }, + { + "epoch": 2.26, + "learning_rate": 4.274559580831009e-05, + "loss": 1.4485, + "step": 28732 + }, + { + "epoch": 2.26, + "learning_rate": 4.273695556377943e-05, + "loss": 1.4676, + "step": 28733 + }, + { + "epoch": 2.26, + "learning_rate": 4.272831604750566e-05, + "loss": 1.455, + "step": 28734 + }, + { + "epoch": 2.26, + "learning_rate": 4.2719677259547355e-05, + "loss": 1.4961, + "step": 28735 + }, + { + "epoch": 2.26, + "learning_rate": 4.27110391999633e-05, + "loss": 1.4606, + "step": 28736 + }, + { + "epoch": 2.26, + "learning_rate": 4.270240186881205e-05, + "loss": 1.4145, + "step": 28737 + }, + { + "epoch": 2.26, + "learning_rate": 4.2693765266152306e-05, + "loss": 1.4003, + "step": 28738 + }, + { + "epoch": 2.26, + "learning_rate": 4.2685129392042635e-05, + "loss": 1.4354, + "step": 28739 + }, + { + "epoch": 2.26, + "learning_rate": 4.2676494246541774e-05, + "loss": 1.4487, + "step": 28740 + }, + { + "epoch": 2.26, + "learning_rate": 4.266785982970829e-05, + "loss": 1.5597, + "step": 28741 + }, + { + "epoch": 2.26, + "learning_rate": 4.265922614160075e-05, + "loss": 1.4667, + "step": 28742 + }, + { + "epoch": 2.26, + "learning_rate": 4.2650593182277874e-05, + "loss": 1.4148, + "step": 28743 + }, + { + "epoch": 2.26, + "learning_rate": 4.264196095179824e-05, + "loss": 1.4333, + "step": 28744 + }, + { + "epoch": 2.26, + "learning_rate": 4.263332945022039e-05, + "loss": 1.4897, + "step": 28745 + }, + { + "epoch": 2.26, + "learning_rate": 4.262469867760305e-05, + "loss": 1.4005, + "step": 28746 + }, + { + "epoch": 2.26, + "learning_rate": 4.2616068634004716e-05, + "loss": 1.4483, + "step": 28747 + }, + { + "epoch": 2.26, + "learning_rate": 4.2607439319484004e-05, + "loss": 1.463, + "step": 28748 + }, + { + "epoch": 2.26, + "learning_rate": 4.2598810734099546e-05, + "loss": 1.4132, + "step": 28749 + }, + { + "epoch": 2.26, + "learning_rate": 4.25901828779099e-05, + "loss": 1.4595, + "step": 28750 + }, + { + "epoch": 2.26, + "learning_rate": 4.2581555750973634e-05, + "loss": 1.4209, + "step": 28751 + }, + { + "epoch": 2.26, + "learning_rate": 4.257292935334928e-05, + "loss": 1.4529, + "step": 28752 + }, + { + "epoch": 2.26, + "learning_rate": 4.256430368509545e-05, + "loss": 1.4487, + "step": 28753 + }, + { + "epoch": 2.26, + "learning_rate": 4.255567874627076e-05, + "loss": 1.4851, + "step": 28754 + }, + { + "epoch": 2.26, + "learning_rate": 4.25470545369337e-05, + "loss": 1.4593, + "step": 28755 + }, + { + "epoch": 2.26, + "learning_rate": 4.2538431057142825e-05, + "loss": 1.4231, + "step": 28756 + }, + { + "epoch": 2.26, + "learning_rate": 4.252980830695673e-05, + "loss": 1.4851, + "step": 28757 + }, + { + "epoch": 2.26, + "learning_rate": 4.2521186286433946e-05, + "loss": 1.431, + "step": 28758 + }, + { + "epoch": 2.26, + "learning_rate": 4.2512564995632936e-05, + "loss": 1.4669, + "step": 28759 + }, + { + "epoch": 2.26, + "learning_rate": 4.2503944434612346e-05, + "loss": 1.4163, + "step": 28760 + }, + { + "epoch": 2.26, + "learning_rate": 4.249532460343065e-05, + "loss": 1.4253, + "step": 28761 + }, + { + "epoch": 2.26, + "learning_rate": 4.248670550214632e-05, + "loss": 1.4721, + "step": 28762 + }, + { + "epoch": 2.26, + "learning_rate": 4.247808713081798e-05, + "loss": 1.4173, + "step": 28763 + }, + { + "epoch": 2.26, + "learning_rate": 4.24694694895041e-05, + "loss": 1.4506, + "step": 28764 + }, + { + "epoch": 2.26, + "learning_rate": 4.246085257826312e-05, + "loss": 1.4902, + "step": 28765 + }, + { + "epoch": 2.26, + "learning_rate": 4.245223639715367e-05, + "loss": 1.4327, + "step": 28766 + }, + { + "epoch": 2.26, + "learning_rate": 4.244362094623417e-05, + "loss": 1.4241, + "step": 28767 + }, + { + "epoch": 2.26, + "learning_rate": 4.243500622556313e-05, + "loss": 1.4711, + "step": 28768 + }, + { + "epoch": 2.26, + "learning_rate": 4.242639223519896e-05, + "loss": 1.4535, + "step": 28769 + }, + { + "epoch": 2.26, + "learning_rate": 4.2417778975200313e-05, + "loss": 1.4861, + "step": 28770 + }, + { + "epoch": 2.26, + "learning_rate": 4.2409166445625566e-05, + "loss": 1.4491, + "step": 28771 + }, + { + "epoch": 2.26, + "learning_rate": 4.240055464653321e-05, + "loss": 1.4707, + "step": 28772 + }, + { + "epoch": 2.26, + "learning_rate": 4.239194357798166e-05, + "loss": 1.5211, + "step": 28773 + }, + { + "epoch": 2.26, + "learning_rate": 4.238333324002948e-05, + "loss": 1.4257, + "step": 28774 + }, + { + "epoch": 2.26, + "learning_rate": 4.2374723632735084e-05, + "loss": 1.3984, + "step": 28775 + }, + { + "epoch": 2.26, + "learning_rate": 4.2366114756156875e-05, + "loss": 1.4554, + "step": 28776 + }, + { + "epoch": 2.26, + "learning_rate": 4.2357506610353394e-05, + "loss": 1.4237, + "step": 28777 + }, + { + "epoch": 2.26, + "learning_rate": 4.234889919538304e-05, + "loss": 1.4474, + "step": 28778 + }, + { + "epoch": 2.26, + "learning_rate": 4.2340292511304205e-05, + "loss": 1.4363, + "step": 28779 + }, + { + "epoch": 2.26, + "learning_rate": 4.233168655817543e-05, + "loss": 1.4228, + "step": 28780 + }, + { + "epoch": 2.26, + "learning_rate": 4.232308133605507e-05, + "loss": 1.4685, + "step": 28781 + }, + { + "epoch": 2.26, + "learning_rate": 4.231447684500153e-05, + "loss": 1.4523, + "step": 28782 + }, + { + "epoch": 2.26, + "learning_rate": 4.230587308507332e-05, + "loss": 1.4896, + "step": 28783 + }, + { + "epoch": 2.26, + "learning_rate": 4.2297270056328745e-05, + "loss": 1.4696, + "step": 28784 + }, + { + "epoch": 2.26, + "learning_rate": 4.228866775882632e-05, + "loss": 1.4638, + "step": 28785 + }, + { + "epoch": 2.26, + "learning_rate": 4.2280066192624354e-05, + "loss": 1.4592, + "step": 28786 + }, + { + "epoch": 2.26, + "learning_rate": 4.227146535778134e-05, + "loss": 1.4684, + "step": 28787 + }, + { + "epoch": 2.27, + "learning_rate": 4.2262865254355614e-05, + "loss": 1.4483, + "step": 28788 + }, + { + "epoch": 2.27, + "learning_rate": 4.2254265882405555e-05, + "loss": 1.3859, + "step": 28789 + }, + { + "epoch": 2.27, + "learning_rate": 4.22456672419896e-05, + "loss": 1.4704, + "step": 28790 + }, + { + "epoch": 2.27, + "learning_rate": 4.223706933316611e-05, + "loss": 1.4611, + "step": 28791 + }, + { + "epoch": 2.27, + "learning_rate": 4.222847215599345e-05, + "loss": 1.4627, + "step": 28792 + }, + { + "epoch": 2.27, + "learning_rate": 4.2219875710529946e-05, + "loss": 1.5062, + "step": 28793 + }, + { + "epoch": 2.27, + "learning_rate": 4.2211279996834054e-05, + "loss": 1.4355, + "step": 28794 + }, + { + "epoch": 2.27, + "learning_rate": 4.220268501496408e-05, + "loss": 1.4735, + "step": 28795 + }, + { + "epoch": 2.27, + "learning_rate": 4.219409076497834e-05, + "loss": 1.409, + "step": 28796 + }, + { + "epoch": 2.27, + "learning_rate": 4.218549724693529e-05, + "loss": 1.4447, + "step": 28797 + }, + { + "epoch": 2.27, + "learning_rate": 4.2176904460893216e-05, + "loss": 1.4423, + "step": 28798 + }, + { + "epoch": 2.27, + "learning_rate": 4.2168312406910407e-05, + "loss": 1.4431, + "step": 28799 + }, + { + "epoch": 2.27, + "learning_rate": 4.215972108504525e-05, + "loss": 1.4445, + "step": 28800 + }, + { + "epoch": 2.27, + "learning_rate": 4.215113049535613e-05, + "loss": 1.4831, + "step": 28801 + }, + { + "epoch": 2.27, + "learning_rate": 4.214254063790129e-05, + "loss": 1.429, + "step": 28802 + }, + { + "epoch": 2.27, + "learning_rate": 4.2133951512739075e-05, + "loss": 1.4776, + "step": 28803 + }, + { + "epoch": 2.27, + "learning_rate": 4.212536311992781e-05, + "loss": 1.4705, + "step": 28804 + }, + { + "epoch": 2.27, + "learning_rate": 4.211677545952582e-05, + "loss": 1.4795, + "step": 28805 + }, + { + "epoch": 2.27, + "learning_rate": 4.2108188531591344e-05, + "loss": 1.4544, + "step": 28806 + }, + { + "epoch": 2.27, + "learning_rate": 4.209960233618278e-05, + "loss": 1.5021, + "step": 28807 + }, + { + "epoch": 2.27, + "learning_rate": 4.2091016873358356e-05, + "loss": 1.4879, + "step": 28808 + }, + { + "epoch": 2.27, + "learning_rate": 4.208243214317638e-05, + "loss": 1.4596, + "step": 28809 + }, + { + "epoch": 2.27, + "learning_rate": 4.20738481456951e-05, + "loss": 1.4542, + "step": 28810 + }, + { + "epoch": 2.27, + "learning_rate": 4.206526488097288e-05, + "loss": 1.4741, + "step": 28811 + }, + { + "epoch": 2.27, + "learning_rate": 4.205668234906793e-05, + "loss": 1.4833, + "step": 28812 + }, + { + "epoch": 2.27, + "learning_rate": 4.204810055003851e-05, + "loss": 1.4434, + "step": 28813 + }, + { + "epoch": 2.27, + "learning_rate": 4.203951948394295e-05, + "loss": 1.4628, + "step": 28814 + }, + { + "epoch": 2.27, + "learning_rate": 4.2030939150839496e-05, + "loss": 1.4633, + "step": 28815 + }, + { + "epoch": 2.27, + "learning_rate": 4.202235955078632e-05, + "loss": 1.4395, + "step": 28816 + }, + { + "epoch": 2.27, + "learning_rate": 4.201378068384172e-05, + "loss": 1.4292, + "step": 28817 + }, + { + "epoch": 2.27, + "learning_rate": 4.200520255006404e-05, + "loss": 1.4307, + "step": 28818 + }, + { + "epoch": 2.27, + "learning_rate": 4.199662514951142e-05, + "loss": 1.4151, + "step": 28819 + }, + { + "epoch": 2.27, + "learning_rate": 4.198804848224206e-05, + "loss": 1.4563, + "step": 28820 + }, + { + "epoch": 2.27, + "learning_rate": 4.197947254831429e-05, + "loss": 1.411, + "step": 28821 + }, + { + "epoch": 2.27, + "learning_rate": 4.19708973477863e-05, + "loss": 1.4872, + "step": 28822 + }, + { + "epoch": 2.27, + "learning_rate": 4.1962322880716266e-05, + "loss": 1.4564, + "step": 28823 + }, + { + "epoch": 2.27, + "learning_rate": 4.1953749147162466e-05, + "loss": 1.467, + "step": 28824 + }, + { + "epoch": 2.27, + "learning_rate": 4.1945176147183095e-05, + "loss": 1.4616, + "step": 28825 + }, + { + "epoch": 2.27, + "learning_rate": 4.193660388083635e-05, + "loss": 1.3998, + "step": 28826 + }, + { + "epoch": 2.27, + "learning_rate": 4.192803234818038e-05, + "loss": 1.4157, + "step": 28827 + }, + { + "epoch": 2.27, + "learning_rate": 4.191946154927347e-05, + "loss": 1.4284, + "step": 28828 + }, + { + "epoch": 2.27, + "learning_rate": 4.191089148417378e-05, + "loss": 1.4168, + "step": 28829 + }, + { + "epoch": 2.27, + "learning_rate": 4.1902322152939436e-05, + "loss": 1.4693, + "step": 28830 + }, + { + "epoch": 2.27, + "learning_rate": 4.189375355562868e-05, + "loss": 1.4954, + "step": 28831 + }, + { + "epoch": 2.27, + "learning_rate": 4.1885185692299715e-05, + "loss": 1.4314, + "step": 28832 + }, + { + "epoch": 2.27, + "learning_rate": 4.18766185630107e-05, + "loss": 1.5111, + "step": 28833 + }, + { + "epoch": 2.27, + "learning_rate": 4.186805216781971e-05, + "loss": 1.4134, + "step": 28834 + }, + { + "epoch": 2.27, + "learning_rate": 4.185948650678502e-05, + "loss": 1.4335, + "step": 28835 + }, + { + "epoch": 2.27, + "learning_rate": 4.185092157996474e-05, + "loss": 1.422, + "step": 28836 + }, + { + "epoch": 2.27, + "learning_rate": 4.1842357387416993e-05, + "loss": 1.4467, + "step": 28837 + }, + { + "epoch": 2.27, + "learning_rate": 4.183379392919999e-05, + "loss": 1.4391, + "step": 28838 + }, + { + "epoch": 2.27, + "learning_rate": 4.182523120537182e-05, + "loss": 1.4627, + "step": 28839 + }, + { + "epoch": 2.27, + "learning_rate": 4.18166692159906e-05, + "loss": 1.4923, + "step": 28840 + }, + { + "epoch": 2.27, + "learning_rate": 4.180810796111454e-05, + "loss": 1.4632, + "step": 28841 + }, + { + "epoch": 2.27, + "learning_rate": 4.179954744080172e-05, + "loss": 1.4403, + "step": 28842 + }, + { + "epoch": 2.27, + "learning_rate": 4.179098765511022e-05, + "loss": 1.4178, + "step": 28843 + }, + { + "epoch": 2.27, + "learning_rate": 4.178242860409825e-05, + "loss": 1.4494, + "step": 28844 + }, + { + "epoch": 2.27, + "learning_rate": 4.177387028782387e-05, + "loss": 1.4916, + "step": 28845 + }, + { + "epoch": 2.27, + "learning_rate": 4.176531270634518e-05, + "loss": 1.435, + "step": 28846 + }, + { + "epoch": 2.27, + "learning_rate": 4.1756755859720196e-05, + "loss": 1.5, + "step": 28847 + }, + { + "epoch": 2.27, + "learning_rate": 4.17481997480072e-05, + "loss": 1.3983, + "step": 28848 + }, + { + "epoch": 2.27, + "learning_rate": 4.1739644371264186e-05, + "loss": 1.4458, + "step": 28849 + }, + { + "epoch": 2.27, + "learning_rate": 4.173108972954924e-05, + "loss": 1.4152, + "step": 28850 + }, + { + "epoch": 2.27, + "learning_rate": 4.172253582292041e-05, + "loss": 1.4418, + "step": 28851 + }, + { + "epoch": 2.27, + "learning_rate": 4.171398265143585e-05, + "loss": 1.5067, + "step": 28852 + }, + { + "epoch": 2.27, + "learning_rate": 4.17054302151536e-05, + "loss": 1.4252, + "step": 28853 + }, + { + "epoch": 2.27, + "learning_rate": 4.169687851413166e-05, + "loss": 1.4671, + "step": 28854 + }, + { + "epoch": 2.27, + "learning_rate": 4.1688327548428205e-05, + "loss": 1.4622, + "step": 28855 + }, + { + "epoch": 2.27, + "learning_rate": 4.167977731810123e-05, + "loss": 1.4368, + "step": 28856 + }, + { + "epoch": 2.27, + "learning_rate": 4.167122782320874e-05, + "loss": 1.4291, + "step": 28857 + }, + { + "epoch": 2.27, + "learning_rate": 4.166267906380888e-05, + "loss": 1.4942, + "step": 28858 + }, + { + "epoch": 2.27, + "learning_rate": 4.165413103995965e-05, + "loss": 1.4353, + "step": 28859 + }, + { + "epoch": 2.27, + "learning_rate": 4.1645583751719033e-05, + "loss": 1.4161, + "step": 28860 + }, + { + "epoch": 2.27, + "learning_rate": 4.163703719914515e-05, + "loss": 1.4748, + "step": 28861 + }, + { + "epoch": 2.27, + "learning_rate": 4.162849138229598e-05, + "loss": 1.4196, + "step": 28862 + }, + { + "epoch": 2.27, + "learning_rate": 4.161994630122951e-05, + "loss": 1.4834, + "step": 28863 + }, + { + "epoch": 2.27, + "learning_rate": 4.16114019560038e-05, + "loss": 1.4187, + "step": 28864 + }, + { + "epoch": 2.27, + "learning_rate": 4.160285834667689e-05, + "loss": 1.464, + "step": 28865 + }, + { + "epoch": 2.27, + "learning_rate": 4.159431547330677e-05, + "loss": 1.4562, + "step": 28866 + }, + { + "epoch": 2.27, + "learning_rate": 4.1585773335951404e-05, + "loss": 1.4431, + "step": 28867 + }, + { + "epoch": 2.27, + "learning_rate": 4.157723193466876e-05, + "loss": 1.4857, + "step": 28868 + }, + { + "epoch": 2.27, + "learning_rate": 4.156869126951695e-05, + "loss": 1.4712, + "step": 28869 + }, + { + "epoch": 2.27, + "learning_rate": 4.1560151340553874e-05, + "loss": 1.4514, + "step": 28870 + }, + { + "epoch": 2.27, + "learning_rate": 4.1551612147837495e-05, + "loss": 1.4353, + "step": 28871 + }, + { + "epoch": 2.27, + "learning_rate": 4.154307369142585e-05, + "loss": 1.45, + "step": 28872 + }, + { + "epoch": 2.27, + "learning_rate": 4.153453597137689e-05, + "loss": 1.5114, + "step": 28873 + }, + { + "epoch": 2.27, + "learning_rate": 4.152599898774854e-05, + "loss": 1.4672, + "step": 28874 + }, + { + "epoch": 2.27, + "learning_rate": 4.1517462740598825e-05, + "loss": 1.4686, + "step": 28875 + }, + { + "epoch": 2.27, + "learning_rate": 4.150892722998569e-05, + "loss": 1.488, + "step": 28876 + }, + { + "epoch": 2.27, + "learning_rate": 4.1500392455967015e-05, + "loss": 1.4678, + "step": 28877 + }, + { + "epoch": 2.27, + "learning_rate": 4.149185841860083e-05, + "loss": 1.4681, + "step": 28878 + }, + { + "epoch": 2.27, + "learning_rate": 4.1483325117945026e-05, + "loss": 1.4466, + "step": 28879 + }, + { + "epoch": 2.27, + "learning_rate": 4.147479255405758e-05, + "loss": 1.4344, + "step": 28880 + }, + { + "epoch": 2.27, + "learning_rate": 4.1466260726996395e-05, + "loss": 1.4241, + "step": 28881 + }, + { + "epoch": 2.27, + "learning_rate": 4.145772963681942e-05, + "loss": 1.4823, + "step": 28882 + }, + { + "epoch": 2.27, + "learning_rate": 4.144919928358457e-05, + "loss": 1.4372, + "step": 28883 + }, + { + "epoch": 2.27, + "learning_rate": 4.1440669667349754e-05, + "loss": 1.451, + "step": 28884 + }, + { + "epoch": 2.27, + "learning_rate": 4.1432140788172826e-05, + "loss": 1.4778, + "step": 28885 + }, + { + "epoch": 2.27, + "learning_rate": 4.1423612646111827e-05, + "loss": 1.4374, + "step": 28886 + }, + { + "epoch": 2.27, + "learning_rate": 4.141508524122456e-05, + "loss": 1.4728, + "step": 28887 + }, + { + "epoch": 2.27, + "learning_rate": 4.1406558573568885e-05, + "loss": 1.4427, + "step": 28888 + }, + { + "epoch": 2.27, + "learning_rate": 4.139803264320281e-05, + "loss": 1.5097, + "step": 28889 + }, + { + "epoch": 2.27, + "learning_rate": 4.138950745018417e-05, + "loss": 1.4653, + "step": 28890 + }, + { + "epoch": 2.27, + "learning_rate": 4.138098299457078e-05, + "loss": 1.4761, + "step": 28891 + }, + { + "epoch": 2.27, + "learning_rate": 4.137245927642061e-05, + "loss": 1.4791, + "step": 28892 + }, + { + "epoch": 2.27, + "learning_rate": 4.136393629579152e-05, + "loss": 1.4454, + "step": 28893 + }, + { + "epoch": 2.27, + "learning_rate": 4.13554140527413e-05, + "loss": 1.4768, + "step": 28894 + }, + { + "epoch": 2.27, + "learning_rate": 4.1346892547327856e-05, + "loss": 1.466, + "step": 28895 + }, + { + "epoch": 2.27, + "learning_rate": 4.133837177960909e-05, + "loss": 1.4356, + "step": 28896 + }, + { + "epoch": 2.27, + "learning_rate": 4.132985174964283e-05, + "loss": 1.4412, + "step": 28897 + }, + { + "epoch": 2.27, + "learning_rate": 4.132133245748685e-05, + "loss": 1.437, + "step": 28898 + }, + { + "epoch": 2.27, + "learning_rate": 4.131281390319911e-05, + "loss": 1.4627, + "step": 28899 + }, + { + "epoch": 2.27, + "learning_rate": 4.130429608683738e-05, + "loss": 1.3812, + "step": 28900 + }, + { + "epoch": 2.27, + "learning_rate": 4.129577900845945e-05, + "loss": 1.4578, + "step": 28901 + }, + { + "epoch": 2.27, + "learning_rate": 4.128726266812323e-05, + "loss": 1.4562, + "step": 28902 + }, + { + "epoch": 2.27, + "learning_rate": 4.12787470658865e-05, + "loss": 1.4698, + "step": 28903 + }, + { + "epoch": 2.27, + "learning_rate": 4.1270232201807095e-05, + "loss": 1.5205, + "step": 28904 + }, + { + "epoch": 2.27, + "learning_rate": 4.126171807594276e-05, + "loss": 1.4346, + "step": 28905 + }, + { + "epoch": 2.27, + "learning_rate": 4.1253204688351405e-05, + "loss": 1.4203, + "step": 28906 + }, + { + "epoch": 2.27, + "learning_rate": 4.1244692039090774e-05, + "loss": 1.3855, + "step": 28907 + }, + { + "epoch": 2.27, + "learning_rate": 4.123618012821862e-05, + "loss": 1.4248, + "step": 28908 + }, + { + "epoch": 2.27, + "learning_rate": 4.122766895579282e-05, + "loss": 1.4602, + "step": 28909 + }, + { + "epoch": 2.27, + "learning_rate": 4.121915852187109e-05, + "loss": 1.428, + "step": 28910 + }, + { + "epoch": 2.27, + "learning_rate": 4.121064882651129e-05, + "loss": 1.4371, + "step": 28911 + }, + { + "epoch": 2.27, + "learning_rate": 4.12021398697711e-05, + "loss": 1.4662, + "step": 28912 + }, + { + "epoch": 2.27, + "learning_rate": 4.119363165170838e-05, + "loss": 1.4317, + "step": 28913 + }, + { + "epoch": 2.27, + "learning_rate": 4.118512417238085e-05, + "loss": 1.4676, + "step": 28914 + }, + { + "epoch": 2.28, + "learning_rate": 4.117661743184625e-05, + "loss": 1.4197, + "step": 28915 + }, + { + "epoch": 2.28, + "learning_rate": 4.116811143016241e-05, + "loss": 1.4743, + "step": 28916 + }, + { + "epoch": 2.28, + "learning_rate": 4.115960616738702e-05, + "loss": 1.4927, + "step": 28917 + }, + { + "epoch": 2.28, + "learning_rate": 4.1151101643577804e-05, + "loss": 1.4674, + "step": 28918 + }, + { + "epoch": 2.28, + "learning_rate": 4.114259785879258e-05, + "loss": 1.5218, + "step": 28919 + }, + { + "epoch": 2.28, + "learning_rate": 4.113409481308905e-05, + "loss": 1.4769, + "step": 28920 + }, + { + "epoch": 2.28, + "learning_rate": 4.112559250652494e-05, + "loss": 1.4963, + "step": 28921 + }, + { + "epoch": 2.28, + "learning_rate": 4.111709093915793e-05, + "loss": 1.4383, + "step": 28922 + }, + { + "epoch": 2.28, + "learning_rate": 4.110859011104583e-05, + "loss": 1.4513, + "step": 28923 + }, + { + "epoch": 2.28, + "learning_rate": 4.1100090022246306e-05, + "loss": 1.4835, + "step": 28924 + }, + { + "epoch": 2.28, + "learning_rate": 4.109159067281703e-05, + "loss": 1.4519, + "step": 28925 + }, + { + "epoch": 2.28, + "learning_rate": 4.108309206281576e-05, + "loss": 1.444, + "step": 28926 + }, + { + "epoch": 2.28, + "learning_rate": 4.107459419230023e-05, + "loss": 1.4399, + "step": 28927 + }, + { + "epoch": 2.28, + "learning_rate": 4.10660970613281e-05, + "loss": 1.465, + "step": 28928 + }, + { + "epoch": 2.28, + "learning_rate": 4.105760066995701e-05, + "loss": 1.4425, + "step": 28929 + }, + { + "epoch": 2.28, + "learning_rate": 4.104910501824473e-05, + "loss": 1.4544, + "step": 28930 + }, + { + "epoch": 2.28, + "learning_rate": 4.104061010624891e-05, + "loss": 1.4256, + "step": 28931 + }, + { + "epoch": 2.28, + "learning_rate": 4.1032115934027165e-05, + "loss": 1.4036, + "step": 28932 + }, + { + "epoch": 2.28, + "learning_rate": 4.1023622501637284e-05, + "loss": 1.4065, + "step": 28933 + }, + { + "epoch": 2.28, + "learning_rate": 4.101512980913685e-05, + "loss": 1.4456, + "step": 28934 + }, + { + "epoch": 2.28, + "learning_rate": 4.1006637856583504e-05, + "loss": 1.4669, + "step": 28935 + }, + { + "epoch": 2.28, + "learning_rate": 4.099814664403498e-05, + "loss": 1.4665, + "step": 28936 + }, + { + "epoch": 2.28, + "learning_rate": 4.098965617154888e-05, + "loss": 1.4174, + "step": 28937 + }, + { + "epoch": 2.28, + "learning_rate": 4.098116643918287e-05, + "loss": 1.4664, + "step": 28938 + }, + { + "epoch": 2.28, + "learning_rate": 4.0972677446994545e-05, + "loss": 1.4523, + "step": 28939 + }, + { + "epoch": 2.28, + "learning_rate": 4.096418919504161e-05, + "loss": 1.4606, + "step": 28940 + }, + { + "epoch": 2.28, + "learning_rate": 4.095570168338165e-05, + "loss": 1.4181, + "step": 28941 + }, + { + "epoch": 2.28, + "learning_rate": 4.094721491207222e-05, + "loss": 1.4235, + "step": 28942 + }, + { + "epoch": 2.28, + "learning_rate": 4.093872888117109e-05, + "loss": 1.4926, + "step": 28943 + }, + { + "epoch": 2.28, + "learning_rate": 4.0930243590735835e-05, + "loss": 1.4039, + "step": 28944 + }, + { + "epoch": 2.28, + "learning_rate": 4.092175904082402e-05, + "loss": 1.4511, + "step": 28945 + }, + { + "epoch": 2.28, + "learning_rate": 4.091327523149322e-05, + "loss": 1.4585, + "step": 28946 + }, + { + "epoch": 2.28, + "learning_rate": 4.0904792162801135e-05, + "loss": 1.4277, + "step": 28947 + }, + { + "epoch": 2.28, + "learning_rate": 4.089630983480531e-05, + "loss": 1.4739, + "step": 28948 + }, + { + "epoch": 2.28, + "learning_rate": 4.088782824756327e-05, + "loss": 1.4348, + "step": 28949 + }, + { + "epoch": 2.28, + "learning_rate": 4.087934740113273e-05, + "loss": 1.4863, + "step": 28950 + }, + { + "epoch": 2.28, + "learning_rate": 4.087086729557118e-05, + "loss": 1.4488, + "step": 28951 + }, + { + "epoch": 2.28, + "learning_rate": 4.08623879309362e-05, + "loss": 1.4321, + "step": 28952 + }, + { + "epoch": 2.28, + "learning_rate": 4.0853909307285396e-05, + "loss": 1.4278, + "step": 28953 + }, + { + "epoch": 2.28, + "learning_rate": 4.0845431424676345e-05, + "loss": 1.4783, + "step": 28954 + }, + { + "epoch": 2.28, + "learning_rate": 4.0836954283166505e-05, + "loss": 1.4423, + "step": 28955 + }, + { + "epoch": 2.28, + "learning_rate": 4.082847788281357e-05, + "loss": 1.4938, + "step": 28956 + }, + { + "epoch": 2.28, + "learning_rate": 4.082000222367497e-05, + "loss": 1.3963, + "step": 28957 + }, + { + "epoch": 2.28, + "learning_rate": 4.081152730580836e-05, + "loss": 1.441, + "step": 28958 + }, + { + "epoch": 2.28, + "learning_rate": 4.080305312927117e-05, + "loss": 1.4678, + "step": 28959 + }, + { + "epoch": 2.28, + "learning_rate": 4.079457969412103e-05, + "loss": 1.5053, + "step": 28960 + }, + { + "epoch": 2.28, + "learning_rate": 4.078610700041544e-05, + "loss": 1.4779, + "step": 28961 + }, + { + "epoch": 2.28, + "learning_rate": 4.07776350482119e-05, + "loss": 1.4644, + "step": 28962 + }, + { + "epoch": 2.28, + "learning_rate": 4.076916383756791e-05, + "loss": 1.4509, + "step": 28963 + }, + { + "epoch": 2.28, + "learning_rate": 4.076069336854107e-05, + "loss": 1.4447, + "step": 28964 + }, + { + "epoch": 2.28, + "learning_rate": 4.075222364118882e-05, + "loss": 1.4552, + "step": 28965 + }, + { + "epoch": 2.28, + "learning_rate": 4.074375465556866e-05, + "loss": 1.435, + "step": 28966 + }, + { + "epoch": 2.28, + "learning_rate": 4.0735286411738146e-05, + "loss": 1.4386, + "step": 28967 + }, + { + "epoch": 2.28, + "learning_rate": 4.072681890975474e-05, + "loss": 1.3981, + "step": 28968 + }, + { + "epoch": 2.28, + "learning_rate": 4.071835214967588e-05, + "loss": 1.4185, + "step": 28969 + }, + { + "epoch": 2.28, + "learning_rate": 4.070988613155917e-05, + "loss": 1.5176, + "step": 28970 + }, + { + "epoch": 2.28, + "learning_rate": 4.0701420855462e-05, + "loss": 1.4417, + "step": 28971 + }, + { + "epoch": 2.28, + "learning_rate": 4.0692956321441825e-05, + "loss": 1.4476, + "step": 28972 + }, + { + "epoch": 2.28, + "learning_rate": 4.068449252955616e-05, + "loss": 1.4482, + "step": 28973 + }, + { + "epoch": 2.28, + "learning_rate": 4.067602947986252e-05, + "loss": 1.4565, + "step": 28974 + }, + { + "epoch": 2.28, + "learning_rate": 4.066756717241829e-05, + "loss": 1.479, + "step": 28975 + }, + { + "epoch": 2.28, + "learning_rate": 4.0659105607280914e-05, + "loss": 1.4453, + "step": 28976 + }, + { + "epoch": 2.28, + "learning_rate": 4.0650644784507916e-05, + "loss": 1.4607, + "step": 28977 + }, + { + "epoch": 2.28, + "learning_rate": 4.06421847041567e-05, + "loss": 1.4623, + "step": 28978 + }, + { + "epoch": 2.28, + "learning_rate": 4.063372536628469e-05, + "loss": 1.432, + "step": 28979 + }, + { + "epoch": 2.28, + "learning_rate": 4.062526677094928e-05, + "loss": 1.4726, + "step": 28980 + }, + { + "epoch": 2.28, + "learning_rate": 4.061680891820801e-05, + "loss": 1.4621, + "step": 28981 + }, + { + "epoch": 2.28, + "learning_rate": 4.060835180811824e-05, + "loss": 1.4398, + "step": 28982 + }, + { + "epoch": 2.28, + "learning_rate": 4.0599895440737355e-05, + "loss": 1.4473, + "step": 28983 + }, + { + "epoch": 2.28, + "learning_rate": 4.059143981612285e-05, + "loss": 1.4747, + "step": 28984 + }, + { + "epoch": 2.28, + "learning_rate": 4.058298493433208e-05, + "loss": 1.4714, + "step": 28985 + }, + { + "epoch": 2.28, + "learning_rate": 4.0574530795422435e-05, + "loss": 1.4629, + "step": 28986 + }, + { + "epoch": 2.28, + "learning_rate": 4.056607739945136e-05, + "loss": 1.4503, + "step": 28987 + }, + { + "epoch": 2.28, + "learning_rate": 4.055762474647626e-05, + "loss": 1.4475, + "step": 28988 + }, + { + "epoch": 2.28, + "learning_rate": 4.054917283655442e-05, + "loss": 1.4833, + "step": 28989 + }, + { + "epoch": 2.28, + "learning_rate": 4.054072166974331e-05, + "loss": 1.4833, + "step": 28990 + }, + { + "epoch": 2.28, + "learning_rate": 4.053227124610034e-05, + "loss": 1.4577, + "step": 28991 + }, + { + "epoch": 2.28, + "learning_rate": 4.052382156568283e-05, + "loss": 1.4481, + "step": 28992 + }, + { + "epoch": 2.28, + "learning_rate": 4.051537262854813e-05, + "loss": 1.4392, + "step": 28993 + }, + { + "epoch": 2.28, + "learning_rate": 4.050692443475367e-05, + "loss": 1.4589, + "step": 28994 + }, + { + "epoch": 2.28, + "learning_rate": 4.049847698435677e-05, + "loss": 1.4398, + "step": 28995 + }, + { + "epoch": 2.28, + "learning_rate": 4.049003027741478e-05, + "loss": 1.486, + "step": 28996 + }, + { + "epoch": 2.28, + "learning_rate": 4.0481584313985e-05, + "loss": 1.4609, + "step": 28997 + }, + { + "epoch": 2.28, + "learning_rate": 4.047313909412487e-05, + "loss": 1.4078, + "step": 28998 + }, + { + "epoch": 2.28, + "learning_rate": 4.04646946178917e-05, + "loss": 1.4385, + "step": 28999 + }, + { + "epoch": 2.28, + "learning_rate": 4.045625088534275e-05, + "loss": 1.4178, + "step": 29000 + }, + { + "epoch": 2.28, + "learning_rate": 4.044780789653546e-05, + "loss": 1.508, + "step": 29001 + }, + { + "epoch": 2.28, + "learning_rate": 4.0439365651527086e-05, + "loss": 1.4269, + "step": 29002 + }, + { + "epoch": 2.28, + "learning_rate": 4.0430924150374916e-05, + "loss": 1.4442, + "step": 29003 + }, + { + "epoch": 2.28, + "learning_rate": 4.0422483393136304e-05, + "loss": 1.4924, + "step": 29004 + }, + { + "epoch": 2.28, + "learning_rate": 4.0414043379868616e-05, + "loss": 1.3891, + "step": 29005 + }, + { + "epoch": 2.28, + "learning_rate": 4.04056041106291e-05, + "loss": 1.4711, + "step": 29006 + }, + { + "epoch": 2.28, + "learning_rate": 4.039716558547499e-05, + "loss": 1.4707, + "step": 29007 + }, + { + "epoch": 2.28, + "learning_rate": 4.0388727804463696e-05, + "loss": 1.4461, + "step": 29008 + }, + { + "epoch": 2.28, + "learning_rate": 4.038029076765245e-05, + "loss": 1.4378, + "step": 29009 + }, + { + "epoch": 2.28, + "learning_rate": 4.0371854475098496e-05, + "loss": 1.4682, + "step": 29010 + }, + { + "epoch": 2.28, + "learning_rate": 4.0363418926859206e-05, + "loss": 1.4411, + "step": 29011 + }, + { + "epoch": 2.28, + "learning_rate": 4.035498412299179e-05, + "loss": 1.4896, + "step": 29012 + }, + { + "epoch": 2.28, + "learning_rate": 4.034655006355348e-05, + "loss": 1.4715, + "step": 29013 + }, + { + "epoch": 2.28, + "learning_rate": 4.033811674860162e-05, + "loss": 1.4392, + "step": 29014 + }, + { + "epoch": 2.28, + "learning_rate": 4.032968417819343e-05, + "loss": 1.4255, + "step": 29015 + }, + { + "epoch": 2.28, + "learning_rate": 4.032125235238618e-05, + "loss": 1.4839, + "step": 29016 + }, + { + "epoch": 2.28, + "learning_rate": 4.031282127123705e-05, + "loss": 1.4482, + "step": 29017 + }, + { + "epoch": 2.28, + "learning_rate": 4.030439093480336e-05, + "loss": 1.3805, + "step": 29018 + }, + { + "epoch": 2.28, + "learning_rate": 4.0295961343142346e-05, + "loss": 1.4369, + "step": 29019 + }, + { + "epoch": 2.28, + "learning_rate": 4.028753249631115e-05, + "loss": 1.4072, + "step": 29020 + }, + { + "epoch": 2.28, + "learning_rate": 4.0279104394367085e-05, + "loss": 1.4168, + "step": 29021 + }, + { + "epoch": 2.28, + "learning_rate": 4.027067703736738e-05, + "loss": 1.4761, + "step": 29022 + }, + { + "epoch": 2.28, + "learning_rate": 4.026225042536923e-05, + "loss": 1.4057, + "step": 29023 + }, + { + "epoch": 2.28, + "learning_rate": 4.02538245584298e-05, + "loss": 1.4313, + "step": 29024 + }, + { + "epoch": 2.28, + "learning_rate": 4.024539943660637e-05, + "loss": 1.4718, + "step": 29025 + }, + { + "epoch": 2.28, + "learning_rate": 4.023697505995613e-05, + "loss": 1.4391, + "step": 29026 + }, + { + "epoch": 2.28, + "learning_rate": 4.0228551428536197e-05, + "loss": 1.4742, + "step": 29027 + }, + { + "epoch": 2.28, + "learning_rate": 4.0220128542403865e-05, + "loss": 1.3864, + "step": 29028 + }, + { + "epoch": 2.28, + "learning_rate": 4.021170640161629e-05, + "loss": 1.4949, + "step": 29029 + }, + { + "epoch": 2.28, + "learning_rate": 4.02032850062306e-05, + "loss": 1.3927, + "step": 29030 + }, + { + "epoch": 2.28, + "learning_rate": 4.019486435630404e-05, + "loss": 1.4784, + "step": 29031 + }, + { + "epoch": 2.28, + "learning_rate": 4.018644445189378e-05, + "loss": 1.4386, + "step": 29032 + }, + { + "epoch": 2.28, + "learning_rate": 4.0178025293056936e-05, + "loss": 1.3978, + "step": 29033 + }, + { + "epoch": 2.28, + "learning_rate": 4.016960687985067e-05, + "loss": 1.5011, + "step": 29034 + }, + { + "epoch": 2.28, + "learning_rate": 4.0161189212332214e-05, + "loss": 1.4901, + "step": 29035 + }, + { + "epoch": 2.28, + "learning_rate": 4.01527722905586e-05, + "loss": 1.4806, + "step": 29036 + }, + { + "epoch": 2.28, + "learning_rate": 4.01443561145871e-05, + "loss": 1.4299, + "step": 29037 + }, + { + "epoch": 2.28, + "learning_rate": 4.0135940684474754e-05, + "loss": 1.4225, + "step": 29038 + }, + { + "epoch": 2.28, + "learning_rate": 4.0127526000278805e-05, + "loss": 1.4552, + "step": 29039 + }, + { + "epoch": 2.28, + "learning_rate": 4.01191120620563e-05, + "loss": 1.4474, + "step": 29040 + }, + { + "epoch": 2.28, + "learning_rate": 4.011069886986434e-05, + "loss": 1.4984, + "step": 29041 + }, + { + "epoch": 2.29, + "learning_rate": 4.010228642376015e-05, + "loss": 1.4574, + "step": 29042 + }, + { + "epoch": 2.29, + "learning_rate": 4.009387472380079e-05, + "loss": 1.4475, + "step": 29043 + }, + { + "epoch": 2.29, + "learning_rate": 4.008546377004331e-05, + "loss": 1.4513, + "step": 29044 + }, + { + "epoch": 2.29, + "learning_rate": 4.007705356254494e-05, + "loss": 1.4653, + "step": 29045 + }, + { + "epoch": 2.29, + "learning_rate": 4.0068644101362696e-05, + "loss": 1.4137, + "step": 29046 + }, + { + "epoch": 2.29, + "learning_rate": 4.0060235386553666e-05, + "loss": 1.4425, + "step": 29047 + }, + { + "epoch": 2.29, + "learning_rate": 4.0051827418175e-05, + "loss": 1.4615, + "step": 29048 + }, + { + "epoch": 2.29, + "learning_rate": 4.0043420196283756e-05, + "loss": 1.3843, + "step": 29049 + }, + { + "epoch": 2.29, + "learning_rate": 4.0035013720937e-05, + "loss": 1.4487, + "step": 29050 + }, + { + "epoch": 2.29, + "learning_rate": 4.002660799219178e-05, + "loss": 1.4454, + "step": 29051 + }, + { + "epoch": 2.29, + "learning_rate": 4.0018203010105216e-05, + "loss": 1.4106, + "step": 29052 + }, + { + "epoch": 2.29, + "learning_rate": 4.000979877473439e-05, + "loss": 1.4369, + "step": 29053 + }, + { + "epoch": 2.29, + "learning_rate": 4.000139528613629e-05, + "loss": 1.3957, + "step": 29054 + }, + { + "epoch": 2.29, + "learning_rate": 3.9992992544368064e-05, + "loss": 1.4634, + "step": 29055 + }, + { + "epoch": 2.29, + "learning_rate": 3.998459054948671e-05, + "loss": 1.46, + "step": 29056 + }, + { + "epoch": 2.29, + "learning_rate": 3.997618930154927e-05, + "loss": 1.4536, + "step": 29057 + }, + { + "epoch": 2.29, + "learning_rate": 3.996778880061275e-05, + "loss": 1.4905, + "step": 29058 + }, + { + "epoch": 2.29, + "learning_rate": 3.995938904673426e-05, + "loss": 1.4339, + "step": 29059 + }, + { + "epoch": 2.29, + "learning_rate": 3.99509900399708e-05, + "loss": 1.4672, + "step": 29060 + }, + { + "epoch": 2.29, + "learning_rate": 3.994259178037934e-05, + "loss": 1.4671, + "step": 29061 + }, + { + "epoch": 2.29, + "learning_rate": 3.9934194268017e-05, + "loss": 1.5185, + "step": 29062 + }, + { + "epoch": 2.29, + "learning_rate": 3.992579750294073e-05, + "loss": 1.4867, + "step": 29063 + }, + { + "epoch": 2.29, + "learning_rate": 3.9917401485207504e-05, + "loss": 1.5055, + "step": 29064 + }, + { + "epoch": 2.29, + "learning_rate": 3.990900621487442e-05, + "loss": 1.4928, + "step": 29065 + }, + { + "epoch": 2.29, + "learning_rate": 3.990061169199843e-05, + "loss": 1.4286, + "step": 29066 + }, + { + "epoch": 2.29, + "learning_rate": 3.98922179166365e-05, + "loss": 1.4408, + "step": 29067 + }, + { + "epoch": 2.29, + "learning_rate": 3.9883824888845636e-05, + "loss": 1.4854, + "step": 29068 + }, + { + "epoch": 2.29, + "learning_rate": 3.987543260868288e-05, + "loss": 1.4638, + "step": 29069 + }, + { + "epoch": 2.29, + "learning_rate": 3.986704107620517e-05, + "loss": 1.4651, + "step": 29070 + }, + { + "epoch": 2.29, + "learning_rate": 3.985865029146941e-05, + "loss": 1.4701, + "step": 29071 + }, + { + "epoch": 2.29, + "learning_rate": 3.9850260254532693e-05, + "loss": 1.3882, + "step": 29072 + }, + { + "epoch": 2.29, + "learning_rate": 3.984187096545194e-05, + "loss": 1.4642, + "step": 29073 + }, + { + "epoch": 2.29, + "learning_rate": 3.983348242428406e-05, + "loss": 1.4734, + "step": 29074 + }, + { + "epoch": 2.29, + "learning_rate": 3.982509463108603e-05, + "loss": 1.469, + "step": 29075 + }, + { + "epoch": 2.29, + "learning_rate": 3.981670758591483e-05, + "loss": 1.4329, + "step": 29076 + }, + { + "epoch": 2.29, + "learning_rate": 3.980832128882737e-05, + "loss": 1.3651, + "step": 29077 + }, + { + "epoch": 2.29, + "learning_rate": 3.979993573988057e-05, + "loss": 1.4356, + "step": 29078 + }, + { + "epoch": 2.29, + "learning_rate": 3.979155093913143e-05, + "loss": 1.4469, + "step": 29079 + }, + { + "epoch": 2.29, + "learning_rate": 3.9783166886636856e-05, + "loss": 1.4742, + "step": 29080 + }, + { + "epoch": 2.29, + "learning_rate": 3.977478358245371e-05, + "loss": 1.4282, + "step": 29081 + }, + { + "epoch": 2.29, + "learning_rate": 3.9766401026638985e-05, + "loss": 1.3853, + "step": 29082 + }, + { + "epoch": 2.29, + "learning_rate": 3.9758019219249525e-05, + "loss": 1.4385, + "step": 29083 + }, + { + "epoch": 2.29, + "learning_rate": 3.974963816034233e-05, + "loss": 1.4735, + "step": 29084 + }, + { + "epoch": 2.29, + "learning_rate": 3.974125784997421e-05, + "loss": 1.4895, + "step": 29085 + }, + { + "epoch": 2.29, + "learning_rate": 3.973287828820215e-05, + "loss": 1.4661, + "step": 29086 + }, + { + "epoch": 2.29, + "learning_rate": 3.972449947508297e-05, + "loss": 1.4679, + "step": 29087 + }, + { + "epoch": 2.29, + "learning_rate": 3.971612141067356e-05, + "loss": 1.4238, + "step": 29088 + }, + { + "epoch": 2.29, + "learning_rate": 3.9707744095030876e-05, + "loss": 1.4437, + "step": 29089 + }, + { + "epoch": 2.29, + "learning_rate": 3.969936752821173e-05, + "loss": 1.4299, + "step": 29090 + }, + { + "epoch": 2.29, + "learning_rate": 3.9690991710273005e-05, + "loss": 1.448, + "step": 29091 + }, + { + "epoch": 2.29, + "learning_rate": 3.968261664127155e-05, + "loss": 1.4406, + "step": 29092 + }, + { + "epoch": 2.29, + "learning_rate": 3.967424232126429e-05, + "loss": 1.424, + "step": 29093 + }, + { + "epoch": 2.29, + "learning_rate": 3.9665868750308034e-05, + "loss": 1.4647, + "step": 29094 + }, + { + "epoch": 2.29, + "learning_rate": 3.965749592845959e-05, + "loss": 1.4468, + "step": 29095 + }, + { + "epoch": 2.29, + "learning_rate": 3.96491238557759e-05, + "loss": 1.4554, + "step": 29096 + }, + { + "epoch": 2.29, + "learning_rate": 3.964075253231377e-05, + "loss": 1.4582, + "step": 29097 + }, + { + "epoch": 2.29, + "learning_rate": 3.963238195813e-05, + "loss": 1.5159, + "step": 29098 + }, + { + "epoch": 2.29, + "learning_rate": 3.962401213328143e-05, + "loss": 1.5163, + "step": 29099 + }, + { + "epoch": 2.29, + "learning_rate": 3.961564305782497e-05, + "loss": 1.4885, + "step": 29100 + }, + { + "epoch": 2.29, + "learning_rate": 3.9607274731817356e-05, + "loss": 1.4777, + "step": 29101 + }, + { + "epoch": 2.29, + "learning_rate": 3.95989071553154e-05, + "loss": 1.4083, + "step": 29102 + }, + { + "epoch": 2.29, + "learning_rate": 3.9590540328375974e-05, + "loss": 1.4443, + "step": 29103 + }, + { + "epoch": 2.29, + "learning_rate": 3.958217425105585e-05, + "loss": 1.4138, + "step": 29104 + }, + { + "epoch": 2.29, + "learning_rate": 3.957380892341179e-05, + "loss": 1.4415, + "step": 29105 + }, + { + "epoch": 2.29, + "learning_rate": 3.956544434550068e-05, + "loss": 1.4658, + "step": 29106 + }, + { + "epoch": 2.29, + "learning_rate": 3.955708051737925e-05, + "loss": 1.4623, + "step": 29107 + }, + { + "epoch": 2.29, + "learning_rate": 3.95487174391043e-05, + "loss": 1.4244, + "step": 29108 + }, + { + "epoch": 2.29, + "learning_rate": 3.954035511073256e-05, + "loss": 1.507, + "step": 29109 + }, + { + "epoch": 2.29, + "learning_rate": 3.953199353232089e-05, + "loss": 1.4602, + "step": 29110 + }, + { + "epoch": 2.29, + "learning_rate": 3.952363270392603e-05, + "loss": 1.4832, + "step": 29111 + }, + { + "epoch": 2.29, + "learning_rate": 3.95152726256047e-05, + "loss": 1.4334, + "step": 29112 + }, + { + "epoch": 2.29, + "learning_rate": 3.950691329741373e-05, + "loss": 1.4376, + "step": 29113 + }, + { + "epoch": 2.29, + "learning_rate": 3.9498554719409804e-05, + "loss": 1.4725, + "step": 29114 + }, + { + "epoch": 2.29, + "learning_rate": 3.949019689164976e-05, + "loss": 1.4173, + "step": 29115 + }, + { + "epoch": 2.29, + "learning_rate": 3.948183981419024e-05, + "loss": 1.5424, + "step": 29116 + }, + { + "epoch": 2.29, + "learning_rate": 3.94734834870881e-05, + "loss": 1.4163, + "step": 29117 + }, + { + "epoch": 2.29, + "learning_rate": 3.94651279104e-05, + "loss": 1.4488, + "step": 29118 + }, + { + "epoch": 2.29, + "learning_rate": 3.945677308418264e-05, + "loss": 1.4704, + "step": 29119 + }, + { + "epoch": 2.29, + "learning_rate": 3.944841900849284e-05, + "loss": 1.3841, + "step": 29120 + }, + { + "epoch": 2.29, + "learning_rate": 3.944006568338726e-05, + "loss": 1.3952, + "step": 29121 + }, + { + "epoch": 2.29, + "learning_rate": 3.943171310892259e-05, + "loss": 1.4607, + "step": 29122 + }, + { + "epoch": 2.29, + "learning_rate": 3.94233612851556e-05, + "loss": 1.4157, + "step": 29123 + }, + { + "epoch": 2.29, + "learning_rate": 3.941501021214297e-05, + "loss": 1.467, + "step": 29124 + }, + { + "epoch": 2.29, + "learning_rate": 3.940665988994135e-05, + "loss": 1.5205, + "step": 29125 + }, + { + "epoch": 2.29, + "learning_rate": 3.939831031860753e-05, + "loss": 1.4923, + "step": 29126 + }, + { + "epoch": 2.29, + "learning_rate": 3.938996149819814e-05, + "loss": 1.4288, + "step": 29127 + }, + { + "epoch": 2.29, + "learning_rate": 3.938161342876988e-05, + "loss": 1.4451, + "step": 29128 + }, + { + "epoch": 2.29, + "learning_rate": 3.9373266110379376e-05, + "loss": 1.4109, + "step": 29129 + }, + { + "epoch": 2.29, + "learning_rate": 3.9364919543083345e-05, + "loss": 1.4187, + "step": 29130 + }, + { + "epoch": 2.29, + "learning_rate": 3.935657372693849e-05, + "loss": 1.4303, + "step": 29131 + }, + { + "epoch": 2.29, + "learning_rate": 3.9348228662001446e-05, + "loss": 1.4454, + "step": 29132 + }, + { + "epoch": 2.29, + "learning_rate": 3.933988434832884e-05, + "loss": 1.4836, + "step": 29133 + }, + { + "epoch": 2.29, + "learning_rate": 3.9331540785977366e-05, + "loss": 1.4726, + "step": 29134 + }, + { + "epoch": 2.29, + "learning_rate": 3.9323197975003676e-05, + "loss": 1.4911, + "step": 29135 + }, + { + "epoch": 2.29, + "learning_rate": 3.931485591546436e-05, + "loss": 1.4518, + "step": 29136 + }, + { + "epoch": 2.29, + "learning_rate": 3.930651460741612e-05, + "loss": 1.4056, + "step": 29137 + }, + { + "epoch": 2.29, + "learning_rate": 3.929817405091556e-05, + "loss": 1.4267, + "step": 29138 + }, + { + "epoch": 2.29, + "learning_rate": 3.9289834246019274e-05, + "loss": 1.4806, + "step": 29139 + }, + { + "epoch": 2.29, + "learning_rate": 3.928149519278395e-05, + "loss": 1.4424, + "step": 29140 + }, + { + "epoch": 2.29, + "learning_rate": 3.927315689126618e-05, + "loss": 1.4503, + "step": 29141 + }, + { + "epoch": 2.29, + "learning_rate": 3.926481934152252e-05, + "loss": 1.4753, + "step": 29142 + }, + { + "epoch": 2.29, + "learning_rate": 3.9256482543609696e-05, + "loss": 1.4403, + "step": 29143 + }, + { + "epoch": 2.29, + "learning_rate": 3.924814649758422e-05, + "loss": 1.494, + "step": 29144 + }, + { + "epoch": 2.29, + "learning_rate": 3.923981120350272e-05, + "loss": 1.41, + "step": 29145 + }, + { + "epoch": 2.29, + "learning_rate": 3.923147666142168e-05, + "loss": 1.4351, + "step": 29146 + }, + { + "epoch": 2.29, + "learning_rate": 3.9223142871397886e-05, + "loss": 1.4439, + "step": 29147 + }, + { + "epoch": 2.29, + "learning_rate": 3.921480983348782e-05, + "loss": 1.4228, + "step": 29148 + }, + { + "epoch": 2.29, + "learning_rate": 3.920647754774806e-05, + "loss": 1.4479, + "step": 29149 + }, + { + "epoch": 2.29, + "learning_rate": 3.919814601423513e-05, + "loss": 1.3798, + "step": 29150 + }, + { + "epoch": 2.29, + "learning_rate": 3.918981523300569e-05, + "loss": 1.4501, + "step": 29151 + }, + { + "epoch": 2.29, + "learning_rate": 3.9181485204116234e-05, + "loss": 1.4349, + "step": 29152 + }, + { + "epoch": 2.29, + "learning_rate": 3.917315592762331e-05, + "loss": 1.5113, + "step": 29153 + }, + { + "epoch": 2.29, + "learning_rate": 3.9164827403583554e-05, + "loss": 1.4266, + "step": 29154 + }, + { + "epoch": 2.29, + "learning_rate": 3.915649963205343e-05, + "loss": 1.4297, + "step": 29155 + }, + { + "epoch": 2.29, + "learning_rate": 3.914817261308949e-05, + "loss": 1.468, + "step": 29156 + }, + { + "epoch": 2.29, + "learning_rate": 3.913984634674831e-05, + "loss": 1.4588, + "step": 29157 + }, + { + "epoch": 2.29, + "learning_rate": 3.91315208330864e-05, + "loss": 1.4432, + "step": 29158 + }, + { + "epoch": 2.29, + "learning_rate": 3.912319607216025e-05, + "loss": 1.4648, + "step": 29159 + }, + { + "epoch": 2.29, + "learning_rate": 3.911487206402644e-05, + "loss": 1.4972, + "step": 29160 + }, + { + "epoch": 2.29, + "learning_rate": 3.910654880874146e-05, + "loss": 1.4472, + "step": 29161 + }, + { + "epoch": 2.29, + "learning_rate": 3.909822630636178e-05, + "loss": 1.4858, + "step": 29162 + }, + { + "epoch": 2.29, + "learning_rate": 3.908990455694393e-05, + "loss": 1.4874, + "step": 29163 + }, + { + "epoch": 2.29, + "learning_rate": 3.9081583560544465e-05, + "loss": 1.4007, + "step": 29164 + }, + { + "epoch": 2.29, + "learning_rate": 3.907326331721985e-05, + "loss": 1.4624, + "step": 29165 + }, + { + "epoch": 2.29, + "learning_rate": 3.906494382702652e-05, + "loss": 1.4506, + "step": 29166 + }, + { + "epoch": 2.29, + "learning_rate": 3.9056625090021045e-05, + "loss": 1.5162, + "step": 29167 + }, + { + "epoch": 2.29, + "learning_rate": 3.904830710625985e-05, + "loss": 1.4952, + "step": 29168 + }, + { + "epoch": 2.3, + "learning_rate": 3.9039989875799435e-05, + "loss": 1.4452, + "step": 29169 + }, + { + "epoch": 2.3, + "learning_rate": 3.9031673398696206e-05, + "loss": 1.4378, + "step": 29170 + }, + { + "epoch": 2.3, + "learning_rate": 3.9023357675006714e-05, + "loss": 1.446, + "step": 29171 + }, + { + "epoch": 2.3, + "learning_rate": 3.9015042704787384e-05, + "loss": 1.4401, + "step": 29172 + }, + { + "epoch": 2.3, + "learning_rate": 3.9006728488094635e-05, + "loss": 1.4639, + "step": 29173 + }, + { + "epoch": 2.3, + "learning_rate": 3.899841502498498e-05, + "loss": 1.3643, + "step": 29174 + }, + { + "epoch": 2.3, + "learning_rate": 3.899010231551484e-05, + "loss": 1.4457, + "step": 29175 + }, + { + "epoch": 2.3, + "learning_rate": 3.898179035974061e-05, + "loss": 1.4471, + "step": 29176 + }, + { + "epoch": 2.3, + "learning_rate": 3.897347915771874e-05, + "loss": 1.5455, + "step": 29177 + }, + { + "epoch": 2.3, + "learning_rate": 3.8965168709505734e-05, + "loss": 1.4399, + "step": 29178 + }, + { + "epoch": 2.3, + "learning_rate": 3.895685901515795e-05, + "loss": 1.4036, + "step": 29179 + }, + { + "epoch": 2.3, + "learning_rate": 3.894855007473177e-05, + "loss": 1.4168, + "step": 29180 + }, + { + "epoch": 2.3, + "learning_rate": 3.8940241888283705e-05, + "loss": 1.4331, + "step": 29181 + }, + { + "epoch": 2.3, + "learning_rate": 3.8931934455870095e-05, + "loss": 1.4398, + "step": 29182 + }, + { + "epoch": 2.3, + "learning_rate": 3.892362777754732e-05, + "loss": 1.4159, + "step": 29183 + }, + { + "epoch": 2.3, + "learning_rate": 3.8915321853371865e-05, + "loss": 1.448, + "step": 29184 + }, + { + "epoch": 2.3, + "learning_rate": 3.890701668340007e-05, + "loss": 1.4748, + "step": 29185 + }, + { + "epoch": 2.3, + "learning_rate": 3.8898712267688324e-05, + "loss": 1.4411, + "step": 29186 + }, + { + "epoch": 2.3, + "learning_rate": 3.8890408606292975e-05, + "loss": 1.4562, + "step": 29187 + }, + { + "epoch": 2.3, + "learning_rate": 3.8882105699270474e-05, + "loss": 1.4841, + "step": 29188 + }, + { + "epoch": 2.3, + "learning_rate": 3.8873803546677146e-05, + "loss": 1.4653, + "step": 29189 + }, + { + "epoch": 2.3, + "learning_rate": 3.8865502148569336e-05, + "loss": 1.4139, + "step": 29190 + }, + { + "epoch": 2.3, + "learning_rate": 3.8857201505003476e-05, + "loss": 1.4505, + "step": 29191 + }, + { + "epoch": 2.3, + "learning_rate": 3.8848901616035884e-05, + "loss": 1.4577, + "step": 29192 + }, + { + "epoch": 2.3, + "learning_rate": 3.884060248172288e-05, + "loss": 1.5082, + "step": 29193 + }, + { + "epoch": 2.3, + "learning_rate": 3.883230410212083e-05, + "loss": 1.457, + "step": 29194 + }, + { + "epoch": 2.3, + "learning_rate": 3.8824006477286135e-05, + "loss": 1.5146, + "step": 29195 + }, + { + "epoch": 2.3, + "learning_rate": 3.8815709607275074e-05, + "loss": 1.4308, + "step": 29196 + }, + { + "epoch": 2.3, + "learning_rate": 3.8807413492143957e-05, + "loss": 1.4849, + "step": 29197 + }, + { + "epoch": 2.3, + "learning_rate": 3.879911813194917e-05, + "loss": 1.3727, + "step": 29198 + }, + { + "epoch": 2.3, + "learning_rate": 3.879082352674702e-05, + "loss": 1.4926, + "step": 29199 + }, + { + "epoch": 2.3, + "learning_rate": 3.878252967659377e-05, + "loss": 1.4577, + "step": 29200 + }, + { + "epoch": 2.3, + "learning_rate": 3.87742365815458e-05, + "loss": 1.4549, + "step": 29201 + }, + { + "epoch": 2.3, + "learning_rate": 3.876594424165939e-05, + "loss": 1.4128, + "step": 29202 + }, + { + "epoch": 2.3, + "learning_rate": 3.8757652656990825e-05, + "loss": 1.4569, + "step": 29203 + }, + { + "epoch": 2.3, + "learning_rate": 3.874936182759637e-05, + "loss": 1.4482, + "step": 29204 + }, + { + "epoch": 2.3, + "learning_rate": 3.87410717535324e-05, + "loss": 1.4152, + "step": 29205 + }, + { + "epoch": 2.3, + "learning_rate": 3.873278243485516e-05, + "loss": 1.4384, + "step": 29206 + }, + { + "epoch": 2.3, + "learning_rate": 3.872449387162087e-05, + "loss": 1.4431, + "step": 29207 + }, + { + "epoch": 2.3, + "learning_rate": 3.8716206063885925e-05, + "loss": 1.4497, + "step": 29208 + }, + { + "epoch": 2.3, + "learning_rate": 3.8707919011706464e-05, + "loss": 1.4029, + "step": 29209 + }, + { + "epoch": 2.3, + "learning_rate": 3.869963271513887e-05, + "loss": 1.4599, + "step": 29210 + }, + { + "epoch": 2.3, + "learning_rate": 3.8691347174239294e-05, + "loss": 1.4265, + "step": 29211 + }, + { + "epoch": 2.3, + "learning_rate": 3.86830623890641e-05, + "loss": 1.4655, + "step": 29212 + }, + { + "epoch": 2.3, + "learning_rate": 3.867477835966949e-05, + "loss": 1.4639, + "step": 29213 + }, + { + "epoch": 2.3, + "learning_rate": 3.8666495086111646e-05, + "loss": 1.4713, + "step": 29214 + }, + { + "epoch": 2.3, + "learning_rate": 3.86582125684469e-05, + "loss": 1.4996, + "step": 29215 + }, + { + "epoch": 2.3, + "learning_rate": 3.864993080673146e-05, + "loss": 1.4718, + "step": 29216 + }, + { + "epoch": 2.3, + "learning_rate": 3.86416498010215e-05, + "loss": 1.4766, + "step": 29217 + }, + { + "epoch": 2.3, + "learning_rate": 3.863336955137331e-05, + "loss": 1.4871, + "step": 29218 + }, + { + "epoch": 2.3, + "learning_rate": 3.8625090057843104e-05, + "loss": 1.4315, + "step": 29219 + }, + { + "epoch": 2.3, + "learning_rate": 3.861681132048702e-05, + "loss": 1.4491, + "step": 29220 + }, + { + "epoch": 2.3, + "learning_rate": 3.860853333936137e-05, + "loss": 1.4495, + "step": 29221 + }, + { + "epoch": 2.3, + "learning_rate": 3.86002561145223e-05, + "loss": 1.4574, + "step": 29222 + }, + { + "epoch": 2.3, + "learning_rate": 3.859197964602601e-05, + "loss": 1.4116, + "step": 29223 + }, + { + "epoch": 2.3, + "learning_rate": 3.858370393392863e-05, + "loss": 1.4873, + "step": 29224 + }, + { + "epoch": 2.3, + "learning_rate": 3.857542897828649e-05, + "loss": 1.4544, + "step": 29225 + }, + { + "epoch": 2.3, + "learning_rate": 3.8567154779155704e-05, + "loss": 1.4747, + "step": 29226 + }, + { + "epoch": 2.3, + "learning_rate": 3.855888133659244e-05, + "loss": 1.414, + "step": 29227 + }, + { + "epoch": 2.3, + "learning_rate": 3.855060865065284e-05, + "loss": 1.4424, + "step": 29228 + }, + { + "epoch": 2.3, + "learning_rate": 3.854233672139313e-05, + "loss": 1.4861, + "step": 29229 + }, + { + "epoch": 2.3, + "learning_rate": 3.853406554886946e-05, + "loss": 1.4756, + "step": 29230 + }, + { + "epoch": 2.3, + "learning_rate": 3.8525795133137915e-05, + "loss": 1.4621, + "step": 29231 + }, + { + "epoch": 2.3, + "learning_rate": 3.851752547425477e-05, + "loss": 1.4394, + "step": 29232 + }, + { + "epoch": 2.3, + "learning_rate": 3.8509256572276087e-05, + "loss": 1.4317, + "step": 29233 + }, + { + "epoch": 2.3, + "learning_rate": 3.8500988427258e-05, + "loss": 1.4409, + "step": 29234 + }, + { + "epoch": 2.3, + "learning_rate": 3.84927210392567e-05, + "loss": 1.4757, + "step": 29235 + }, + { + "epoch": 2.3, + "learning_rate": 3.84844544083283e-05, + "loss": 1.4709, + "step": 29236 + }, + { + "epoch": 2.3, + "learning_rate": 3.847618853452885e-05, + "loss": 1.4187, + "step": 29237 + }, + { + "epoch": 2.3, + "learning_rate": 3.8467923417914605e-05, + "loss": 1.4785, + "step": 29238 + }, + { + "epoch": 2.3, + "learning_rate": 3.845965905854159e-05, + "loss": 1.4557, + "step": 29239 + }, + { + "epoch": 2.3, + "learning_rate": 3.845139545646591e-05, + "loss": 1.4761, + "step": 29240 + }, + { + "epoch": 2.3, + "learning_rate": 3.844313261174368e-05, + "loss": 1.4112, + "step": 29241 + }, + { + "epoch": 2.3, + "learning_rate": 3.8434870524431076e-05, + "loss": 1.4333, + "step": 29242 + }, + { + "epoch": 2.3, + "learning_rate": 3.842660919458414e-05, + "loss": 1.4744, + "step": 29243 + }, + { + "epoch": 2.3, + "learning_rate": 3.841834862225894e-05, + "loss": 1.4635, + "step": 29244 + }, + { + "epoch": 2.3, + "learning_rate": 3.841008880751154e-05, + "loss": 1.4605, + "step": 29245 + }, + { + "epoch": 2.3, + "learning_rate": 3.840182975039811e-05, + "loss": 1.4506, + "step": 29246 + }, + { + "epoch": 2.3, + "learning_rate": 3.839357145097466e-05, + "loss": 1.4209, + "step": 29247 + }, + { + "epoch": 2.3, + "learning_rate": 3.838531390929722e-05, + "loss": 1.4333, + "step": 29248 + }, + { + "epoch": 2.3, + "learning_rate": 3.8377057125421976e-05, + "loss": 1.4642, + "step": 29249 + }, + { + "epoch": 2.3, + "learning_rate": 3.836880109940488e-05, + "loss": 1.4562, + "step": 29250 + }, + { + "epoch": 2.3, + "learning_rate": 3.836054583130199e-05, + "loss": 1.4789, + "step": 29251 + }, + { + "epoch": 2.3, + "learning_rate": 3.835229132116944e-05, + "loss": 1.4386, + "step": 29252 + }, + { + "epoch": 2.3, + "learning_rate": 3.834403756906322e-05, + "loss": 1.4968, + "step": 29253 + }, + { + "epoch": 2.3, + "learning_rate": 3.833578457503931e-05, + "loss": 1.4535, + "step": 29254 + }, + { + "epoch": 2.3, + "learning_rate": 3.832753233915386e-05, + "loss": 1.4828, + "step": 29255 + }, + { + "epoch": 2.3, + "learning_rate": 3.8319280861462787e-05, + "loss": 1.4823, + "step": 29256 + }, + { + "epoch": 2.3, + "learning_rate": 3.8311030142022206e-05, + "loss": 1.4291, + "step": 29257 + }, + { + "epoch": 2.3, + "learning_rate": 3.830278018088807e-05, + "loss": 1.4353, + "step": 29258 + }, + { + "epoch": 2.3, + "learning_rate": 3.8294530978116445e-05, + "loss": 1.4761, + "step": 29259 + }, + { + "epoch": 2.3, + "learning_rate": 3.8286282533763304e-05, + "loss": 1.4417, + "step": 29260 + }, + { + "epoch": 2.3, + "learning_rate": 3.827803484788468e-05, + "loss": 1.4394, + "step": 29261 + }, + { + "epoch": 2.3, + "learning_rate": 3.826978792053647e-05, + "loss": 1.4149, + "step": 29262 + }, + { + "epoch": 2.3, + "learning_rate": 3.826154175177481e-05, + "loss": 1.396, + "step": 29263 + }, + { + "epoch": 2.3, + "learning_rate": 3.8253296341655616e-05, + "loss": 1.4726, + "step": 29264 + }, + { + "epoch": 2.3, + "learning_rate": 3.8245051690234826e-05, + "loss": 1.4653, + "step": 29265 + }, + { + "epoch": 2.3, + "learning_rate": 3.8236807797568505e-05, + "loss": 1.4706, + "step": 29266 + }, + { + "epoch": 2.3, + "learning_rate": 3.822856466371259e-05, + "loss": 1.4986, + "step": 29267 + }, + { + "epoch": 2.3, + "learning_rate": 3.8220322288722995e-05, + "loss": 1.4219, + "step": 29268 + }, + { + "epoch": 2.3, + "learning_rate": 3.8212080672655757e-05, + "loss": 1.4892, + "step": 29269 + }, + { + "epoch": 2.3, + "learning_rate": 3.8203839815566813e-05, + "loss": 1.4393, + "step": 29270 + }, + { + "epoch": 2.3, + "learning_rate": 3.8195599717512056e-05, + "loss": 1.4755, + "step": 29271 + }, + { + "epoch": 2.3, + "learning_rate": 3.818736037854747e-05, + "loss": 1.452, + "step": 29272 + }, + { + "epoch": 2.3, + "learning_rate": 3.817912179872907e-05, + "loss": 1.459, + "step": 29273 + }, + { + "epoch": 2.3, + "learning_rate": 3.8170883978112716e-05, + "loss": 1.4454, + "step": 29274 + }, + { + "epoch": 2.3, + "learning_rate": 3.816264691675429e-05, + "loss": 1.466, + "step": 29275 + }, + { + "epoch": 2.3, + "learning_rate": 3.815441061470984e-05, + "loss": 1.4261, + "step": 29276 + }, + { + "epoch": 2.3, + "learning_rate": 3.81461750720352e-05, + "loss": 1.4352, + "step": 29277 + }, + { + "epoch": 2.3, + "learning_rate": 3.813794028878627e-05, + "loss": 1.4418, + "step": 29278 + }, + { + "epoch": 2.3, + "learning_rate": 3.8129706265019037e-05, + "loss": 1.5267, + "step": 29279 + }, + { + "epoch": 2.3, + "learning_rate": 3.812147300078937e-05, + "loss": 1.4576, + "step": 29280 + }, + { + "epoch": 2.3, + "learning_rate": 3.8113240496153156e-05, + "loss": 1.4537, + "step": 29281 + }, + { + "epoch": 2.3, + "learning_rate": 3.8105008751166236e-05, + "loss": 1.4725, + "step": 29282 + }, + { + "epoch": 2.3, + "learning_rate": 3.809677776588463e-05, + "loss": 1.48, + "step": 29283 + }, + { + "epoch": 2.3, + "learning_rate": 3.8088547540364135e-05, + "loss": 1.5164, + "step": 29284 + }, + { + "epoch": 2.3, + "learning_rate": 3.808031807466059e-05, + "loss": 1.4198, + "step": 29285 + }, + { + "epoch": 2.3, + "learning_rate": 3.807208936882998e-05, + "loss": 1.479, + "step": 29286 + }, + { + "epoch": 2.3, + "learning_rate": 3.806386142292808e-05, + "loss": 1.422, + "step": 29287 + }, + { + "epoch": 2.3, + "learning_rate": 3.805563423701083e-05, + "loss": 1.4492, + "step": 29288 + }, + { + "epoch": 2.3, + "learning_rate": 3.8047407811133994e-05, + "loss": 1.4481, + "step": 29289 + }, + { + "epoch": 2.3, + "learning_rate": 3.803918214535353e-05, + "loss": 1.4631, + "step": 29290 + }, + { + "epoch": 2.3, + "learning_rate": 3.803095723972522e-05, + "loss": 1.4727, + "step": 29291 + }, + { + "epoch": 2.3, + "learning_rate": 3.8022733094304896e-05, + "loss": 1.482, + "step": 29292 + }, + { + "epoch": 2.3, + "learning_rate": 3.8014509709148456e-05, + "loss": 1.4606, + "step": 29293 + }, + { + "epoch": 2.3, + "learning_rate": 3.800628708431169e-05, + "loss": 1.4697, + "step": 29294 + }, + { + "epoch": 2.3, + "learning_rate": 3.79980652198504e-05, + "loss": 1.4436, + "step": 29295 + }, + { + "epoch": 2.31, + "learning_rate": 3.798984411582048e-05, + "loss": 1.4183, + "step": 29296 + }, + { + "epoch": 2.31, + "learning_rate": 3.7981623772277694e-05, + "loss": 1.4689, + "step": 29297 + }, + { + "epoch": 2.31, + "learning_rate": 3.7973404189277876e-05, + "loss": 1.449, + "step": 29298 + }, + { + "epoch": 2.31, + "learning_rate": 3.7965185366876776e-05, + "loss": 1.4967, + "step": 29299 + }, + { + "epoch": 2.31, + "learning_rate": 3.795696730513028e-05, + "loss": 1.4489, + "step": 29300 + }, + { + "epoch": 2.31, + "learning_rate": 3.7948750004094166e-05, + "loss": 1.4893, + "step": 29301 + }, + { + "epoch": 2.31, + "learning_rate": 3.7940533463824146e-05, + "loss": 1.4111, + "step": 29302 + }, + { + "epoch": 2.31, + "learning_rate": 3.7932317684376054e-05, + "loss": 1.4896, + "step": 29303 + }, + { + "epoch": 2.31, + "learning_rate": 3.792410266580573e-05, + "loss": 1.3941, + "step": 29304 + }, + { + "epoch": 2.31, + "learning_rate": 3.7915888408168915e-05, + "loss": 1.5065, + "step": 29305 + }, + { + "epoch": 2.31, + "learning_rate": 3.790767491152132e-05, + "loss": 1.5066, + "step": 29306 + }, + { + "epoch": 2.31, + "learning_rate": 3.789946217591878e-05, + "loss": 1.4628, + "step": 29307 + }, + { + "epoch": 2.31, + "learning_rate": 3.7891250201417046e-05, + "loss": 1.4539, + "step": 29308 + }, + { + "epoch": 2.31, + "learning_rate": 3.7883038988071794e-05, + "loss": 1.4321, + "step": 29309 + }, + { + "epoch": 2.31, + "learning_rate": 3.78748285359389e-05, + "loss": 1.5047, + "step": 29310 + }, + { + "epoch": 2.31, + "learning_rate": 3.7866618845074035e-05, + "loss": 1.4136, + "step": 29311 + }, + { + "epoch": 2.31, + "learning_rate": 3.785840991553291e-05, + "loss": 1.4721, + "step": 29312 + }, + { + "epoch": 2.31, + "learning_rate": 3.785020174737134e-05, + "loss": 1.4683, + "step": 29313 + }, + { + "epoch": 2.31, + "learning_rate": 3.7841994340645004e-05, + "loss": 1.4475, + "step": 29314 + }, + { + "epoch": 2.31, + "learning_rate": 3.7833787695409626e-05, + "loss": 1.4551, + "step": 29315 + }, + { + "epoch": 2.31, + "learning_rate": 3.7825581811720896e-05, + "loss": 1.4198, + "step": 29316 + }, + { + "epoch": 2.31, + "learning_rate": 3.781737668963461e-05, + "loss": 1.382, + "step": 29317 + }, + { + "epoch": 2.31, + "learning_rate": 3.780917232920643e-05, + "loss": 1.4766, + "step": 29318 + }, + { + "epoch": 2.31, + "learning_rate": 3.780096873049197e-05, + "loss": 1.4431, + "step": 29319 + }, + { + "epoch": 2.31, + "learning_rate": 3.77927658935471e-05, + "loss": 1.4297, + "step": 29320 + }, + { + "epoch": 2.31, + "learning_rate": 3.778456381842742e-05, + "loss": 1.4697, + "step": 29321 + }, + { + "epoch": 2.31, + "learning_rate": 3.777636250518864e-05, + "loss": 1.4609, + "step": 29322 + }, + { + "epoch": 2.31, + "learning_rate": 3.776816195388637e-05, + "loss": 1.443, + "step": 29323 + }, + { + "epoch": 2.31, + "learning_rate": 3.775996216457641e-05, + "loss": 1.406, + "step": 29324 + }, + { + "epoch": 2.31, + "learning_rate": 3.775176313731435e-05, + "loss": 1.4703, + "step": 29325 + }, + { + "epoch": 2.31, + "learning_rate": 3.774356487215584e-05, + "loss": 1.4694, + "step": 29326 + }, + { + "epoch": 2.31, + "learning_rate": 3.773536736915662e-05, + "loss": 1.4571, + "step": 29327 + }, + { + "epoch": 2.31, + "learning_rate": 3.7727170628372285e-05, + "loss": 1.4434, + "step": 29328 + }, + { + "epoch": 2.31, + "learning_rate": 3.771897464985848e-05, + "loss": 1.4165, + "step": 29329 + }, + { + "epoch": 2.31, + "learning_rate": 3.7710779433670915e-05, + "loss": 1.4714, + "step": 29330 + }, + { + "epoch": 2.31, + "learning_rate": 3.7702584979865186e-05, + "loss": 1.4516, + "step": 29331 + }, + { + "epoch": 2.31, + "learning_rate": 3.7694391288496886e-05, + "loss": 1.4045, + "step": 29332 + }, + { + "epoch": 2.31, + "learning_rate": 3.768619835962176e-05, + "loss": 1.4503, + "step": 29333 + }, + { + "epoch": 2.31, + "learning_rate": 3.767800619329531e-05, + "loss": 1.4004, + "step": 29334 + }, + { + "epoch": 2.31, + "learning_rate": 3.766981478957325e-05, + "loss": 1.4606, + "step": 29335 + }, + { + "epoch": 2.31, + "learning_rate": 3.7661624148511125e-05, + "loss": 1.4509, + "step": 29336 + }, + { + "epoch": 2.31, + "learning_rate": 3.765343427016463e-05, + "loss": 1.4751, + "step": 29337 + }, + { + "epoch": 2.31, + "learning_rate": 3.764524515458929e-05, + "loss": 1.4606, + "step": 29338 + }, + { + "epoch": 2.31, + "learning_rate": 3.763705680184076e-05, + "loss": 1.4599, + "step": 29339 + }, + { + "epoch": 2.31, + "learning_rate": 3.762886921197455e-05, + "loss": 1.469, + "step": 29340 + }, + { + "epoch": 2.31, + "learning_rate": 3.762068238504635e-05, + "loss": 1.4395, + "step": 29341 + }, + { + "epoch": 2.31, + "learning_rate": 3.761249632111171e-05, + "loss": 1.4756, + "step": 29342 + }, + { + "epoch": 2.31, + "learning_rate": 3.760431102022615e-05, + "loss": 1.4128, + "step": 29343 + }, + { + "epoch": 2.31, + "learning_rate": 3.7596126482445344e-05, + "loss": 1.4827, + "step": 29344 + }, + { + "epoch": 2.31, + "learning_rate": 3.7587942707824805e-05, + "loss": 1.4052, + "step": 29345 + }, + { + "epoch": 2.31, + "learning_rate": 3.757975969642005e-05, + "loss": 1.4302, + "step": 29346 + }, + { + "epoch": 2.31, + "learning_rate": 3.7571577448286734e-05, + "loss": 1.4885, + "step": 29347 + }, + { + "epoch": 2.31, + "learning_rate": 3.756339596348037e-05, + "loss": 1.4639, + "step": 29348 + }, + { + "epoch": 2.31, + "learning_rate": 3.755521524205645e-05, + "loss": 1.4423, + "step": 29349 + }, + { + "epoch": 2.31, + "learning_rate": 3.754703528407057e-05, + "loss": 1.4398, + "step": 29350 + }, + { + "epoch": 2.31, + "learning_rate": 3.753885608957831e-05, + "loss": 1.4528, + "step": 29351 + }, + { + "epoch": 2.31, + "learning_rate": 3.753067765863515e-05, + "loss": 1.4308, + "step": 29352 + }, + { + "epoch": 2.31, + "learning_rate": 3.752249999129659e-05, + "loss": 1.4171, + "step": 29353 + }, + { + "epoch": 2.31, + "learning_rate": 3.751432308761822e-05, + "loss": 1.4542, + "step": 29354 + }, + { + "epoch": 2.31, + "learning_rate": 3.750614694765551e-05, + "loss": 1.4119, + "step": 29355 + }, + { + "epoch": 2.31, + "learning_rate": 3.749797157146401e-05, + "loss": 1.4455, + "step": 29356 + }, + { + "epoch": 2.31, + "learning_rate": 3.748979695909914e-05, + "loss": 1.4964, + "step": 29357 + }, + { + "epoch": 2.31, + "learning_rate": 3.748162311061649e-05, + "loss": 1.4755, + "step": 29358 + }, + { + "epoch": 2.31, + "learning_rate": 3.747345002607154e-05, + "loss": 1.4633, + "step": 29359 + }, + { + "epoch": 2.31, + "learning_rate": 3.746527770551973e-05, + "loss": 1.4535, + "step": 29360 + }, + { + "epoch": 2.31, + "learning_rate": 3.745710614901662e-05, + "loss": 1.4545, + "step": 29361 + }, + { + "epoch": 2.31, + "learning_rate": 3.7448935356617665e-05, + "loss": 1.4228, + "step": 29362 + }, + { + "epoch": 2.31, + "learning_rate": 3.744076532837826e-05, + "loss": 1.4707, + "step": 29363 + }, + { + "epoch": 2.31, + "learning_rate": 3.7432596064354006e-05, + "loss": 1.4606, + "step": 29364 + }, + { + "epoch": 2.31, + "learning_rate": 3.742442756460031e-05, + "loss": 1.4737, + "step": 29365 + }, + { + "epoch": 2.31, + "learning_rate": 3.741625982917256e-05, + "loss": 1.4945, + "step": 29366 + }, + { + "epoch": 2.31, + "learning_rate": 3.7408092858126284e-05, + "loss": 1.5138, + "step": 29367 + }, + { + "epoch": 2.31, + "learning_rate": 3.739992665151697e-05, + "loss": 1.5043, + "step": 29368 + }, + { + "epoch": 2.31, + "learning_rate": 3.7391761209400026e-05, + "loss": 1.4003, + "step": 29369 + }, + { + "epoch": 2.31, + "learning_rate": 3.738359653183083e-05, + "loss": 1.4852, + "step": 29370 + }, + { + "epoch": 2.31, + "learning_rate": 3.7375432618864906e-05, + "loss": 1.4485, + "step": 29371 + }, + { + "epoch": 2.31, + "learning_rate": 3.736726947055766e-05, + "loss": 1.4427, + "step": 29372 + }, + { + "epoch": 2.31, + "learning_rate": 3.7359107086964485e-05, + "loss": 1.4558, + "step": 29373 + }, + { + "epoch": 2.31, + "learning_rate": 3.7350945468140756e-05, + "loss": 1.4155, + "step": 29374 + }, + { + "epoch": 2.31, + "learning_rate": 3.7342784614142005e-05, + "loss": 1.4734, + "step": 29375 + }, + { + "epoch": 2.31, + "learning_rate": 3.733462452502357e-05, + "loss": 1.4844, + "step": 29376 + }, + { + "epoch": 2.31, + "learning_rate": 3.732646520084082e-05, + "loss": 1.4578, + "step": 29377 + }, + { + "epoch": 2.31, + "learning_rate": 3.7318306641649244e-05, + "loss": 1.4597, + "step": 29378 + }, + { + "epoch": 2.31, + "learning_rate": 3.7310148847504174e-05, + "loss": 1.4679, + "step": 29379 + }, + { + "epoch": 2.31, + "learning_rate": 3.730199181846095e-05, + "loss": 1.4044, + "step": 29380 + }, + { + "epoch": 2.31, + "learning_rate": 3.729383555457507e-05, + "loss": 1.4484, + "step": 29381 + }, + { + "epoch": 2.31, + "learning_rate": 3.7285680055901796e-05, + "loss": 1.5134, + "step": 29382 + }, + { + "epoch": 2.31, + "learning_rate": 3.7277525322496606e-05, + "loss": 1.4419, + "step": 29383 + }, + { + "epoch": 2.31, + "learning_rate": 3.726937135441477e-05, + "loss": 1.4613, + "step": 29384 + }, + { + "epoch": 2.31, + "learning_rate": 3.7261218151711743e-05, + "loss": 1.4299, + "step": 29385 + }, + { + "epoch": 2.31, + "learning_rate": 3.7253065714442816e-05, + "loss": 1.4348, + "step": 29386 + }, + { + "epoch": 2.31, + "learning_rate": 3.724491404266331e-05, + "loss": 1.4482, + "step": 29387 + }, + { + "epoch": 2.31, + "learning_rate": 3.7236763136428664e-05, + "loss": 1.4274, + "step": 29388 + }, + { + "epoch": 2.31, + "learning_rate": 3.722861299579417e-05, + "loss": 1.3954, + "step": 29389 + }, + { + "epoch": 2.31, + "learning_rate": 3.722046362081512e-05, + "loss": 1.4167, + "step": 29390 + }, + { + "epoch": 2.31, + "learning_rate": 3.721231501154692e-05, + "loss": 1.4611, + "step": 29391 + }, + { + "epoch": 2.31, + "learning_rate": 3.720416716804486e-05, + "loss": 1.471, + "step": 29392 + }, + { + "epoch": 2.31, + "learning_rate": 3.719602009036426e-05, + "loss": 1.483, + "step": 29393 + }, + { + "epoch": 2.31, + "learning_rate": 3.71878737785604e-05, + "loss": 1.493, + "step": 29394 + }, + { + "epoch": 2.31, + "learning_rate": 3.717972823268866e-05, + "loss": 1.4662, + "step": 29395 + }, + { + "epoch": 2.31, + "learning_rate": 3.717158345280429e-05, + "loss": 1.4375, + "step": 29396 + }, + { + "epoch": 2.31, + "learning_rate": 3.716343943896259e-05, + "loss": 1.4667, + "step": 29397 + }, + { + "epoch": 2.31, + "learning_rate": 3.7155296191218856e-05, + "loss": 1.4571, + "step": 29398 + }, + { + "epoch": 2.31, + "learning_rate": 3.714715370962842e-05, + "loss": 1.4021, + "step": 29399 + }, + { + "epoch": 2.31, + "learning_rate": 3.713901199424654e-05, + "loss": 1.45, + "step": 29400 + }, + { + "epoch": 2.31, + "learning_rate": 3.7130871045128446e-05, + "loss": 1.4126, + "step": 29401 + }, + { + "epoch": 2.31, + "learning_rate": 3.712273086232949e-05, + "loss": 1.4802, + "step": 29402 + }, + { + "epoch": 2.31, + "learning_rate": 3.7114591445904904e-05, + "loss": 1.468, + "step": 29403 + }, + { + "epoch": 2.31, + "learning_rate": 3.710645279590991e-05, + "loss": 1.4325, + "step": 29404 + }, + { + "epoch": 2.31, + "learning_rate": 3.709831491239984e-05, + "loss": 1.4655, + "step": 29405 + }, + { + "epoch": 2.31, + "learning_rate": 3.70901777954299e-05, + "loss": 1.4946, + "step": 29406 + }, + { + "epoch": 2.31, + "learning_rate": 3.708204144505531e-05, + "loss": 1.4598, + "step": 29407 + }, + { + "epoch": 2.31, + "learning_rate": 3.7073905861331376e-05, + "loss": 1.4602, + "step": 29408 + }, + { + "epoch": 2.31, + "learning_rate": 3.706577104431332e-05, + "loss": 1.5245, + "step": 29409 + }, + { + "epoch": 2.31, + "learning_rate": 3.7057636994056346e-05, + "loss": 1.5176, + "step": 29410 + }, + { + "epoch": 2.31, + "learning_rate": 3.7049503710615655e-05, + "loss": 1.432, + "step": 29411 + }, + { + "epoch": 2.31, + "learning_rate": 3.7041371194046535e-05, + "loss": 1.4908, + "step": 29412 + }, + { + "epoch": 2.31, + "learning_rate": 3.703323944440414e-05, + "loss": 1.3729, + "step": 29413 + }, + { + "epoch": 2.31, + "learning_rate": 3.7025108461743735e-05, + "loss": 1.4907, + "step": 29414 + }, + { + "epoch": 2.31, + "learning_rate": 3.701697824612047e-05, + "loss": 1.4879, + "step": 29415 + }, + { + "epoch": 2.31, + "learning_rate": 3.70088487975896e-05, + "loss": 1.4523, + "step": 29416 + }, + { + "epoch": 2.31, + "learning_rate": 3.7000720116206315e-05, + "loss": 1.4667, + "step": 29417 + }, + { + "epoch": 2.31, + "learning_rate": 3.699259220202572e-05, + "loss": 1.4241, + "step": 29418 + }, + { + "epoch": 2.31, + "learning_rate": 3.698446505510311e-05, + "loss": 1.446, + "step": 29419 + }, + { + "epoch": 2.31, + "learning_rate": 3.697633867549363e-05, + "loss": 1.4413, + "step": 29420 + }, + { + "epoch": 2.31, + "learning_rate": 3.696821306325237e-05, + "loss": 1.4923, + "step": 29421 + }, + { + "epoch": 2.31, + "learning_rate": 3.696008821843463e-05, + "loss": 1.4189, + "step": 29422 + }, + { + "epoch": 2.32, + "learning_rate": 3.6951964141095505e-05, + "loss": 1.5031, + "step": 29423 + }, + { + "epoch": 2.32, + "learning_rate": 3.694384083129011e-05, + "loss": 1.4192, + "step": 29424 + }, + { + "epoch": 2.32, + "learning_rate": 3.69357182890737e-05, + "loss": 1.4826, + "step": 29425 + }, + { + "epoch": 2.32, + "learning_rate": 3.692759651450135e-05, + "loss": 1.4479, + "step": 29426 + }, + { + "epoch": 2.32, + "learning_rate": 3.6919475507628244e-05, + "loss": 1.403, + "step": 29427 + }, + { + "epoch": 2.32, + "learning_rate": 3.691135526850945e-05, + "loss": 1.4402, + "step": 29428 + }, + { + "epoch": 2.32, + "learning_rate": 3.6903235797200134e-05, + "loss": 1.4696, + "step": 29429 + }, + { + "epoch": 2.32, + "learning_rate": 3.689511709375547e-05, + "loss": 1.4421, + "step": 29430 + }, + { + "epoch": 2.32, + "learning_rate": 3.688699915823052e-05, + "loss": 1.4535, + "step": 29431 + }, + { + "epoch": 2.32, + "learning_rate": 3.687888199068046e-05, + "loss": 1.447, + "step": 29432 + }, + { + "epoch": 2.32, + "learning_rate": 3.6870765591160364e-05, + "loss": 1.423, + "step": 29433 + }, + { + "epoch": 2.32, + "learning_rate": 3.686264995972536e-05, + "loss": 1.4435, + "step": 29434 + }, + { + "epoch": 2.32, + "learning_rate": 3.685453509643046e-05, + "loss": 1.468, + "step": 29435 + }, + { + "epoch": 2.32, + "learning_rate": 3.684642100133087e-05, + "loss": 1.4783, + "step": 29436 + }, + { + "epoch": 2.32, + "learning_rate": 3.6838307674481665e-05, + "loss": 1.4141, + "step": 29437 + }, + { + "epoch": 2.32, + "learning_rate": 3.683019511593783e-05, + "loss": 1.4706, + "step": 29438 + }, + { + "epoch": 2.32, + "learning_rate": 3.682208332575458e-05, + "loss": 1.4198, + "step": 29439 + }, + { + "epoch": 2.32, + "learning_rate": 3.681397230398692e-05, + "loss": 1.4831, + "step": 29440 + }, + { + "epoch": 2.32, + "learning_rate": 3.680586205068989e-05, + "loss": 1.4581, + "step": 29441 + }, + { + "epoch": 2.32, + "learning_rate": 3.679775256591862e-05, + "loss": 1.4404, + "step": 29442 + }, + { + "epoch": 2.32, + "learning_rate": 3.6789643849728154e-05, + "loss": 1.3945, + "step": 29443 + }, + { + "epoch": 2.32, + "learning_rate": 3.678153590217349e-05, + "loss": 1.496, + "step": 29444 + }, + { + "epoch": 2.32, + "learning_rate": 3.6773428723309703e-05, + "loss": 1.4423, + "step": 29445 + }, + { + "epoch": 2.32, + "learning_rate": 3.6765322313191915e-05, + "loss": 1.4896, + "step": 29446 + }, + { + "epoch": 2.32, + "learning_rate": 3.6757216671875084e-05, + "loss": 1.4676, + "step": 29447 + }, + { + "epoch": 2.32, + "learning_rate": 3.674911179941422e-05, + "loss": 1.3923, + "step": 29448 + }, + { + "epoch": 2.32, + "learning_rate": 3.674100769586443e-05, + "loss": 1.4795, + "step": 29449 + }, + { + "epoch": 2.32, + "learning_rate": 3.673290436128071e-05, + "loss": 1.4584, + "step": 29450 + }, + { + "epoch": 2.32, + "learning_rate": 3.6724801795718045e-05, + "loss": 1.4312, + "step": 29451 + }, + { + "epoch": 2.32, + "learning_rate": 3.6716699999231437e-05, + "loss": 1.4365, + "step": 29452 + }, + { + "epoch": 2.32, + "learning_rate": 3.670859897187595e-05, + "loss": 1.5086, + "step": 29453 + }, + { + "epoch": 2.32, + "learning_rate": 3.6700498713706566e-05, + "loss": 1.4219, + "step": 29454 + }, + { + "epoch": 2.32, + "learning_rate": 3.6692399224778236e-05, + "loss": 1.4381, + "step": 29455 + }, + { + "epoch": 2.32, + "learning_rate": 3.668430050514601e-05, + "loss": 1.4333, + "step": 29456 + }, + { + "epoch": 2.32, + "learning_rate": 3.6676202554864875e-05, + "loss": 1.4789, + "step": 29457 + }, + { + "epoch": 2.32, + "learning_rate": 3.666810537398973e-05, + "loss": 1.4875, + "step": 29458 + }, + { + "epoch": 2.32, + "learning_rate": 3.6660008962575654e-05, + "loss": 1.4475, + "step": 29459 + }, + { + "epoch": 2.32, + "learning_rate": 3.6651913320677515e-05, + "loss": 1.4516, + "step": 29460 + }, + { + "epoch": 2.32, + "learning_rate": 3.664381844835039e-05, + "loss": 1.4708, + "step": 29461 + }, + { + "epoch": 2.32, + "learning_rate": 3.663572434564914e-05, + "loss": 1.4586, + "step": 29462 + }, + { + "epoch": 2.32, + "learning_rate": 3.662763101262881e-05, + "loss": 1.4537, + "step": 29463 + }, + { + "epoch": 2.32, + "learning_rate": 3.66195384493443e-05, + "loss": 1.4655, + "step": 29464 + }, + { + "epoch": 2.32, + "learning_rate": 3.661144665585049e-05, + "loss": 1.4166, + "step": 29465 + }, + { + "epoch": 2.32, + "learning_rate": 3.6603355632202454e-05, + "loss": 1.4314, + "step": 29466 + }, + { + "epoch": 2.32, + "learning_rate": 3.659526537845504e-05, + "loss": 1.4587, + "step": 29467 + }, + { + "epoch": 2.32, + "learning_rate": 3.6587175894663195e-05, + "loss": 1.4454, + "step": 29468 + }, + { + "epoch": 2.32, + "learning_rate": 3.657908718088181e-05, + "loss": 1.48, + "step": 29469 + }, + { + "epoch": 2.32, + "learning_rate": 3.657099923716586e-05, + "loss": 1.4615, + "step": 29470 + }, + { + "epoch": 2.32, + "learning_rate": 3.656291206357023e-05, + "loss": 1.4557, + "step": 29471 + }, + { + "epoch": 2.32, + "learning_rate": 3.65548256601498e-05, + "loss": 1.4084, + "step": 29472 + }, + { + "epoch": 2.32, + "learning_rate": 3.654674002695952e-05, + "loss": 1.432, + "step": 29473 + }, + { + "epoch": 2.32, + "learning_rate": 3.653865516405428e-05, + "loss": 1.4635, + "step": 29474 + }, + { + "epoch": 2.32, + "learning_rate": 3.6530571071488916e-05, + "loss": 1.4509, + "step": 29475 + }, + { + "epoch": 2.32, + "learning_rate": 3.652248774931835e-05, + "loss": 1.4635, + "step": 29476 + }, + { + "epoch": 2.32, + "learning_rate": 3.6514405197597524e-05, + "loss": 1.4867, + "step": 29477 + }, + { + "epoch": 2.32, + "learning_rate": 3.6506323416381254e-05, + "loss": 1.4545, + "step": 29478 + }, + { + "epoch": 2.32, + "learning_rate": 3.649824240572437e-05, + "loss": 1.4023, + "step": 29479 + }, + { + "epoch": 2.32, + "learning_rate": 3.649016216568184e-05, + "loss": 1.424, + "step": 29480 + }, + { + "epoch": 2.32, + "learning_rate": 3.6482082696308454e-05, + "loss": 1.4796, + "step": 29481 + }, + { + "epoch": 2.32, + "learning_rate": 3.647400399765904e-05, + "loss": 1.4677, + "step": 29482 + }, + { + "epoch": 2.32, + "learning_rate": 3.6465926069788546e-05, + "loss": 1.5069, + "step": 29483 + }, + { + "epoch": 2.32, + "learning_rate": 3.645784891275175e-05, + "loss": 1.4712, + "step": 29484 + }, + { + "epoch": 2.32, + "learning_rate": 3.644977252660351e-05, + "loss": 1.4364, + "step": 29485 + }, + { + "epoch": 2.32, + "learning_rate": 3.644169691139859e-05, + "loss": 1.4634, + "step": 29486 + }, + { + "epoch": 2.32, + "learning_rate": 3.643362206719194e-05, + "loss": 1.4357, + "step": 29487 + }, + { + "epoch": 2.32, + "learning_rate": 3.642554799403833e-05, + "loss": 1.403, + "step": 29488 + }, + { + "epoch": 2.32, + "learning_rate": 3.641747469199253e-05, + "loss": 1.4376, + "step": 29489 + }, + { + "epoch": 2.32, + "learning_rate": 3.6409402161109424e-05, + "loss": 1.4666, + "step": 29490 + }, + { + "epoch": 2.32, + "learning_rate": 3.6401330401443813e-05, + "loss": 1.5101, + "step": 29491 + }, + { + "epoch": 2.32, + "learning_rate": 3.639325941305043e-05, + "loss": 1.4246, + "step": 29492 + }, + { + "epoch": 2.32, + "learning_rate": 3.6385189195984113e-05, + "loss": 1.433, + "step": 29493 + }, + { + "epoch": 2.32, + "learning_rate": 3.637711975029971e-05, + "loss": 1.3702, + "step": 29494 + }, + { + "epoch": 2.32, + "learning_rate": 3.636905107605197e-05, + "loss": 1.4364, + "step": 29495 + }, + { + "epoch": 2.32, + "learning_rate": 3.6360983173295616e-05, + "loss": 1.479, + "step": 29496 + }, + { + "epoch": 2.32, + "learning_rate": 3.635291604208552e-05, + "loss": 1.4488, + "step": 29497 + }, + { + "epoch": 2.32, + "learning_rate": 3.634484968247641e-05, + "loss": 1.4499, + "step": 29498 + }, + { + "epoch": 2.32, + "learning_rate": 3.6336784094523006e-05, + "loss": 1.4428, + "step": 29499 + }, + { + "epoch": 2.32, + "learning_rate": 3.632871927828015e-05, + "loss": 1.432, + "step": 29500 + }, + { + "epoch": 2.32, + "learning_rate": 3.632065523380258e-05, + "loss": 1.443, + "step": 29501 + }, + { + "epoch": 2.32, + "learning_rate": 3.631259196114496e-05, + "loss": 1.4933, + "step": 29502 + }, + { + "epoch": 2.32, + "learning_rate": 3.630452946036216e-05, + "loss": 1.4219, + "step": 29503 + }, + { + "epoch": 2.32, + "learning_rate": 3.629646773150886e-05, + "loss": 1.4389, + "step": 29504 + }, + { + "epoch": 2.32, + "learning_rate": 3.628840677463979e-05, + "loss": 1.4124, + "step": 29505 + }, + { + "epoch": 2.32, + "learning_rate": 3.628034658980965e-05, + "loss": 1.467, + "step": 29506 + }, + { + "epoch": 2.32, + "learning_rate": 3.62722871770732e-05, + "loss": 1.5224, + "step": 29507 + }, + { + "epoch": 2.32, + "learning_rate": 3.626422853648521e-05, + "loss": 1.4278, + "step": 29508 + }, + { + "epoch": 2.32, + "learning_rate": 3.6256170668100346e-05, + "loss": 1.4651, + "step": 29509 + }, + { + "epoch": 2.32, + "learning_rate": 3.624811357197327e-05, + "loss": 1.3846, + "step": 29510 + }, + { + "epoch": 2.32, + "learning_rate": 3.624005724815875e-05, + "loss": 1.4665, + "step": 29511 + }, + { + "epoch": 2.32, + "learning_rate": 3.6232001696711485e-05, + "loss": 1.4301, + "step": 29512 + }, + { + "epoch": 2.32, + "learning_rate": 3.62239469176861e-05, + "loss": 1.4631, + "step": 29513 + }, + { + "epoch": 2.32, + "learning_rate": 3.621589291113737e-05, + "loss": 1.4405, + "step": 29514 + }, + { + "epoch": 2.32, + "learning_rate": 3.6207839677119936e-05, + "loss": 1.4491, + "step": 29515 + }, + { + "epoch": 2.32, + "learning_rate": 3.619978721568842e-05, + "loss": 1.4038, + "step": 29516 + }, + { + "epoch": 2.32, + "learning_rate": 3.61917355268976e-05, + "loss": 1.5074, + "step": 29517 + }, + { + "epoch": 2.32, + "learning_rate": 3.618368461080209e-05, + "loss": 1.489, + "step": 29518 + }, + { + "epoch": 2.32, + "learning_rate": 3.617563446745653e-05, + "loss": 1.447, + "step": 29519 + }, + { + "epoch": 2.32, + "learning_rate": 3.616758509691563e-05, + "loss": 1.4783, + "step": 29520 + }, + { + "epoch": 2.32, + "learning_rate": 3.615953649923399e-05, + "loss": 1.459, + "step": 29521 + }, + { + "epoch": 2.32, + "learning_rate": 3.6151488674466296e-05, + "loss": 1.4389, + "step": 29522 + }, + { + "epoch": 2.32, + "learning_rate": 3.614344162266707e-05, + "loss": 1.4781, + "step": 29523 + }, + { + "epoch": 2.32, + "learning_rate": 3.613539534389114e-05, + "loss": 1.4951, + "step": 29524 + }, + { + "epoch": 2.32, + "learning_rate": 3.612734983819302e-05, + "loss": 1.4523, + "step": 29525 + }, + { + "epoch": 2.32, + "learning_rate": 3.611930510562737e-05, + "loss": 1.3941, + "step": 29526 + }, + { + "epoch": 2.32, + "learning_rate": 3.611126114624875e-05, + "loss": 1.4907, + "step": 29527 + }, + { + "epoch": 2.32, + "learning_rate": 3.610321796011186e-05, + "loss": 1.4334, + "step": 29528 + }, + { + "epoch": 2.32, + "learning_rate": 3.609517554727127e-05, + "loss": 1.5313, + "step": 29529 + }, + { + "epoch": 2.32, + "learning_rate": 3.6087133907781526e-05, + "loss": 1.4385, + "step": 29530 + }, + { + "epoch": 2.32, + "learning_rate": 3.6079093041697344e-05, + "loss": 1.4553, + "step": 29531 + }, + { + "epoch": 2.32, + "learning_rate": 3.6071052949073234e-05, + "loss": 1.3935, + "step": 29532 + }, + { + "epoch": 2.32, + "learning_rate": 3.6063013629963765e-05, + "loss": 1.4913, + "step": 29533 + }, + { + "epoch": 2.32, + "learning_rate": 3.60549750844236e-05, + "loss": 1.4681, + "step": 29534 + }, + { + "epoch": 2.32, + "learning_rate": 3.604693731250729e-05, + "loss": 1.4885, + "step": 29535 + }, + { + "epoch": 2.32, + "learning_rate": 3.6038900314269333e-05, + "loss": 1.4289, + "step": 29536 + }, + { + "epoch": 2.32, + "learning_rate": 3.60308640897644e-05, + "loss": 1.4705, + "step": 29537 + }, + { + "epoch": 2.32, + "learning_rate": 3.6022828639047e-05, + "loss": 1.4327, + "step": 29538 + }, + { + "epoch": 2.32, + "learning_rate": 3.601479396217166e-05, + "loss": 1.4516, + "step": 29539 + }, + { + "epoch": 2.32, + "learning_rate": 3.6006760059192966e-05, + "loss": 1.4595, + "step": 29540 + }, + { + "epoch": 2.32, + "learning_rate": 3.5998726930165513e-05, + "loss": 1.4595, + "step": 29541 + }, + { + "epoch": 2.32, + "learning_rate": 3.599069457514378e-05, + "loss": 1.4192, + "step": 29542 + }, + { + "epoch": 2.32, + "learning_rate": 3.598266299418228e-05, + "loss": 1.4274, + "step": 29543 + }, + { + "epoch": 2.32, + "learning_rate": 3.597463218733562e-05, + "loss": 1.5064, + "step": 29544 + }, + { + "epoch": 2.32, + "learning_rate": 3.5966602154658276e-05, + "loss": 1.4181, + "step": 29545 + }, + { + "epoch": 2.32, + "learning_rate": 3.595857289620478e-05, + "loss": 1.4238, + "step": 29546 + }, + { + "epoch": 2.32, + "learning_rate": 3.595054441202961e-05, + "loss": 1.5065, + "step": 29547 + }, + { + "epoch": 2.32, + "learning_rate": 3.594251670218733e-05, + "loss": 1.4675, + "step": 29548 + }, + { + "epoch": 2.32, + "learning_rate": 3.593448976673243e-05, + "loss": 1.4663, + "step": 29549 + }, + { + "epoch": 2.33, + "learning_rate": 3.592646360571936e-05, + "loss": 1.4716, + "step": 29550 + }, + { + "epoch": 2.33, + "learning_rate": 3.591843821920268e-05, + "loss": 1.4568, + "step": 29551 + }, + { + "epoch": 2.33, + "learning_rate": 3.5910413607236846e-05, + "loss": 1.4712, + "step": 29552 + }, + { + "epoch": 2.33, + "learning_rate": 3.590238976987631e-05, + "loss": 1.4777, + "step": 29553 + }, + { + "epoch": 2.33, + "learning_rate": 3.589436670717559e-05, + "loss": 1.454, + "step": 29554 + }, + { + "epoch": 2.33, + "learning_rate": 3.588634441918918e-05, + "loss": 1.4624, + "step": 29555 + }, + { + "epoch": 2.33, + "learning_rate": 3.587832290597154e-05, + "loss": 1.4559, + "step": 29556 + }, + { + "epoch": 2.33, + "learning_rate": 3.587030216757705e-05, + "loss": 1.4479, + "step": 29557 + }, + { + "epoch": 2.33, + "learning_rate": 3.586228220406028e-05, + "loss": 1.4379, + "step": 29558 + }, + { + "epoch": 2.33, + "learning_rate": 3.585426301547562e-05, + "loss": 1.454, + "step": 29559 + }, + { + "epoch": 2.33, + "learning_rate": 3.584624460187747e-05, + "loss": 1.531, + "step": 29560 + }, + { + "epoch": 2.33, + "learning_rate": 3.583822696332039e-05, + "loss": 1.4301, + "step": 29561 + }, + { + "epoch": 2.33, + "learning_rate": 3.583021009985872e-05, + "loss": 1.4726, + "step": 29562 + }, + { + "epoch": 2.33, + "learning_rate": 3.582219401154694e-05, + "loss": 1.489, + "step": 29563 + }, + { + "epoch": 2.33, + "learning_rate": 3.581417869843941e-05, + "loss": 1.4338, + "step": 29564 + }, + { + "epoch": 2.33, + "learning_rate": 3.580616416059063e-05, + "loss": 1.4657, + "step": 29565 + }, + { + "epoch": 2.33, + "learning_rate": 3.5798150398054984e-05, + "loss": 1.4517, + "step": 29566 + }, + { + "epoch": 2.33, + "learning_rate": 3.5790137410886836e-05, + "loss": 1.4792, + "step": 29567 + }, + { + "epoch": 2.33, + "learning_rate": 3.578212519914066e-05, + "loss": 1.4874, + "step": 29568 + }, + { + "epoch": 2.33, + "learning_rate": 3.577411376287082e-05, + "loss": 1.5343, + "step": 29569 + }, + { + "epoch": 2.33, + "learning_rate": 3.5766103102131693e-05, + "loss": 1.444, + "step": 29570 + }, + { + "epoch": 2.33, + "learning_rate": 3.575809321697766e-05, + "loss": 1.4222, + "step": 29571 + }, + { + "epoch": 2.33, + "learning_rate": 3.575008410746318e-05, + "loss": 1.464, + "step": 29572 + }, + { + "epoch": 2.33, + "learning_rate": 3.57420757736426e-05, + "loss": 1.4307, + "step": 29573 + }, + { + "epoch": 2.33, + "learning_rate": 3.573406821557021e-05, + "loss": 1.4463, + "step": 29574 + }, + { + "epoch": 2.33, + "learning_rate": 3.5726061433300494e-05, + "loss": 1.4624, + "step": 29575 + }, + { + "epoch": 2.33, + "learning_rate": 3.571805542688774e-05, + "loss": 1.4635, + "step": 29576 + }, + { + "epoch": 2.33, + "learning_rate": 3.571005019638631e-05, + "loss": 1.4115, + "step": 29577 + }, + { + "epoch": 2.33, + "learning_rate": 3.570204574185058e-05, + "loss": 1.4472, + "step": 29578 + }, + { + "epoch": 2.33, + "learning_rate": 3.5694042063334906e-05, + "loss": 1.4264, + "step": 29579 + }, + { + "epoch": 2.33, + "learning_rate": 3.56860391608936e-05, + "loss": 1.4432, + "step": 29580 + }, + { + "epoch": 2.33, + "learning_rate": 3.567803703458097e-05, + "loss": 1.3925, + "step": 29581 + }, + { + "epoch": 2.33, + "learning_rate": 3.567003568445141e-05, + "loss": 1.4766, + "step": 29582 + }, + { + "epoch": 2.33, + "learning_rate": 3.566203511055922e-05, + "loss": 1.4544, + "step": 29583 + }, + { + "epoch": 2.33, + "learning_rate": 3.565403531295867e-05, + "loss": 1.4366, + "step": 29584 + }, + { + "epoch": 2.33, + "learning_rate": 3.564603629170416e-05, + "loss": 1.4256, + "step": 29585 + }, + { + "epoch": 2.33, + "learning_rate": 3.5638038046849925e-05, + "loss": 1.408, + "step": 29586 + }, + { + "epoch": 2.33, + "learning_rate": 3.563004057845034e-05, + "loss": 1.4617, + "step": 29587 + }, + { + "epoch": 2.33, + "learning_rate": 3.562204388655962e-05, + "loss": 1.4611, + "step": 29588 + }, + { + "epoch": 2.33, + "learning_rate": 3.561404797123215e-05, + "loss": 1.4919, + "step": 29589 + }, + { + "epoch": 2.33, + "learning_rate": 3.560605283252217e-05, + "loss": 1.4122, + "step": 29590 + }, + { + "epoch": 2.33, + "learning_rate": 3.5598058470483914e-05, + "loss": 1.4594, + "step": 29591 + }, + { + "epoch": 2.33, + "learning_rate": 3.559006488517176e-05, + "loss": 1.4706, + "step": 29592 + }, + { + "epoch": 2.33, + "learning_rate": 3.558207207663993e-05, + "loss": 1.4812, + "step": 29593 + }, + { + "epoch": 2.33, + "learning_rate": 3.557408004494264e-05, + "loss": 1.499, + "step": 29594 + }, + { + "epoch": 2.33, + "learning_rate": 3.5566088790134246e-05, + "loss": 1.4414, + "step": 29595 + }, + { + "epoch": 2.33, + "learning_rate": 3.555809831226896e-05, + "loss": 1.4927, + "step": 29596 + }, + { + "epoch": 2.33, + "learning_rate": 3.5550108611400984e-05, + "loss": 1.4578, + "step": 29597 + }, + { + "epoch": 2.33, + "learning_rate": 3.554211968758465e-05, + "loss": 1.4296, + "step": 29598 + }, + { + "epoch": 2.33, + "learning_rate": 3.553413154087418e-05, + "loss": 1.4729, + "step": 29599 + }, + { + "epoch": 2.33, + "learning_rate": 3.552614417132378e-05, + "loss": 1.4442, + "step": 29600 + }, + { + "epoch": 2.33, + "learning_rate": 3.551815757898765e-05, + "loss": 1.4548, + "step": 29601 + }, + { + "epoch": 2.33, + "learning_rate": 3.551017176392004e-05, + "loss": 1.4555, + "step": 29602 + }, + { + "epoch": 2.33, + "learning_rate": 3.550218672617524e-05, + "loss": 1.4646, + "step": 29603 + }, + { + "epoch": 2.33, + "learning_rate": 3.54942024658074e-05, + "loss": 1.4541, + "step": 29604 + }, + { + "epoch": 2.33, + "learning_rate": 3.5486218982870694e-05, + "loss": 1.461, + "step": 29605 + }, + { + "epoch": 2.33, + "learning_rate": 3.5478236277419405e-05, + "loss": 1.4468, + "step": 29606 + }, + { + "epoch": 2.33, + "learning_rate": 3.5470254349507694e-05, + "loss": 1.4808, + "step": 29607 + }, + { + "epoch": 2.33, + "learning_rate": 3.5462273199189725e-05, + "loss": 1.4288, + "step": 29608 + }, + { + "epoch": 2.33, + "learning_rate": 3.545429282651975e-05, + "loss": 1.4555, + "step": 29609 + }, + { + "epoch": 2.33, + "learning_rate": 3.544631323155191e-05, + "loss": 1.4589, + "step": 29610 + }, + { + "epoch": 2.33, + "learning_rate": 3.5438334414340344e-05, + "loss": 1.5048, + "step": 29611 + }, + { + "epoch": 2.33, + "learning_rate": 3.5430356374939315e-05, + "loss": 1.4504, + "step": 29612 + }, + { + "epoch": 2.33, + "learning_rate": 3.542237911340293e-05, + "loss": 1.4869, + "step": 29613 + }, + { + "epoch": 2.33, + "learning_rate": 3.541440262978533e-05, + "loss": 1.4665, + "step": 29614 + }, + { + "epoch": 2.33, + "learning_rate": 3.540642692414074e-05, + "loss": 1.4656, + "step": 29615 + }, + { + "epoch": 2.33, + "learning_rate": 3.5398451996523274e-05, + "loss": 1.3916, + "step": 29616 + }, + { + "epoch": 2.33, + "learning_rate": 3.539047784698704e-05, + "loss": 1.4829, + "step": 29617 + }, + { + "epoch": 2.33, + "learning_rate": 3.538250447558622e-05, + "loss": 1.5455, + "step": 29618 + }, + { + "epoch": 2.33, + "learning_rate": 3.5374531882374966e-05, + "loss": 1.4134, + "step": 29619 + }, + { + "epoch": 2.33, + "learning_rate": 3.536656006740741e-05, + "loss": 1.4495, + "step": 29620 + }, + { + "epoch": 2.33, + "learning_rate": 3.535858903073762e-05, + "loss": 1.4789, + "step": 29621 + }, + { + "epoch": 2.33, + "learning_rate": 3.535061877241972e-05, + "loss": 1.4761, + "step": 29622 + }, + { + "epoch": 2.33, + "learning_rate": 3.534264929250791e-05, + "loss": 1.4609, + "step": 29623 + }, + { + "epoch": 2.33, + "learning_rate": 3.533468059105621e-05, + "loss": 1.4217, + "step": 29624 + }, + { + "epoch": 2.33, + "learning_rate": 3.532671266811871e-05, + "loss": 1.4289, + "step": 29625 + }, + { + "epoch": 2.33, + "learning_rate": 3.531874552374961e-05, + "loss": 1.4431, + "step": 29626 + }, + { + "epoch": 2.33, + "learning_rate": 3.531077915800294e-05, + "loss": 1.496, + "step": 29627 + }, + { + "epoch": 2.33, + "learning_rate": 3.5302813570932725e-05, + "loss": 1.4204, + "step": 29628 + }, + { + "epoch": 2.33, + "learning_rate": 3.529484876259317e-05, + "loss": 1.4972, + "step": 29629 + }, + { + "epoch": 2.33, + "learning_rate": 3.5286884733038297e-05, + "loss": 1.449, + "step": 29630 + }, + { + "epoch": 2.33, + "learning_rate": 3.5278921482322125e-05, + "loss": 1.4871, + "step": 29631 + }, + { + "epoch": 2.33, + "learning_rate": 3.527095901049881e-05, + "loss": 1.4786, + "step": 29632 + }, + { + "epoch": 2.33, + "learning_rate": 3.526299731762233e-05, + "loss": 1.421, + "step": 29633 + }, + { + "epoch": 2.33, + "learning_rate": 3.525503640374681e-05, + "loss": 1.4878, + "step": 29634 + }, + { + "epoch": 2.33, + "learning_rate": 3.5247076268926236e-05, + "loss": 1.4713, + "step": 29635 + }, + { + "epoch": 2.33, + "learning_rate": 3.523911691321473e-05, + "loss": 1.4545, + "step": 29636 + }, + { + "epoch": 2.33, + "learning_rate": 3.52311583366663e-05, + "loss": 1.3995, + "step": 29637 + }, + { + "epoch": 2.33, + "learning_rate": 3.522320053933495e-05, + "loss": 1.4813, + "step": 29638 + }, + { + "epoch": 2.33, + "learning_rate": 3.521524352127471e-05, + "loss": 1.4713, + "step": 29639 + }, + { + "epoch": 2.33, + "learning_rate": 3.520728728253965e-05, + "loss": 1.4417, + "step": 29640 + }, + { + "epoch": 2.33, + "learning_rate": 3.519933182318377e-05, + "loss": 1.463, + "step": 29641 + }, + { + "epoch": 2.33, + "learning_rate": 3.519137714326103e-05, + "loss": 1.4434, + "step": 29642 + }, + { + "epoch": 2.33, + "learning_rate": 3.5183423242825524e-05, + "loss": 1.5056, + "step": 29643 + }, + { + "epoch": 2.33, + "learning_rate": 3.517547012193122e-05, + "loss": 1.4312, + "step": 29644 + }, + { + "epoch": 2.33, + "learning_rate": 3.5167517780632054e-05, + "loss": 1.4398, + "step": 29645 + }, + { + "epoch": 2.33, + "learning_rate": 3.5159566218982115e-05, + "loss": 1.4363, + "step": 29646 + }, + { + "epoch": 2.33, + "learning_rate": 3.515161543703536e-05, + "loss": 1.452, + "step": 29647 + }, + { + "epoch": 2.33, + "learning_rate": 3.51436654348457e-05, + "loss": 1.4242, + "step": 29648 + }, + { + "epoch": 2.33, + "learning_rate": 3.513571621246719e-05, + "loss": 1.4005, + "step": 29649 + }, + { + "epoch": 2.33, + "learning_rate": 3.51277677699538e-05, + "loss": 1.4196, + "step": 29650 + }, + { + "epoch": 2.33, + "learning_rate": 3.511982010735949e-05, + "loss": 1.4581, + "step": 29651 + }, + { + "epoch": 2.33, + "learning_rate": 3.5111873224738154e-05, + "loss": 1.4531, + "step": 29652 + }, + { + "epoch": 2.33, + "learning_rate": 3.510392712214384e-05, + "loss": 1.4129, + "step": 29653 + }, + { + "epoch": 2.33, + "learning_rate": 3.5095981799630455e-05, + "loss": 1.4571, + "step": 29654 + }, + { + "epoch": 2.33, + "learning_rate": 3.508803725725192e-05, + "loss": 1.4592, + "step": 29655 + }, + { + "epoch": 2.33, + "learning_rate": 3.508009349506222e-05, + "loss": 1.3963, + "step": 29656 + }, + { + "epoch": 2.33, + "learning_rate": 3.507215051311528e-05, + "loss": 1.4715, + "step": 29657 + }, + { + "epoch": 2.33, + "learning_rate": 3.5064208311465e-05, + "loss": 1.5005, + "step": 29658 + }, + { + "epoch": 2.33, + "learning_rate": 3.5056266890165293e-05, + "loss": 1.4334, + "step": 29659 + }, + { + "epoch": 2.33, + "learning_rate": 3.504832624927013e-05, + "loss": 1.443, + "step": 29660 + }, + { + "epoch": 2.33, + "learning_rate": 3.5040386388833414e-05, + "loss": 1.3982, + "step": 29661 + }, + { + "epoch": 2.33, + "learning_rate": 3.503244730890898e-05, + "loss": 1.4995, + "step": 29662 + }, + { + "epoch": 2.33, + "learning_rate": 3.502450900955082e-05, + "loss": 1.5131, + "step": 29663 + }, + { + "epoch": 2.33, + "learning_rate": 3.501657149081277e-05, + "loss": 1.4724, + "step": 29664 + }, + { + "epoch": 2.33, + "learning_rate": 3.500863475274877e-05, + "loss": 1.4594, + "step": 29665 + }, + { + "epoch": 2.33, + "learning_rate": 3.500069879541266e-05, + "loss": 1.4193, + "step": 29666 + }, + { + "epoch": 2.33, + "learning_rate": 3.4992763618858385e-05, + "loss": 1.491, + "step": 29667 + }, + { + "epoch": 2.33, + "learning_rate": 3.4984829223139754e-05, + "loss": 1.4821, + "step": 29668 + }, + { + "epoch": 2.33, + "learning_rate": 3.497689560831064e-05, + "loss": 1.4713, + "step": 29669 + }, + { + "epoch": 2.33, + "learning_rate": 3.4968962774424964e-05, + "loss": 1.4549, + "step": 29670 + }, + { + "epoch": 2.33, + "learning_rate": 3.496103072153657e-05, + "loss": 1.4074, + "step": 29671 + }, + { + "epoch": 2.33, + "learning_rate": 3.4953099449699224e-05, + "loss": 1.5109, + "step": 29672 + }, + { + "epoch": 2.33, + "learning_rate": 3.49451689589669e-05, + "loss": 1.403, + "step": 29673 + }, + { + "epoch": 2.33, + "learning_rate": 3.493723924939339e-05, + "loss": 1.4242, + "step": 29674 + }, + { + "epoch": 2.33, + "learning_rate": 3.4929310321032526e-05, + "loss": 1.4424, + "step": 29675 + }, + { + "epoch": 2.33, + "learning_rate": 3.49213821739381e-05, + "loss": 1.4288, + "step": 29676 + }, + { + "epoch": 2.34, + "learning_rate": 3.491345480816403e-05, + "loss": 1.4424, + "step": 29677 + }, + { + "epoch": 2.34, + "learning_rate": 3.490552822376408e-05, + "loss": 1.4373, + "step": 29678 + }, + { + "epoch": 2.34, + "learning_rate": 3.4897602420792045e-05, + "loss": 1.464, + "step": 29679 + }, + { + "epoch": 2.34, + "learning_rate": 3.488967739930176e-05, + "loss": 1.4398, + "step": 29680 + }, + { + "epoch": 2.34, + "learning_rate": 3.48817531593471e-05, + "loss": 1.4675, + "step": 29681 + }, + { + "epoch": 2.34, + "learning_rate": 3.487382970098181e-05, + "loss": 1.4637, + "step": 29682 + }, + { + "epoch": 2.34, + "learning_rate": 3.486590702425964e-05, + "loss": 1.4222, + "step": 29683 + }, + { + "epoch": 2.34, + "learning_rate": 3.4857985129234456e-05, + "loss": 1.456, + "step": 29684 + }, + { + "epoch": 2.34, + "learning_rate": 3.485006401596002e-05, + "loss": 1.4367, + "step": 29685 + }, + { + "epoch": 2.34, + "learning_rate": 3.4842143684490056e-05, + "loss": 1.3734, + "step": 29686 + }, + { + "epoch": 2.34, + "learning_rate": 3.483422413487844e-05, + "loss": 1.423, + "step": 29687 + }, + { + "epoch": 2.34, + "learning_rate": 3.482630536717887e-05, + "loss": 1.4814, + "step": 29688 + }, + { + "epoch": 2.34, + "learning_rate": 3.48183873814451e-05, + "loss": 1.4212, + "step": 29689 + }, + { + "epoch": 2.34, + "learning_rate": 3.481047017773096e-05, + "loss": 1.4796, + "step": 29690 + }, + { + "epoch": 2.34, + "learning_rate": 3.480255375609017e-05, + "loss": 1.5108, + "step": 29691 + }, + { + "epoch": 2.34, + "learning_rate": 3.479463811657645e-05, + "loss": 1.4182, + "step": 29692 + }, + { + "epoch": 2.34, + "learning_rate": 3.4786723259243534e-05, + "loss": 1.4203, + "step": 29693 + }, + { + "epoch": 2.34, + "learning_rate": 3.4778809184145225e-05, + "loss": 1.4516, + "step": 29694 + }, + { + "epoch": 2.34, + "learning_rate": 3.477089589133521e-05, + "loss": 1.5071, + "step": 29695 + }, + { + "epoch": 2.34, + "learning_rate": 3.476298338086715e-05, + "loss": 1.4385, + "step": 29696 + }, + { + "epoch": 2.34, + "learning_rate": 3.475507165279491e-05, + "loss": 1.4786, + "step": 29697 + }, + { + "epoch": 2.34, + "learning_rate": 3.474716070717215e-05, + "loss": 1.3884, + "step": 29698 + }, + { + "epoch": 2.34, + "learning_rate": 3.4739250544052546e-05, + "loss": 1.4688, + "step": 29699 + }, + { + "epoch": 2.34, + "learning_rate": 3.47313411634898e-05, + "loss": 1.4475, + "step": 29700 + }, + { + "epoch": 2.34, + "learning_rate": 3.4723432565537676e-05, + "loss": 1.4395, + "step": 29701 + }, + { + "epoch": 2.34, + "learning_rate": 3.471552475024984e-05, + "loss": 1.5443, + "step": 29702 + }, + { + "epoch": 2.34, + "learning_rate": 3.470761771767992e-05, + "loss": 1.4227, + "step": 29703 + }, + { + "epoch": 2.34, + "learning_rate": 3.4699711467881694e-05, + "loss": 1.4416, + "step": 29704 + }, + { + "epoch": 2.34, + "learning_rate": 3.4691806000908794e-05, + "loss": 1.4049, + "step": 29705 + }, + { + "epoch": 2.34, + "learning_rate": 3.4683901316814864e-05, + "loss": 1.4156, + "step": 29706 + }, + { + "epoch": 2.34, + "learning_rate": 3.4675997415653646e-05, + "loss": 1.4211, + "step": 29707 + }, + { + "epoch": 2.34, + "learning_rate": 3.466809429747877e-05, + "loss": 1.4797, + "step": 29708 + }, + { + "epoch": 2.34, + "learning_rate": 3.4660191962343845e-05, + "loss": 1.4944, + "step": 29709 + }, + { + "epoch": 2.34, + "learning_rate": 3.465229041030261e-05, + "loss": 1.4388, + "step": 29710 + }, + { + "epoch": 2.34, + "learning_rate": 3.464438964140866e-05, + "loss": 1.4269, + "step": 29711 + }, + { + "epoch": 2.34, + "learning_rate": 3.463648965571561e-05, + "loss": 1.4703, + "step": 29712 + }, + { + "epoch": 2.34, + "learning_rate": 3.462859045327714e-05, + "loss": 1.4249, + "step": 29713 + }, + { + "epoch": 2.34, + "learning_rate": 3.4620692034146904e-05, + "loss": 1.4091, + "step": 29714 + }, + { + "epoch": 2.34, + "learning_rate": 3.461279439837849e-05, + "loss": 1.4814, + "step": 29715 + }, + { + "epoch": 2.34, + "learning_rate": 3.460489754602554e-05, + "loss": 1.4713, + "step": 29716 + }, + { + "epoch": 2.34, + "learning_rate": 3.4597001477141605e-05, + "loss": 1.4032, + "step": 29717 + }, + { + "epoch": 2.34, + "learning_rate": 3.4589106191780396e-05, + "loss": 1.4644, + "step": 29718 + }, + { + "epoch": 2.34, + "learning_rate": 3.4581211689995475e-05, + "loss": 1.4113, + "step": 29719 + }, + { + "epoch": 2.34, + "learning_rate": 3.457331797184038e-05, + "loss": 1.4579, + "step": 29720 + }, + { + "epoch": 2.34, + "learning_rate": 3.456542503736879e-05, + "loss": 1.4775, + "step": 29721 + }, + { + "epoch": 2.34, + "learning_rate": 3.455753288663427e-05, + "loss": 1.4479, + "step": 29722 + }, + { + "epoch": 2.34, + "learning_rate": 3.454964151969037e-05, + "loss": 1.4576, + "step": 29723 + }, + { + "epoch": 2.34, + "learning_rate": 3.454175093659071e-05, + "loss": 1.4159, + "step": 29724 + }, + { + "epoch": 2.34, + "learning_rate": 3.453386113738886e-05, + "loss": 1.4876, + "step": 29725 + }, + { + "epoch": 2.34, + "learning_rate": 3.452597212213833e-05, + "loss": 1.4548, + "step": 29726 + }, + { + "epoch": 2.34, + "learning_rate": 3.451808389089271e-05, + "loss": 1.4977, + "step": 29727 + }, + { + "epoch": 2.34, + "learning_rate": 3.451019644370563e-05, + "loss": 1.43, + "step": 29728 + }, + { + "epoch": 2.34, + "learning_rate": 3.450230978063059e-05, + "loss": 1.4554, + "step": 29729 + }, + { + "epoch": 2.34, + "learning_rate": 3.449442390172108e-05, + "loss": 1.4805, + "step": 29730 + }, + { + "epoch": 2.34, + "learning_rate": 3.4486538807030725e-05, + "loss": 1.4061, + "step": 29731 + }, + { + "epoch": 2.34, + "learning_rate": 3.447865449661304e-05, + "loss": 1.5178, + "step": 29732 + }, + { + "epoch": 2.34, + "learning_rate": 3.447077097052152e-05, + "loss": 1.4181, + "step": 29733 + }, + { + "epoch": 2.34, + "learning_rate": 3.44628882288097e-05, + "loss": 1.4646, + "step": 29734 + }, + { + "epoch": 2.34, + "learning_rate": 3.445500627153113e-05, + "loss": 1.4547, + "step": 29735 + }, + { + "epoch": 2.34, + "learning_rate": 3.44471250987393e-05, + "loss": 1.4209, + "step": 29736 + }, + { + "epoch": 2.34, + "learning_rate": 3.44392447104877e-05, + "loss": 1.4063, + "step": 29737 + }, + { + "epoch": 2.34, + "learning_rate": 3.443136510682988e-05, + "loss": 1.4589, + "step": 29738 + }, + { + "epoch": 2.34, + "learning_rate": 3.442348628781934e-05, + "loss": 1.4704, + "step": 29739 + }, + { + "epoch": 2.34, + "learning_rate": 3.441560825350948e-05, + "loss": 1.4716, + "step": 29740 + }, + { + "epoch": 2.34, + "learning_rate": 3.4407731003953906e-05, + "loss": 1.5079, + "step": 29741 + }, + { + "epoch": 2.34, + "learning_rate": 3.4399854539206046e-05, + "loss": 1.4379, + "step": 29742 + }, + { + "epoch": 2.34, + "learning_rate": 3.439197885931935e-05, + "loss": 1.4546, + "step": 29743 + }, + { + "epoch": 2.34, + "learning_rate": 3.43841039643473e-05, + "loss": 1.4211, + "step": 29744 + }, + { + "epoch": 2.34, + "learning_rate": 3.437622985434344e-05, + "loss": 1.4027, + "step": 29745 + }, + { + "epoch": 2.34, + "learning_rate": 3.436835652936116e-05, + "loss": 1.471, + "step": 29746 + }, + { + "epoch": 2.34, + "learning_rate": 3.4360483989453905e-05, + "loss": 1.5049, + "step": 29747 + }, + { + "epoch": 2.34, + "learning_rate": 3.435261223467518e-05, + "loss": 1.4883, + "step": 29748 + }, + { + "epoch": 2.34, + "learning_rate": 3.434474126507841e-05, + "loss": 1.5152, + "step": 29749 + }, + { + "epoch": 2.34, + "learning_rate": 3.433687108071701e-05, + "loss": 1.4324, + "step": 29750 + }, + { + "epoch": 2.34, + "learning_rate": 3.432900168164438e-05, + "loss": 1.4703, + "step": 29751 + }, + { + "epoch": 2.34, + "learning_rate": 3.432113306791404e-05, + "loss": 1.4594, + "step": 29752 + }, + { + "epoch": 2.34, + "learning_rate": 3.4313265239579386e-05, + "loss": 1.438, + "step": 29753 + }, + { + "epoch": 2.34, + "learning_rate": 3.430539819669377e-05, + "loss": 1.469, + "step": 29754 + }, + { + "epoch": 2.34, + "learning_rate": 3.429753193931068e-05, + "loss": 1.4318, + "step": 29755 + }, + { + "epoch": 2.34, + "learning_rate": 3.428966646748351e-05, + "loss": 1.4832, + "step": 29756 + }, + { + "epoch": 2.34, + "learning_rate": 3.428180178126562e-05, + "loss": 1.4182, + "step": 29757 + }, + { + "epoch": 2.34, + "learning_rate": 3.427393788071047e-05, + "loss": 1.4552, + "step": 29758 + }, + { + "epoch": 2.34, + "learning_rate": 3.426607476587137e-05, + "loss": 1.4946, + "step": 29759 + }, + { + "epoch": 2.34, + "learning_rate": 3.425821243680181e-05, + "loss": 1.4513, + "step": 29760 + }, + { + "epoch": 2.34, + "learning_rate": 3.425035089355507e-05, + "loss": 1.4439, + "step": 29761 + }, + { + "epoch": 2.34, + "learning_rate": 3.424249013618461e-05, + "loss": 1.4622, + "step": 29762 + }, + { + "epoch": 2.34, + "learning_rate": 3.4234630164743756e-05, + "loss": 1.4539, + "step": 29763 + }, + { + "epoch": 2.34, + "learning_rate": 3.4226770979285846e-05, + "loss": 1.3995, + "step": 29764 + }, + { + "epoch": 2.34, + "learning_rate": 3.421891257986431e-05, + "loss": 1.4373, + "step": 29765 + }, + { + "epoch": 2.34, + "learning_rate": 3.421105496653246e-05, + "loss": 1.4935, + "step": 29766 + }, + { + "epoch": 2.34, + "learning_rate": 3.4203198139343614e-05, + "loss": 1.4552, + "step": 29767 + }, + { + "epoch": 2.34, + "learning_rate": 3.4195342098351194e-05, + "loss": 1.459, + "step": 29768 + }, + { + "epoch": 2.34, + "learning_rate": 3.418748684360849e-05, + "loss": 1.4261, + "step": 29769 + }, + { + "epoch": 2.34, + "learning_rate": 3.417963237516884e-05, + "loss": 1.4644, + "step": 29770 + }, + { + "epoch": 2.34, + "learning_rate": 3.417177869308553e-05, + "loss": 1.4791, + "step": 29771 + }, + { + "epoch": 2.34, + "learning_rate": 3.416392579741197e-05, + "loss": 1.4668, + "step": 29772 + }, + { + "epoch": 2.34, + "learning_rate": 3.415607368820143e-05, + "loss": 1.4569, + "step": 29773 + }, + { + "epoch": 2.34, + "learning_rate": 3.414822236550718e-05, + "loss": 1.4651, + "step": 29774 + }, + { + "epoch": 2.34, + "learning_rate": 3.414037182938255e-05, + "loss": 1.4398, + "step": 29775 + }, + { + "epoch": 2.34, + "learning_rate": 3.4132522079880925e-05, + "loss": 1.4328, + "step": 29776 + }, + { + "epoch": 2.34, + "learning_rate": 3.412467311705552e-05, + "loss": 1.4051, + "step": 29777 + }, + { + "epoch": 2.34, + "learning_rate": 3.41168249409596e-05, + "loss": 1.3877, + "step": 29778 + }, + { + "epoch": 2.34, + "learning_rate": 3.4108977551646536e-05, + "loss": 1.4924, + "step": 29779 + }, + { + "epoch": 2.34, + "learning_rate": 3.4101130949169556e-05, + "loss": 1.4936, + "step": 29780 + }, + { + "epoch": 2.34, + "learning_rate": 3.4093285133581887e-05, + "loss": 1.4438, + "step": 29781 + }, + { + "epoch": 2.34, + "learning_rate": 3.408544010493692e-05, + "loss": 1.4648, + "step": 29782 + }, + { + "epoch": 2.34, + "learning_rate": 3.4077595863287815e-05, + "loss": 1.4347, + "step": 29783 + }, + { + "epoch": 2.34, + "learning_rate": 3.406975240868784e-05, + "loss": 1.4427, + "step": 29784 + }, + { + "epoch": 2.34, + "learning_rate": 3.406190974119031e-05, + "loss": 1.4551, + "step": 29785 + }, + { + "epoch": 2.34, + "learning_rate": 3.405406786084843e-05, + "loss": 1.4499, + "step": 29786 + }, + { + "epoch": 2.34, + "learning_rate": 3.404622676771544e-05, + "loss": 1.4745, + "step": 29787 + }, + { + "epoch": 2.34, + "learning_rate": 3.403838646184454e-05, + "loss": 1.4705, + "step": 29788 + }, + { + "epoch": 2.34, + "learning_rate": 3.403054694328906e-05, + "loss": 1.46, + "step": 29789 + }, + { + "epoch": 2.34, + "learning_rate": 3.402270821210212e-05, + "loss": 1.483, + "step": 29790 + }, + { + "epoch": 2.34, + "learning_rate": 3.401487026833702e-05, + "loss": 1.4815, + "step": 29791 + }, + { + "epoch": 2.34, + "learning_rate": 3.400703311204692e-05, + "loss": 1.4527, + "step": 29792 + }, + { + "epoch": 2.34, + "learning_rate": 3.399919674328509e-05, + "loss": 1.4409, + "step": 29793 + }, + { + "epoch": 2.34, + "learning_rate": 3.39913611621047e-05, + "loss": 1.4208, + "step": 29794 + }, + { + "epoch": 2.34, + "learning_rate": 3.39835263685589e-05, + "loss": 1.3996, + "step": 29795 + }, + { + "epoch": 2.34, + "learning_rate": 3.397569236270097e-05, + "loss": 1.4749, + "step": 29796 + }, + { + "epoch": 2.34, + "learning_rate": 3.396785914458408e-05, + "loss": 1.4938, + "step": 29797 + }, + { + "epoch": 2.34, + "learning_rate": 3.396002671426134e-05, + "loss": 1.4517, + "step": 29798 + }, + { + "epoch": 2.34, + "learning_rate": 3.3952195071786025e-05, + "loss": 1.4637, + "step": 29799 + }, + { + "epoch": 2.34, + "learning_rate": 3.3944364217211274e-05, + "loss": 1.4086, + "step": 29800 + }, + { + "epoch": 2.34, + "learning_rate": 3.39365341505902e-05, + "loss": 1.449, + "step": 29801 + }, + { + "epoch": 2.34, + "learning_rate": 3.3928704871976045e-05, + "loss": 1.4683, + "step": 29802 + }, + { + "epoch": 2.34, + "learning_rate": 3.392087638142194e-05, + "loss": 1.459, + "step": 29803 + }, + { + "epoch": 2.35, + "learning_rate": 3.3913048678981024e-05, + "loss": 1.4471, + "step": 29804 + }, + { + "epoch": 2.35, + "learning_rate": 3.390522176470639e-05, + "loss": 1.4511, + "step": 29805 + }, + { + "epoch": 2.35, + "learning_rate": 3.3897395638651246e-05, + "loss": 1.4212, + "step": 29806 + }, + { + "epoch": 2.35, + "learning_rate": 3.3889570300868765e-05, + "loss": 1.4681, + "step": 29807 + }, + { + "epoch": 2.35, + "learning_rate": 3.3881745751411975e-05, + "loss": 1.4381, + "step": 29808 + }, + { + "epoch": 2.35, + "learning_rate": 3.3873921990334095e-05, + "loss": 1.4719, + "step": 29809 + }, + { + "epoch": 2.35, + "learning_rate": 3.3866099017688204e-05, + "loss": 1.4543, + "step": 29810 + }, + { + "epoch": 2.35, + "learning_rate": 3.38582768335274e-05, + "loss": 1.4983, + "step": 29811 + }, + { + "epoch": 2.35, + "learning_rate": 3.385045543790477e-05, + "loss": 1.4836, + "step": 29812 + }, + { + "epoch": 2.35, + "learning_rate": 3.3842634830873496e-05, + "loss": 1.4598, + "step": 29813 + }, + { + "epoch": 2.35, + "learning_rate": 3.3834815012486625e-05, + "loss": 1.4043, + "step": 29814 + }, + { + "epoch": 2.35, + "learning_rate": 3.382699598279723e-05, + "loss": 1.4236, + "step": 29815 + }, + { + "epoch": 2.35, + "learning_rate": 3.3819177741858445e-05, + "loss": 1.4534, + "step": 29816 + }, + { + "epoch": 2.35, + "learning_rate": 3.3811360289723334e-05, + "loss": 1.419, + "step": 29817 + }, + { + "epoch": 2.35, + "learning_rate": 3.3803543626444934e-05, + "loss": 1.4444, + "step": 29818 + }, + { + "epoch": 2.35, + "learning_rate": 3.379572775207637e-05, + "loss": 1.477, + "step": 29819 + }, + { + "epoch": 2.35, + "learning_rate": 3.378791266667071e-05, + "loss": 1.5221, + "step": 29820 + }, + { + "epoch": 2.35, + "learning_rate": 3.378009837028095e-05, + "loss": 1.4329, + "step": 29821 + }, + { + "epoch": 2.35, + "learning_rate": 3.3772284862960173e-05, + "loss": 1.5175, + "step": 29822 + }, + { + "epoch": 2.35, + "learning_rate": 3.376447214476149e-05, + "loss": 1.4436, + "step": 29823 + }, + { + "epoch": 2.35, + "learning_rate": 3.3756660215737915e-05, + "loss": 1.4901, + "step": 29824 + }, + { + "epoch": 2.35, + "learning_rate": 3.3748849075942404e-05, + "loss": 1.4539, + "step": 29825 + }, + { + "epoch": 2.35, + "learning_rate": 3.37410387254281e-05, + "loss": 1.4524, + "step": 29826 + }, + { + "epoch": 2.35, + "learning_rate": 3.373322916424799e-05, + "loss": 1.3772, + "step": 29827 + }, + { + "epoch": 2.35, + "learning_rate": 3.372542039245509e-05, + "loss": 1.4833, + "step": 29828 + }, + { + "epoch": 2.35, + "learning_rate": 3.3717612410102375e-05, + "loss": 1.4376, + "step": 29829 + }, + { + "epoch": 2.35, + "learning_rate": 3.370980521724296e-05, + "loss": 1.433, + "step": 29830 + }, + { + "epoch": 2.35, + "learning_rate": 3.370199881392977e-05, + "loss": 1.4381, + "step": 29831 + }, + { + "epoch": 2.35, + "learning_rate": 3.36941932002158e-05, + "loss": 1.4541, + "step": 29832 + }, + { + "epoch": 2.35, + "learning_rate": 3.368638837615413e-05, + "loss": 1.4253, + "step": 29833 + }, + { + "epoch": 2.35, + "learning_rate": 3.367858434179767e-05, + "loss": 1.4469, + "step": 29834 + }, + { + "epoch": 2.35, + "learning_rate": 3.367078109719941e-05, + "loss": 1.4766, + "step": 29835 + }, + { + "epoch": 2.35, + "learning_rate": 3.366297864241237e-05, + "loss": 1.3989, + "step": 29836 + }, + { + "epoch": 2.35, + "learning_rate": 3.365517697748948e-05, + "loss": 1.4306, + "step": 29837 + }, + { + "epoch": 2.35, + "learning_rate": 3.364737610248378e-05, + "loss": 1.4414, + "step": 29838 + }, + { + "epoch": 2.35, + "learning_rate": 3.363957601744814e-05, + "loss": 1.4451, + "step": 29839 + }, + { + "epoch": 2.35, + "learning_rate": 3.36317767224356e-05, + "loss": 1.4382, + "step": 29840 + }, + { + "epoch": 2.35, + "learning_rate": 3.3623978217499096e-05, + "loss": 1.435, + "step": 29841 + }, + { + "epoch": 2.35, + "learning_rate": 3.3616180502691507e-05, + "loss": 1.4235, + "step": 29842 + }, + { + "epoch": 2.35, + "learning_rate": 3.3608383578065856e-05, + "loss": 1.4615, + "step": 29843 + }, + { + "epoch": 2.35, + "learning_rate": 3.360058744367507e-05, + "loss": 1.4365, + "step": 29844 + }, + { + "epoch": 2.35, + "learning_rate": 3.359279209957204e-05, + "loss": 1.5141, + "step": 29845 + }, + { + "epoch": 2.35, + "learning_rate": 3.35849975458097e-05, + "loss": 1.4068, + "step": 29846 + }, + { + "epoch": 2.35, + "learning_rate": 3.3577203782440996e-05, + "loss": 1.4147, + "step": 29847 + }, + { + "epoch": 2.35, + "learning_rate": 3.3569410809518846e-05, + "loss": 1.4577, + "step": 29848 + }, + { + "epoch": 2.35, + "learning_rate": 3.35616186270961e-05, + "loss": 1.503, + "step": 29849 + }, + { + "epoch": 2.35, + "learning_rate": 3.355382723522576e-05, + "loss": 1.5186, + "step": 29850 + }, + { + "epoch": 2.35, + "learning_rate": 3.3546036633960656e-05, + "loss": 1.4588, + "step": 29851 + }, + { + "epoch": 2.35, + "learning_rate": 3.3538246823353656e-05, + "loss": 1.4237, + "step": 29852 + }, + { + "epoch": 2.35, + "learning_rate": 3.353045780345771e-05, + "loss": 1.5027, + "step": 29853 + }, + { + "epoch": 2.35, + "learning_rate": 3.35226695743257e-05, + "loss": 1.4356, + "step": 29854 + }, + { + "epoch": 2.35, + "learning_rate": 3.3514882136010504e-05, + "loss": 1.483, + "step": 29855 + }, + { + "epoch": 2.35, + "learning_rate": 3.350709548856492e-05, + "loss": 1.4397, + "step": 29856 + }, + { + "epoch": 2.35, + "learning_rate": 3.3499309632041936e-05, + "loss": 1.4828, + "step": 29857 + }, + { + "epoch": 2.35, + "learning_rate": 3.3491524566494336e-05, + "loss": 1.4846, + "step": 29858 + }, + { + "epoch": 2.35, + "learning_rate": 3.348374029197495e-05, + "loss": 1.4592, + "step": 29859 + }, + { + "epoch": 2.35, + "learning_rate": 3.3475956808536705e-05, + "loss": 1.4177, + "step": 29860 + }, + { + "epoch": 2.35, + "learning_rate": 3.346817411623241e-05, + "loss": 1.5111, + "step": 29861 + }, + { + "epoch": 2.35, + "learning_rate": 3.346039221511486e-05, + "loss": 1.4677, + "step": 29862 + }, + { + "epoch": 2.35, + "learning_rate": 3.345261110523699e-05, + "loss": 1.4193, + "step": 29863 + }, + { + "epoch": 2.35, + "learning_rate": 3.3444830786651564e-05, + "loss": 1.4848, + "step": 29864 + }, + { + "epoch": 2.35, + "learning_rate": 3.343705125941142e-05, + "loss": 1.4514, + "step": 29865 + }, + { + "epoch": 2.35, + "learning_rate": 3.342927252356933e-05, + "loss": 1.3814, + "step": 29866 + }, + { + "epoch": 2.35, + "learning_rate": 3.34214945791782e-05, + "loss": 1.4355, + "step": 29867 + }, + { + "epoch": 2.35, + "learning_rate": 3.341371742629078e-05, + "loss": 1.4065, + "step": 29868 + }, + { + "epoch": 2.35, + "learning_rate": 3.340594106495984e-05, + "loss": 1.4719, + "step": 29869 + }, + { + "epoch": 2.35, + "learning_rate": 3.3398165495238215e-05, + "loss": 1.44, + "step": 29870 + }, + { + "epoch": 2.35, + "learning_rate": 3.339039071717874e-05, + "loss": 1.4763, + "step": 29871 + }, + { + "epoch": 2.35, + "learning_rate": 3.338261673083418e-05, + "loss": 1.4673, + "step": 29872 + }, + { + "epoch": 2.35, + "learning_rate": 3.337484353625724e-05, + "loss": 1.436, + "step": 29873 + }, + { + "epoch": 2.35, + "learning_rate": 3.3367071133500804e-05, + "loss": 1.457, + "step": 29874 + }, + { + "epoch": 2.35, + "learning_rate": 3.335929952261759e-05, + "loss": 1.4429, + "step": 29875 + }, + { + "epoch": 2.35, + "learning_rate": 3.335152870366031e-05, + "loss": 1.4514, + "step": 29876 + }, + { + "epoch": 2.35, + "learning_rate": 3.334375867668184e-05, + "loss": 1.4323, + "step": 29877 + }, + { + "epoch": 2.35, + "learning_rate": 3.333598944173485e-05, + "loss": 1.4833, + "step": 29878 + }, + { + "epoch": 2.35, + "learning_rate": 3.332822099887208e-05, + "loss": 1.4592, + "step": 29879 + }, + { + "epoch": 2.35, + "learning_rate": 3.332045334814635e-05, + "loss": 1.459, + "step": 29880 + }, + { + "epoch": 2.35, + "learning_rate": 3.3312686489610345e-05, + "loss": 1.3942, + "step": 29881 + }, + { + "epoch": 2.35, + "learning_rate": 3.330492042331682e-05, + "loss": 1.4833, + "step": 29882 + }, + { + "epoch": 2.35, + "learning_rate": 3.329715514931843e-05, + "loss": 1.4496, + "step": 29883 + }, + { + "epoch": 2.35, + "learning_rate": 3.328939066766797e-05, + "loss": 1.4466, + "step": 29884 + }, + { + "epoch": 2.35, + "learning_rate": 3.328162697841817e-05, + "loss": 1.5132, + "step": 29885 + }, + { + "epoch": 2.35, + "learning_rate": 3.327386408162172e-05, + "loss": 1.4621, + "step": 29886 + }, + { + "epoch": 2.35, + "learning_rate": 3.3266101977331266e-05, + "loss": 1.4492, + "step": 29887 + }, + { + "epoch": 2.35, + "learning_rate": 3.325834066559962e-05, + "loss": 1.4242, + "step": 29888 + }, + { + "epoch": 2.35, + "learning_rate": 3.325058014647939e-05, + "loss": 1.4312, + "step": 29889 + }, + { + "epoch": 2.35, + "learning_rate": 3.3242820420023284e-05, + "loss": 1.4861, + "step": 29890 + }, + { + "epoch": 2.35, + "learning_rate": 3.323506148628402e-05, + "loss": 1.4496, + "step": 29891 + }, + { + "epoch": 2.35, + "learning_rate": 3.3227303345314246e-05, + "loss": 1.4147, + "step": 29892 + }, + { + "epoch": 2.35, + "learning_rate": 3.321954599716661e-05, + "loss": 1.518, + "step": 29893 + }, + { + "epoch": 2.35, + "learning_rate": 3.321178944189385e-05, + "loss": 1.4477, + "step": 29894 + }, + { + "epoch": 2.35, + "learning_rate": 3.320403367954858e-05, + "loss": 1.4972, + "step": 29895 + }, + { + "epoch": 2.35, + "learning_rate": 3.3196278710183444e-05, + "loss": 1.4733, + "step": 29896 + }, + { + "epoch": 2.35, + "learning_rate": 3.318852453385115e-05, + "loss": 1.4587, + "step": 29897 + }, + { + "epoch": 2.35, + "learning_rate": 3.3180771150604315e-05, + "loss": 1.4572, + "step": 29898 + }, + { + "epoch": 2.35, + "learning_rate": 3.3173018560495584e-05, + "loss": 1.5104, + "step": 29899 + }, + { + "epoch": 2.35, + "learning_rate": 3.316526676357749e-05, + "loss": 1.476, + "step": 29900 + }, + { + "epoch": 2.35, + "learning_rate": 3.315751575990286e-05, + "loss": 1.4175, + "step": 29901 + }, + { + "epoch": 2.35, + "learning_rate": 3.314976554952421e-05, + "loss": 1.3771, + "step": 29902 + }, + { + "epoch": 2.35, + "learning_rate": 3.314201613249417e-05, + "loss": 1.4905, + "step": 29903 + }, + { + "epoch": 2.35, + "learning_rate": 3.31342675088653e-05, + "loss": 1.4709, + "step": 29904 + }, + { + "epoch": 2.35, + "learning_rate": 3.312651967869031e-05, + "loss": 1.4662, + "step": 29905 + }, + { + "epoch": 2.35, + "learning_rate": 3.3118772642021764e-05, + "loss": 1.441, + "step": 29906 + }, + { + "epoch": 2.35, + "learning_rate": 3.311102639891221e-05, + "loss": 1.4592, + "step": 29907 + }, + { + "epoch": 2.35, + "learning_rate": 3.310328094941432e-05, + "loss": 1.4859, + "step": 29908 + }, + { + "epoch": 2.35, + "learning_rate": 3.3095536293580624e-05, + "loss": 1.4449, + "step": 29909 + }, + { + "epoch": 2.35, + "learning_rate": 3.308779243146371e-05, + "loss": 1.4377, + "step": 29910 + }, + { + "epoch": 2.35, + "learning_rate": 3.3080049363116196e-05, + "loss": 1.4453, + "step": 29911 + }, + { + "epoch": 2.35, + "learning_rate": 3.3072307088590625e-05, + "loss": 1.4071, + "step": 29912 + }, + { + "epoch": 2.35, + "learning_rate": 3.3064565607939534e-05, + "loss": 1.4186, + "step": 29913 + }, + { + "epoch": 2.35, + "learning_rate": 3.305682492121553e-05, + "loss": 1.449, + "step": 29914 + }, + { + "epoch": 2.35, + "learning_rate": 3.304908502847116e-05, + "loss": 1.4551, + "step": 29915 + }, + { + "epoch": 2.35, + "learning_rate": 3.3041345929758936e-05, + "loss": 1.4282, + "step": 29916 + }, + { + "epoch": 2.35, + "learning_rate": 3.303360762513142e-05, + "loss": 1.4197, + "step": 29917 + }, + { + "epoch": 2.35, + "learning_rate": 3.3025870114641196e-05, + "loss": 1.4799, + "step": 29918 + }, + { + "epoch": 2.35, + "learning_rate": 3.301813339834077e-05, + "loss": 1.4444, + "step": 29919 + }, + { + "epoch": 2.35, + "learning_rate": 3.301039747628263e-05, + "loss": 1.4656, + "step": 29920 + }, + { + "epoch": 2.35, + "learning_rate": 3.3002662348519354e-05, + "loss": 1.468, + "step": 29921 + }, + { + "epoch": 2.35, + "learning_rate": 3.299492801510345e-05, + "loss": 1.4391, + "step": 29922 + }, + { + "epoch": 2.35, + "learning_rate": 3.298719447608741e-05, + "loss": 1.4149, + "step": 29923 + }, + { + "epoch": 2.35, + "learning_rate": 3.2979461731523706e-05, + "loss": 1.4149, + "step": 29924 + }, + { + "epoch": 2.35, + "learning_rate": 3.2971729781464914e-05, + "loss": 1.4447, + "step": 29925 + }, + { + "epoch": 2.35, + "learning_rate": 3.296399862596351e-05, + "loss": 1.4861, + "step": 29926 + }, + { + "epoch": 2.35, + "learning_rate": 3.2956268265071914e-05, + "loss": 1.4497, + "step": 29927 + }, + { + "epoch": 2.35, + "learning_rate": 3.2948538698842706e-05, + "loss": 1.4539, + "step": 29928 + }, + { + "epoch": 2.35, + "learning_rate": 3.2940809927328336e-05, + "loss": 1.4752, + "step": 29929 + }, + { + "epoch": 2.35, + "learning_rate": 3.293308195058123e-05, + "loss": 1.4805, + "step": 29930 + }, + { + "epoch": 2.36, + "learning_rate": 3.292535476865392e-05, + "loss": 1.4354, + "step": 29931 + }, + { + "epoch": 2.36, + "learning_rate": 3.291762838159882e-05, + "loss": 1.4199, + "step": 29932 + }, + { + "epoch": 2.36, + "learning_rate": 3.2909902789468446e-05, + "loss": 1.439, + "step": 29933 + }, + { + "epoch": 2.36, + "learning_rate": 3.290217799231517e-05, + "loss": 1.4728, + "step": 29934 + }, + { + "epoch": 2.36, + "learning_rate": 3.289445399019154e-05, + "loss": 1.4729, + "step": 29935 + }, + { + "epoch": 2.36, + "learning_rate": 3.2886730783149926e-05, + "loss": 1.4502, + "step": 29936 + }, + { + "epoch": 2.36, + "learning_rate": 3.287900837124275e-05, + "loss": 1.4924, + "step": 29937 + }, + { + "epoch": 2.36, + "learning_rate": 3.287128675452251e-05, + "loss": 1.4457, + "step": 29938 + }, + { + "epoch": 2.36, + "learning_rate": 3.286356593304161e-05, + "loss": 1.481, + "step": 29939 + }, + { + "epoch": 2.36, + "learning_rate": 3.285584590685244e-05, + "loss": 1.5002, + "step": 29940 + }, + { + "epoch": 2.36, + "learning_rate": 3.28481266760074e-05, + "loss": 1.4355, + "step": 29941 + }, + { + "epoch": 2.36, + "learning_rate": 3.284040824055897e-05, + "loss": 1.5042, + "step": 29942 + }, + { + "epoch": 2.36, + "learning_rate": 3.283269060055951e-05, + "loss": 1.4211, + "step": 29943 + }, + { + "epoch": 2.36, + "learning_rate": 3.2824973756061376e-05, + "loss": 1.5006, + "step": 29944 + }, + { + "epoch": 2.36, + "learning_rate": 3.2817257707117054e-05, + "loss": 1.5371, + "step": 29945 + }, + { + "epoch": 2.36, + "learning_rate": 3.280954245377889e-05, + "loss": 1.413, + "step": 29946 + }, + { + "epoch": 2.36, + "learning_rate": 3.280182799609922e-05, + "loss": 1.4641, + "step": 29947 + }, + { + "epoch": 2.36, + "learning_rate": 3.279411433413046e-05, + "loss": 1.4268, + "step": 29948 + }, + { + "epoch": 2.36, + "learning_rate": 3.2786401467925026e-05, + "loss": 1.4964, + "step": 29949 + }, + { + "epoch": 2.36, + "learning_rate": 3.2778689397535244e-05, + "loss": 1.4732, + "step": 29950 + }, + { + "epoch": 2.36, + "learning_rate": 3.277097812301344e-05, + "loss": 1.4689, + "step": 29951 + }, + { + "epoch": 2.36, + "learning_rate": 3.276326764441202e-05, + "loss": 1.4448, + "step": 29952 + }, + { + "epoch": 2.36, + "learning_rate": 3.275555796178333e-05, + "loss": 1.458, + "step": 29953 + }, + { + "epoch": 2.36, + "learning_rate": 3.274784907517967e-05, + "loss": 1.4522, + "step": 29954 + }, + { + "epoch": 2.36, + "learning_rate": 3.2740140984653424e-05, + "loss": 1.4897, + "step": 29955 + }, + { + "epoch": 2.36, + "learning_rate": 3.273243369025693e-05, + "loss": 1.4824, + "step": 29956 + }, + { + "epoch": 2.36, + "learning_rate": 3.27247271920425e-05, + "loss": 1.444, + "step": 29957 + }, + { + "epoch": 2.36, + "learning_rate": 3.27170214900624e-05, + "loss": 1.4687, + "step": 29958 + }, + { + "epoch": 2.36, + "learning_rate": 3.270931658436905e-05, + "loss": 1.4343, + "step": 29959 + }, + { + "epoch": 2.36, + "learning_rate": 3.270161247501472e-05, + "loss": 1.4648, + "step": 29960 + }, + { + "epoch": 2.36, + "learning_rate": 3.2693909162051674e-05, + "loss": 1.4401, + "step": 29961 + }, + { + "epoch": 2.36, + "learning_rate": 3.268620664553227e-05, + "loss": 1.4096, + "step": 29962 + }, + { + "epoch": 2.36, + "learning_rate": 3.2678504925508754e-05, + "loss": 1.4585, + "step": 29963 + }, + { + "epoch": 2.36, + "learning_rate": 3.26708040020335e-05, + "loss": 1.4765, + "step": 29964 + }, + { + "epoch": 2.36, + "learning_rate": 3.2663103875158673e-05, + "loss": 1.4345, + "step": 29965 + }, + { + "epoch": 2.36, + "learning_rate": 3.265540454493668e-05, + "loss": 1.4648, + "step": 29966 + }, + { + "epoch": 2.36, + "learning_rate": 3.2647706011419724e-05, + "loss": 1.4396, + "step": 29967 + }, + { + "epoch": 2.36, + "learning_rate": 3.264000827466004e-05, + "loss": 1.4588, + "step": 29968 + }, + { + "epoch": 2.36, + "learning_rate": 3.2632311334709995e-05, + "loss": 1.4464, + "step": 29969 + }, + { + "epoch": 2.36, + "learning_rate": 3.262461519162177e-05, + "loss": 1.4282, + "step": 29970 + }, + { + "epoch": 2.36, + "learning_rate": 3.261691984544759e-05, + "loss": 1.4746, + "step": 29971 + }, + { + "epoch": 2.36, + "learning_rate": 3.260922529623979e-05, + "loss": 1.451, + "step": 29972 + }, + { + "epoch": 2.36, + "learning_rate": 3.2601531544050584e-05, + "loss": 1.5088, + "step": 29973 + }, + { + "epoch": 2.36, + "learning_rate": 3.259383858893214e-05, + "loss": 1.4357, + "step": 29974 + }, + { + "epoch": 2.36, + "learning_rate": 3.258614643093679e-05, + "loss": 1.449, + "step": 29975 + }, + { + "epoch": 2.36, + "learning_rate": 3.25784550701167e-05, + "loss": 1.4608, + "step": 29976 + }, + { + "epoch": 2.36, + "learning_rate": 3.257076450652411e-05, + "loss": 1.4821, + "step": 29977 + }, + { + "epoch": 2.36, + "learning_rate": 3.256307474021118e-05, + "loss": 1.4131, + "step": 29978 + }, + { + "epoch": 2.36, + "learning_rate": 3.255538577123017e-05, + "loss": 1.4273, + "step": 29979 + }, + { + "epoch": 2.36, + "learning_rate": 3.254769759963332e-05, + "loss": 1.4321, + "step": 29980 + }, + { + "epoch": 2.36, + "learning_rate": 3.2540010225472795e-05, + "loss": 1.4039, + "step": 29981 + }, + { + "epoch": 2.36, + "learning_rate": 3.253232364880072e-05, + "loss": 1.4308, + "step": 29982 + }, + { + "epoch": 2.36, + "learning_rate": 3.2524637869669406e-05, + "loss": 1.398, + "step": 29983 + }, + { + "epoch": 2.36, + "learning_rate": 3.2516952888130955e-05, + "loss": 1.4389, + "step": 29984 + }, + { + "epoch": 2.36, + "learning_rate": 3.2509268704237534e-05, + "loss": 1.4459, + "step": 29985 + }, + { + "epoch": 2.36, + "learning_rate": 3.2501585318041376e-05, + "loss": 1.4441, + "step": 29986 + }, + { + "epoch": 2.36, + "learning_rate": 3.249390272959461e-05, + "loss": 1.4671, + "step": 29987 + }, + { + "epoch": 2.36, + "learning_rate": 3.248622093894936e-05, + "loss": 1.4294, + "step": 29988 + }, + { + "epoch": 2.36, + "learning_rate": 3.247853994615787e-05, + "loss": 1.4503, + "step": 29989 + }, + { + "epoch": 2.36, + "learning_rate": 3.247085975127223e-05, + "loss": 1.4523, + "step": 29990 + }, + { + "epoch": 2.36, + "learning_rate": 3.246318035434455e-05, + "loss": 1.4455, + "step": 29991 + }, + { + "epoch": 2.36, + "learning_rate": 3.245550175542706e-05, + "loss": 1.4227, + "step": 29992 + }, + { + "epoch": 2.36, + "learning_rate": 3.244782395457186e-05, + "loss": 1.4413, + "step": 29993 + }, + { + "epoch": 2.36, + "learning_rate": 3.244014695183101e-05, + "loss": 1.4403, + "step": 29994 + }, + { + "epoch": 2.36, + "learning_rate": 3.243247074725668e-05, + "loss": 1.4698, + "step": 29995 + }, + { + "epoch": 2.36, + "learning_rate": 3.242479534090104e-05, + "loss": 1.5069, + "step": 29996 + }, + { + "epoch": 2.36, + "learning_rate": 3.2417120732816165e-05, + "loss": 1.4667, + "step": 29997 + }, + { + "epoch": 2.36, + "learning_rate": 3.240944692305415e-05, + "loss": 1.4484, + "step": 29998 + }, + { + "epoch": 2.36, + "learning_rate": 3.240177391166705e-05, + "loss": 1.4136, + "step": 29999 + }, + { + "epoch": 2.36, + "learning_rate": 3.239410169870706e-05, + "loss": 1.4584, + "step": 30000 + }, + { + "epoch": 2.36, + "learning_rate": 3.2386430284226216e-05, + "loss": 1.4815, + "step": 30001 + }, + { + "epoch": 2.36, + "learning_rate": 3.237875966827657e-05, + "loss": 1.4452, + "step": 30002 + }, + { + "epoch": 2.36, + "learning_rate": 3.237108985091027e-05, + "loss": 1.4112, + "step": 30003 + }, + { + "epoch": 2.36, + "learning_rate": 3.2363420832179354e-05, + "loss": 1.4124, + "step": 30004 + }, + { + "epoch": 2.36, + "learning_rate": 3.235575261213586e-05, + "loss": 1.4207, + "step": 30005 + }, + { + "epoch": 2.36, + "learning_rate": 3.2348085190831924e-05, + "loss": 1.4611, + "step": 30006 + }, + { + "epoch": 2.36, + "learning_rate": 3.234041856831956e-05, + "loss": 1.4553, + "step": 30007 + }, + { + "epoch": 2.36, + "learning_rate": 3.233275274465077e-05, + "loss": 1.4295, + "step": 30008 + }, + { + "epoch": 2.36, + "learning_rate": 3.2325087719877714e-05, + "loss": 1.51, + "step": 30009 + }, + { + "epoch": 2.36, + "learning_rate": 3.231742349405234e-05, + "loss": 1.4647, + "step": 30010 + }, + { + "epoch": 2.36, + "learning_rate": 3.230976006722674e-05, + "loss": 1.3984, + "step": 30011 + }, + { + "epoch": 2.36, + "learning_rate": 3.230209743945289e-05, + "loss": 1.4478, + "step": 30012 + }, + { + "epoch": 2.36, + "learning_rate": 3.229443561078289e-05, + "loss": 1.4273, + "step": 30013 + }, + { + "epoch": 2.36, + "learning_rate": 3.228677458126872e-05, + "loss": 1.4559, + "step": 30014 + }, + { + "epoch": 2.36, + "learning_rate": 3.227911435096238e-05, + "loss": 1.4974, + "step": 30015 + }, + { + "epoch": 2.36, + "learning_rate": 3.227145491991585e-05, + "loss": 1.4402, + "step": 30016 + }, + { + "epoch": 2.36, + "learning_rate": 3.226379628818122e-05, + "loss": 1.3773, + "step": 30017 + }, + { + "epoch": 2.36, + "learning_rate": 3.225613845581045e-05, + "loss": 1.4488, + "step": 30018 + }, + { + "epoch": 2.36, + "learning_rate": 3.224848142285546e-05, + "loss": 1.477, + "step": 30019 + }, + { + "epoch": 2.36, + "learning_rate": 3.2240825189368364e-05, + "loss": 1.4125, + "step": 30020 + }, + { + "epoch": 2.36, + "learning_rate": 3.223316975540107e-05, + "loss": 1.4531, + "step": 30021 + }, + { + "epoch": 2.36, + "learning_rate": 3.2225515121005513e-05, + "loss": 1.4329, + "step": 30022 + }, + { + "epoch": 2.36, + "learning_rate": 3.221786128623377e-05, + "loss": 1.4469, + "step": 30023 + }, + { + "epoch": 2.36, + "learning_rate": 3.221020825113775e-05, + "loss": 1.4896, + "step": 30024 + }, + { + "epoch": 2.36, + "learning_rate": 3.220255601576937e-05, + "loss": 1.4631, + "step": 30025 + }, + { + "epoch": 2.36, + "learning_rate": 3.2194904580180635e-05, + "loss": 1.4539, + "step": 30026 + }, + { + "epoch": 2.36, + "learning_rate": 3.2187253944423516e-05, + "loss": 1.5287, + "step": 30027 + }, + { + "epoch": 2.36, + "learning_rate": 3.2179604108549946e-05, + "loss": 1.4871, + "step": 30028 + }, + { + "epoch": 2.36, + "learning_rate": 3.217195507261179e-05, + "loss": 1.38, + "step": 30029 + }, + { + "epoch": 2.36, + "learning_rate": 3.216430683666107e-05, + "loss": 1.404, + "step": 30030 + }, + { + "epoch": 2.36, + "learning_rate": 3.2156659400749696e-05, + "loss": 1.4302, + "step": 30031 + }, + { + "epoch": 2.36, + "learning_rate": 3.214901276492953e-05, + "loss": 1.4526, + "step": 30032 + }, + { + "epoch": 2.36, + "learning_rate": 3.214136692925256e-05, + "loss": 1.4653, + "step": 30033 + }, + { + "epoch": 2.36, + "learning_rate": 3.2133721893770685e-05, + "loss": 1.4076, + "step": 30034 + }, + { + "epoch": 2.36, + "learning_rate": 3.212607765853578e-05, + "loss": 1.4454, + "step": 30035 + }, + { + "epoch": 2.36, + "learning_rate": 3.211843422359974e-05, + "loss": 1.4278, + "step": 30036 + }, + { + "epoch": 2.36, + "learning_rate": 3.2110791589014494e-05, + "loss": 1.4557, + "step": 30037 + }, + { + "epoch": 2.36, + "learning_rate": 3.210314975483193e-05, + "loss": 1.3849, + "step": 30038 + }, + { + "epoch": 2.36, + "learning_rate": 3.209550872110389e-05, + "loss": 1.4434, + "step": 30039 + }, + { + "epoch": 2.36, + "learning_rate": 3.20878684878823e-05, + "loss": 1.4686, + "step": 30040 + }, + { + "epoch": 2.36, + "learning_rate": 3.208022905521902e-05, + "loss": 1.4426, + "step": 30041 + }, + { + "epoch": 2.36, + "learning_rate": 3.2072590423165864e-05, + "loss": 1.4768, + "step": 30042 + }, + { + "epoch": 2.36, + "learning_rate": 3.206495259177475e-05, + "loss": 1.4569, + "step": 30043 + }, + { + "epoch": 2.36, + "learning_rate": 3.205731556109758e-05, + "loss": 1.5233, + "step": 30044 + }, + { + "epoch": 2.36, + "learning_rate": 3.204967933118613e-05, + "loss": 1.4277, + "step": 30045 + }, + { + "epoch": 2.36, + "learning_rate": 3.2042043902092223e-05, + "loss": 1.4101, + "step": 30046 + }, + { + "epoch": 2.36, + "learning_rate": 3.2034409273867806e-05, + "loss": 1.4801, + "step": 30047 + }, + { + "epoch": 2.36, + "learning_rate": 3.2026775446564635e-05, + "loss": 1.4438, + "step": 30048 + }, + { + "epoch": 2.36, + "learning_rate": 3.2019142420234514e-05, + "loss": 1.4578, + "step": 30049 + }, + { + "epoch": 2.36, + "learning_rate": 3.201151019492936e-05, + "loss": 1.4916, + "step": 30050 + }, + { + "epoch": 2.36, + "learning_rate": 3.2003878770700934e-05, + "loss": 1.4645, + "step": 30051 + }, + { + "epoch": 2.36, + "learning_rate": 3.199624814760106e-05, + "loss": 1.4221, + "step": 30052 + }, + { + "epoch": 2.36, + "learning_rate": 3.1988618325681495e-05, + "loss": 1.451, + "step": 30053 + }, + { + "epoch": 2.36, + "learning_rate": 3.198098930499413e-05, + "loss": 1.4466, + "step": 30054 + }, + { + "epoch": 2.36, + "learning_rate": 3.197336108559072e-05, + "loss": 1.3912, + "step": 30055 + }, + { + "epoch": 2.36, + "learning_rate": 3.1965733667523025e-05, + "loss": 1.4483, + "step": 30056 + }, + { + "epoch": 2.36, + "learning_rate": 3.1958107050842835e-05, + "loss": 1.4384, + "step": 30057 + }, + { + "epoch": 2.37, + "learning_rate": 3.1950481235602024e-05, + "loss": 1.4217, + "step": 30058 + }, + { + "epoch": 2.37, + "learning_rate": 3.194285622185229e-05, + "loss": 1.4148, + "step": 30059 + }, + { + "epoch": 2.37, + "learning_rate": 3.1935232009645374e-05, + "loss": 1.4301, + "step": 30060 + }, + { + "epoch": 2.37, + "learning_rate": 3.192760859903311e-05, + "loss": 1.4196, + "step": 30061 + }, + { + "epoch": 2.37, + "learning_rate": 3.1919985990067245e-05, + "loss": 1.3839, + "step": 30062 + }, + { + "epoch": 2.37, + "learning_rate": 3.191236418279946e-05, + "loss": 1.5227, + "step": 30063 + }, + { + "epoch": 2.37, + "learning_rate": 3.190474317728161e-05, + "loss": 1.4187, + "step": 30064 + }, + { + "epoch": 2.37, + "learning_rate": 3.189712297356536e-05, + "loss": 1.4032, + "step": 30065 + }, + { + "epoch": 2.37, + "learning_rate": 3.188950357170244e-05, + "loss": 1.444, + "step": 30066 + }, + { + "epoch": 2.37, + "learning_rate": 3.188188497174466e-05, + "loss": 1.465, + "step": 30067 + }, + { + "epoch": 2.37, + "learning_rate": 3.1874267173743687e-05, + "loss": 1.4527, + "step": 30068 + }, + { + "epoch": 2.37, + "learning_rate": 3.186665017775126e-05, + "loss": 1.4452, + "step": 30069 + }, + { + "epoch": 2.37, + "learning_rate": 3.1859033983819056e-05, + "loss": 1.4762, + "step": 30070 + }, + { + "epoch": 2.37, + "learning_rate": 3.185141859199884e-05, + "loss": 1.4907, + "step": 30071 + }, + { + "epoch": 2.37, + "learning_rate": 3.1843804002342296e-05, + "loss": 1.412, + "step": 30072 + }, + { + "epoch": 2.37, + "learning_rate": 3.183619021490104e-05, + "loss": 1.4581, + "step": 30073 + }, + { + "epoch": 2.37, + "learning_rate": 3.182857722972693e-05, + "loss": 1.4782, + "step": 30074 + }, + { + "epoch": 2.37, + "learning_rate": 3.1820965046871554e-05, + "loss": 1.4398, + "step": 30075 + }, + { + "epoch": 2.37, + "learning_rate": 3.181335366638662e-05, + "loss": 1.4169, + "step": 30076 + }, + { + "epoch": 2.37, + "learning_rate": 3.180574308832375e-05, + "loss": 1.4382, + "step": 30077 + }, + { + "epoch": 2.37, + "learning_rate": 3.1798133312734695e-05, + "loss": 1.4485, + "step": 30078 + }, + { + "epoch": 2.37, + "learning_rate": 3.1790524339671093e-05, + "loss": 1.4886, + "step": 30079 + }, + { + "epoch": 2.37, + "learning_rate": 3.178291616918456e-05, + "loss": 1.4439, + "step": 30080 + }, + { + "epoch": 2.37, + "learning_rate": 3.177530880132682e-05, + "loss": 1.4703, + "step": 30081 + }, + { + "epoch": 2.37, + "learning_rate": 3.176770223614949e-05, + "loss": 1.4405, + "step": 30082 + }, + { + "epoch": 2.37, + "learning_rate": 3.176009647370419e-05, + "loss": 1.4365, + "step": 30083 + }, + { + "epoch": 2.37, + "learning_rate": 3.175249151404261e-05, + "loss": 1.4405, + "step": 30084 + }, + { + "epoch": 2.37, + "learning_rate": 3.1744887357216365e-05, + "loss": 1.435, + "step": 30085 + }, + { + "epoch": 2.37, + "learning_rate": 3.173728400327704e-05, + "loss": 1.4877, + "step": 30086 + }, + { + "epoch": 2.37, + "learning_rate": 3.1729681452276336e-05, + "loss": 1.4938, + "step": 30087 + }, + { + "epoch": 2.37, + "learning_rate": 3.172207970426582e-05, + "loss": 1.4546, + "step": 30088 + }, + { + "epoch": 2.37, + "learning_rate": 3.171447875929707e-05, + "loss": 1.4938, + "step": 30089 + }, + { + "epoch": 2.37, + "learning_rate": 3.170687861742173e-05, + "loss": 1.4522, + "step": 30090 + }, + { + "epoch": 2.37, + "learning_rate": 3.169927927869145e-05, + "loss": 1.4736, + "step": 30091 + }, + { + "epoch": 2.37, + "learning_rate": 3.1691680743157786e-05, + "loss": 1.4446, + "step": 30092 + }, + { + "epoch": 2.37, + "learning_rate": 3.168408301087232e-05, + "loss": 1.4296, + "step": 30093 + }, + { + "epoch": 2.37, + "learning_rate": 3.167648608188659e-05, + "loss": 1.4417, + "step": 30094 + }, + { + "epoch": 2.37, + "learning_rate": 3.166888995625227e-05, + "loss": 1.4744, + "step": 30095 + }, + { + "epoch": 2.37, + "learning_rate": 3.1661294634020876e-05, + "loss": 1.4007, + "step": 30096 + }, + { + "epoch": 2.37, + "learning_rate": 3.165370011524396e-05, + "loss": 1.4252, + "step": 30097 + }, + { + "epoch": 2.37, + "learning_rate": 3.164610639997315e-05, + "loss": 1.465, + "step": 30098 + }, + { + "epoch": 2.37, + "learning_rate": 3.163851348825996e-05, + "loss": 1.4426, + "step": 30099 + }, + { + "epoch": 2.37, + "learning_rate": 3.1630921380155915e-05, + "loss": 1.4414, + "step": 30100 + }, + { + "epoch": 2.37, + "learning_rate": 3.1623330075712624e-05, + "loss": 1.4189, + "step": 30101 + }, + { + "epoch": 2.37, + "learning_rate": 3.16157395749816e-05, + "loss": 1.522, + "step": 30102 + }, + { + "epoch": 2.37, + "learning_rate": 3.160814987801433e-05, + "loss": 1.4792, + "step": 30103 + }, + { + "epoch": 2.37, + "learning_rate": 3.160056098486239e-05, + "loss": 1.4939, + "step": 30104 + }, + { + "epoch": 2.37, + "learning_rate": 3.1592972895577345e-05, + "loss": 1.4356, + "step": 30105 + }, + { + "epoch": 2.37, + "learning_rate": 3.158538561021066e-05, + "loss": 1.4809, + "step": 30106 + }, + { + "epoch": 2.37, + "learning_rate": 3.1577799128813835e-05, + "loss": 1.442, + "step": 30107 + }, + { + "epoch": 2.37, + "learning_rate": 3.157021345143844e-05, + "loss": 1.4407, + "step": 30108 + }, + { + "epoch": 2.37, + "learning_rate": 3.156262857813594e-05, + "loss": 1.4633, + "step": 30109 + }, + { + "epoch": 2.37, + "learning_rate": 3.155504450895784e-05, + "loss": 1.4213, + "step": 30110 + }, + { + "epoch": 2.37, + "learning_rate": 3.154746124395556e-05, + "loss": 1.4718, + "step": 30111 + }, + { + "epoch": 2.37, + "learning_rate": 3.15398787831807e-05, + "loss": 1.4336, + "step": 30112 + }, + { + "epoch": 2.37, + "learning_rate": 3.153229712668471e-05, + "loss": 1.3993, + "step": 30113 + }, + { + "epoch": 2.37, + "learning_rate": 3.1524716274519e-05, + "loss": 1.4291, + "step": 30114 + }, + { + "epoch": 2.37, + "learning_rate": 3.151713622673511e-05, + "loss": 1.4359, + "step": 30115 + }, + { + "epoch": 2.37, + "learning_rate": 3.1509556983384496e-05, + "loss": 1.4625, + "step": 30116 + }, + { + "epoch": 2.37, + "learning_rate": 3.150197854451856e-05, + "loss": 1.4669, + "step": 30117 + }, + { + "epoch": 2.37, + "learning_rate": 3.149440091018883e-05, + "loss": 1.4418, + "step": 30118 + }, + { + "epoch": 2.37, + "learning_rate": 3.1486824080446734e-05, + "loss": 1.4941, + "step": 30119 + }, + { + "epoch": 2.37, + "learning_rate": 3.1479248055343655e-05, + "loss": 1.425, + "step": 30120 + }, + { + "epoch": 2.37, + "learning_rate": 3.147167283493107e-05, + "loss": 1.4341, + "step": 30121 + }, + { + "epoch": 2.37, + "learning_rate": 3.146409841926046e-05, + "loss": 1.468, + "step": 30122 + }, + { + "epoch": 2.37, + "learning_rate": 3.1456524808383205e-05, + "loss": 1.4392, + "step": 30123 + }, + { + "epoch": 2.37, + "learning_rate": 3.1448952002350705e-05, + "loss": 1.4508, + "step": 30124 + }, + { + "epoch": 2.37, + "learning_rate": 3.1441380001214414e-05, + "loss": 1.452, + "step": 30125 + }, + { + "epoch": 2.37, + "learning_rate": 3.1433808805025736e-05, + "loss": 1.4334, + "step": 30126 + }, + { + "epoch": 2.37, + "learning_rate": 3.142623841383608e-05, + "loss": 1.4616, + "step": 30127 + }, + { + "epoch": 2.37, + "learning_rate": 3.141866882769678e-05, + "loss": 1.4203, + "step": 30128 + }, + { + "epoch": 2.37, + "learning_rate": 3.141110004665933e-05, + "loss": 1.4581, + "step": 30129 + }, + { + "epoch": 2.37, + "learning_rate": 3.1403532070775064e-05, + "loss": 1.477, + "step": 30130 + }, + { + "epoch": 2.37, + "learning_rate": 3.139596490009531e-05, + "loss": 1.4836, + "step": 30131 + }, + { + "epoch": 2.37, + "learning_rate": 3.138839853467156e-05, + "loss": 1.4636, + "step": 30132 + }, + { + "epoch": 2.37, + "learning_rate": 3.138083297455512e-05, + "loss": 1.4412, + "step": 30133 + }, + { + "epoch": 2.37, + "learning_rate": 3.137326821979733e-05, + "loss": 1.4536, + "step": 30134 + }, + { + "epoch": 2.37, + "learning_rate": 3.136570427044963e-05, + "loss": 1.485, + "step": 30135 + }, + { + "epoch": 2.37, + "learning_rate": 3.135814112656328e-05, + "loss": 1.4007, + "step": 30136 + }, + { + "epoch": 2.37, + "learning_rate": 3.1350578788189735e-05, + "loss": 1.3946, + "step": 30137 + }, + { + "epoch": 2.37, + "learning_rate": 3.134301725538024e-05, + "loss": 1.4404, + "step": 30138 + }, + { + "epoch": 2.37, + "learning_rate": 3.1335456528186196e-05, + "loss": 1.4095, + "step": 30139 + }, + { + "epoch": 2.37, + "learning_rate": 3.132789660665894e-05, + "loss": 1.4704, + "step": 30140 + }, + { + "epoch": 2.37, + "learning_rate": 3.132033749084973e-05, + "loss": 1.4551, + "step": 30141 + }, + { + "epoch": 2.37, + "learning_rate": 3.131277918080998e-05, + "loss": 1.4318, + "step": 30142 + }, + { + "epoch": 2.37, + "learning_rate": 3.130522167659095e-05, + "loss": 1.4937, + "step": 30143 + }, + { + "epoch": 2.37, + "learning_rate": 3.129766497824393e-05, + "loss": 1.4593, + "step": 30144 + }, + { + "epoch": 2.37, + "learning_rate": 3.1290109085820306e-05, + "loss": 1.4738, + "step": 30145 + }, + { + "epoch": 2.37, + "learning_rate": 3.1282553999371324e-05, + "loss": 1.4438, + "step": 30146 + }, + { + "epoch": 2.37, + "learning_rate": 3.12749997189483e-05, + "loss": 1.4292, + "step": 30147 + }, + { + "epoch": 2.37, + "learning_rate": 3.126744624460245e-05, + "loss": 1.4872, + "step": 30148 + }, + { + "epoch": 2.37, + "learning_rate": 3.125989357638516e-05, + "loss": 1.425, + "step": 30149 + }, + { + "epoch": 2.37, + "learning_rate": 3.125234171434769e-05, + "loss": 1.4495, + "step": 30150 + }, + { + "epoch": 2.37, + "learning_rate": 3.124479065854124e-05, + "loss": 1.3968, + "step": 30151 + }, + { + "epoch": 2.37, + "learning_rate": 3.123724040901711e-05, + "loss": 1.4513, + "step": 30152 + }, + { + "epoch": 2.37, + "learning_rate": 3.122969096582664e-05, + "loss": 1.4944, + "step": 30153 + }, + { + "epoch": 2.37, + "learning_rate": 3.1222142329021006e-05, + "loss": 1.4609, + "step": 30154 + }, + { + "epoch": 2.37, + "learning_rate": 3.121459449865144e-05, + "loss": 1.4837, + "step": 30155 + }, + { + "epoch": 2.37, + "learning_rate": 3.120704747476929e-05, + "loss": 1.4343, + "step": 30156 + }, + { + "epoch": 2.37, + "learning_rate": 3.11995012574257e-05, + "loss": 1.4582, + "step": 30157 + }, + { + "epoch": 2.37, + "learning_rate": 3.1191955846671914e-05, + "loss": 1.4338, + "step": 30158 + }, + { + "epoch": 2.37, + "learning_rate": 3.1184411242559224e-05, + "loss": 1.4332, + "step": 30159 + }, + { + "epoch": 2.37, + "learning_rate": 3.117686744513882e-05, + "loss": 1.4568, + "step": 30160 + }, + { + "epoch": 2.37, + "learning_rate": 3.116932445446187e-05, + "loss": 1.5005, + "step": 30161 + }, + { + "epoch": 2.37, + "learning_rate": 3.116178227057967e-05, + "loss": 1.4095, + "step": 30162 + }, + { + "epoch": 2.37, + "learning_rate": 3.115424089354337e-05, + "loss": 1.499, + "step": 30163 + }, + { + "epoch": 2.37, + "learning_rate": 3.1146700323404204e-05, + "loss": 1.4346, + "step": 30164 + }, + { + "epoch": 2.37, + "learning_rate": 3.113916056021332e-05, + "loss": 1.4576, + "step": 30165 + }, + { + "epoch": 2.37, + "learning_rate": 3.1131621604021976e-05, + "loss": 1.4585, + "step": 30166 + }, + { + "epoch": 2.37, + "learning_rate": 3.11240834548813e-05, + "loss": 1.4523, + "step": 30167 + }, + { + "epoch": 2.37, + "learning_rate": 3.111654611284252e-05, + "loss": 1.3779, + "step": 30168 + }, + { + "epoch": 2.37, + "learning_rate": 3.110900957795674e-05, + "loss": 1.4553, + "step": 30169 + }, + { + "epoch": 2.37, + "learning_rate": 3.1101473850275227e-05, + "loss": 1.4228, + "step": 30170 + }, + { + "epoch": 2.37, + "learning_rate": 3.1093938929849094e-05, + "loss": 1.416, + "step": 30171 + }, + { + "epoch": 2.37, + "learning_rate": 3.108640481672945e-05, + "loss": 1.4394, + "step": 30172 + }, + { + "epoch": 2.37, + "learning_rate": 3.107887151096755e-05, + "loss": 1.5123, + "step": 30173 + }, + { + "epoch": 2.37, + "learning_rate": 3.107133901261448e-05, + "loss": 1.444, + "step": 30174 + }, + { + "epoch": 2.37, + "learning_rate": 3.106380732172133e-05, + "loss": 1.5257, + "step": 30175 + }, + { + "epoch": 2.37, + "learning_rate": 3.105627643833935e-05, + "loss": 1.3851, + "step": 30176 + }, + { + "epoch": 2.37, + "learning_rate": 3.104874636251962e-05, + "loss": 1.45, + "step": 30177 + }, + { + "epoch": 2.37, + "learning_rate": 3.1041217094313205e-05, + "loss": 1.4447, + "step": 30178 + }, + { + "epoch": 2.37, + "learning_rate": 3.1033688633771337e-05, + "loss": 1.4623, + "step": 30179 + }, + { + "epoch": 2.37, + "learning_rate": 3.1026160980945057e-05, + "loss": 1.4921, + "step": 30180 + }, + { + "epoch": 2.37, + "learning_rate": 3.1018634135885485e-05, + "loss": 1.4403, + "step": 30181 + }, + { + "epoch": 2.37, + "learning_rate": 3.10111080986437e-05, + "loss": 1.4217, + "step": 30182 + }, + { + "epoch": 2.37, + "learning_rate": 3.1003582869270835e-05, + "loss": 1.4345, + "step": 30183 + }, + { + "epoch": 2.37, + "learning_rate": 3.099605844781799e-05, + "loss": 1.481, + "step": 30184 + }, + { + "epoch": 2.37, + "learning_rate": 3.0988534834336204e-05, + "loss": 1.4455, + "step": 30185 + }, + { + "epoch": 2.38, + "learning_rate": 3.098101202887665e-05, + "loss": 1.4388, + "step": 30186 + }, + { + "epoch": 2.38, + "learning_rate": 3.0973490031490324e-05, + "loss": 1.4912, + "step": 30187 + }, + { + "epoch": 2.38, + "learning_rate": 3.0965968842228326e-05, + "loss": 1.3943, + "step": 30188 + }, + { + "epoch": 2.38, + "learning_rate": 3.095844846114166e-05, + "loss": 1.4519, + "step": 30189 + }, + { + "epoch": 2.38, + "learning_rate": 3.095092888828149e-05, + "loss": 1.422, + "step": 30190 + }, + { + "epoch": 2.38, + "learning_rate": 3.094341012369881e-05, + "loss": 1.4948, + "step": 30191 + }, + { + "epoch": 2.38, + "learning_rate": 3.0935892167444625e-05, + "loss": 1.4586, + "step": 30192 + }, + { + "epoch": 2.38, + "learning_rate": 3.092837501957009e-05, + "loss": 1.4363, + "step": 30193 + }, + { + "epoch": 2.38, + "learning_rate": 3.092085868012616e-05, + "loss": 1.4525, + "step": 30194 + }, + { + "epoch": 2.38, + "learning_rate": 3.091334314916386e-05, + "loss": 1.4861, + "step": 30195 + }, + { + "epoch": 2.38, + "learning_rate": 3.090582842673427e-05, + "loss": 1.4428, + "step": 30196 + }, + { + "epoch": 2.38, + "learning_rate": 3.08983145128884e-05, + "loss": 1.4173, + "step": 30197 + }, + { + "epoch": 2.38, + "learning_rate": 3.0890801407677176e-05, + "loss": 1.4776, + "step": 30198 + }, + { + "epoch": 2.38, + "learning_rate": 3.0883289111151715e-05, + "loss": 1.4453, + "step": 30199 + }, + { + "epoch": 2.38, + "learning_rate": 3.087577762336301e-05, + "loss": 1.4115, + "step": 30200 + }, + { + "epoch": 2.38, + "learning_rate": 3.0868266944362045e-05, + "loss": 1.4322, + "step": 30201 + }, + { + "epoch": 2.38, + "learning_rate": 3.086075707419976e-05, + "loss": 1.4403, + "step": 30202 + }, + { + "epoch": 2.38, + "learning_rate": 3.085324801292723e-05, + "loss": 1.4329, + "step": 30203 + }, + { + "epoch": 2.38, + "learning_rate": 3.084573976059539e-05, + "loss": 1.4667, + "step": 30204 + }, + { + "epoch": 2.38, + "learning_rate": 3.083823231725522e-05, + "loss": 1.4693, + "step": 30205 + }, + { + "epoch": 2.38, + "learning_rate": 3.0830725682957656e-05, + "loss": 1.4855, + "step": 30206 + }, + { + "epoch": 2.38, + "learning_rate": 3.0823219857753754e-05, + "loss": 1.4749, + "step": 30207 + }, + { + "epoch": 2.38, + "learning_rate": 3.0815714841694406e-05, + "loss": 1.4065, + "step": 30208 + }, + { + "epoch": 2.38, + "learning_rate": 3.080821063483055e-05, + "loss": 1.5156, + "step": 30209 + }, + { + "epoch": 2.38, + "learning_rate": 3.0800707237213214e-05, + "loss": 1.455, + "step": 30210 + }, + { + "epoch": 2.38, + "learning_rate": 3.0793204648893285e-05, + "loss": 1.4469, + "step": 30211 + }, + { + "epoch": 2.38, + "learning_rate": 3.0785702869921686e-05, + "loss": 1.4636, + "step": 30212 + }, + { + "epoch": 2.38, + "learning_rate": 3.0778201900349415e-05, + "loss": 1.4472, + "step": 30213 + }, + { + "epoch": 2.38, + "learning_rate": 3.077070174022731e-05, + "loss": 1.4168, + "step": 30214 + }, + { + "epoch": 2.38, + "learning_rate": 3.0763202389606386e-05, + "loss": 1.4327, + "step": 30215 + }, + { + "epoch": 2.38, + "learning_rate": 3.075570384853748e-05, + "loss": 1.4954, + "step": 30216 + }, + { + "epoch": 2.38, + "learning_rate": 3.074820611707159e-05, + "loss": 1.4992, + "step": 30217 + }, + { + "epoch": 2.38, + "learning_rate": 3.074070919525956e-05, + "loss": 1.4401, + "step": 30218 + }, + { + "epoch": 2.38, + "learning_rate": 3.073321308315227e-05, + "loss": 1.4419, + "step": 30219 + }, + { + "epoch": 2.38, + "learning_rate": 3.072571778080067e-05, + "loss": 1.4638, + "step": 30220 + }, + { + "epoch": 2.38, + "learning_rate": 3.0718223288255635e-05, + "loss": 1.4105, + "step": 30221 + }, + { + "epoch": 2.38, + "learning_rate": 3.071072960556804e-05, + "loss": 1.4225, + "step": 30222 + }, + { + "epoch": 2.38, + "learning_rate": 3.070323673278872e-05, + "loss": 1.4439, + "step": 30223 + }, + { + "epoch": 2.38, + "learning_rate": 3.0695744669968636e-05, + "loss": 1.4658, + "step": 30224 + }, + { + "epoch": 2.38, + "learning_rate": 3.068825341715861e-05, + "loss": 1.4463, + "step": 30225 + }, + { + "epoch": 2.38, + "learning_rate": 3.068076297440945e-05, + "loss": 1.41, + "step": 30226 + }, + { + "epoch": 2.38, + "learning_rate": 3.0673273341772105e-05, + "loss": 1.417, + "step": 30227 + }, + { + "epoch": 2.38, + "learning_rate": 3.066578451929739e-05, + "loss": 1.4746, + "step": 30228 + }, + { + "epoch": 2.38, + "learning_rate": 3.06582965070361e-05, + "loss": 1.4222, + "step": 30229 + }, + { + "epoch": 2.38, + "learning_rate": 3.065080930503912e-05, + "loss": 1.4422, + "step": 30230 + }, + { + "epoch": 2.38, + "learning_rate": 3.0643322913357327e-05, + "loss": 1.4936, + "step": 30231 + }, + { + "epoch": 2.38, + "learning_rate": 3.063583733204149e-05, + "loss": 1.4262, + "step": 30232 + }, + { + "epoch": 2.38, + "learning_rate": 3.062835256114242e-05, + "loss": 1.4622, + "step": 30233 + }, + { + "epoch": 2.38, + "learning_rate": 3.062086860071101e-05, + "loss": 1.4039, + "step": 30234 + }, + { + "epoch": 2.38, + "learning_rate": 3.061338545079801e-05, + "loss": 1.4578, + "step": 30235 + }, + { + "epoch": 2.38, + "learning_rate": 3.0605903111454194e-05, + "loss": 1.5228, + "step": 30236 + }, + { + "epoch": 2.38, + "learning_rate": 3.059842158273047e-05, + "loss": 1.4634, + "step": 30237 + }, + { + "epoch": 2.38, + "learning_rate": 3.0590940864677546e-05, + "loss": 1.485, + "step": 30238 + }, + { + "epoch": 2.38, + "learning_rate": 3.058346095734622e-05, + "loss": 1.4553, + "step": 30239 + }, + { + "epoch": 2.38, + "learning_rate": 3.057598186078732e-05, + "loss": 1.3955, + "step": 30240 + }, + { + "epoch": 2.38, + "learning_rate": 3.056850357505161e-05, + "loss": 1.3858, + "step": 30241 + }, + { + "epoch": 2.38, + "learning_rate": 3.056102610018985e-05, + "loss": 1.4939, + "step": 30242 + }, + { + "epoch": 2.38, + "learning_rate": 3.055354943625276e-05, + "loss": 1.4576, + "step": 30243 + }, + { + "epoch": 2.38, + "learning_rate": 3.0546073583291216e-05, + "loss": 1.4392, + "step": 30244 + }, + { + "epoch": 2.38, + "learning_rate": 3.0538598541355894e-05, + "loss": 1.4624, + "step": 30245 + }, + { + "epoch": 2.38, + "learning_rate": 3.053112431049752e-05, + "loss": 1.4493, + "step": 30246 + }, + { + "epoch": 2.38, + "learning_rate": 3.05236508907669e-05, + "loss": 1.4132, + "step": 30247 + }, + { + "epoch": 2.38, + "learning_rate": 3.051617828221478e-05, + "loss": 1.4583, + "step": 30248 + }, + { + "epoch": 2.38, + "learning_rate": 3.0508706484891893e-05, + "loss": 1.4189, + "step": 30249 + }, + { + "epoch": 2.38, + "learning_rate": 3.0501235498848898e-05, + "loss": 1.4466, + "step": 30250 + }, + { + "epoch": 2.38, + "learning_rate": 3.0493765324136605e-05, + "loss": 1.4313, + "step": 30251 + }, + { + "epoch": 2.38, + "learning_rate": 3.0486295960805707e-05, + "loss": 1.4079, + "step": 30252 + }, + { + "epoch": 2.38, + "learning_rate": 3.0478827408906847e-05, + "loss": 1.3629, + "step": 30253 + }, + { + "epoch": 2.38, + "learning_rate": 3.0471359668490852e-05, + "loss": 1.4312, + "step": 30254 + }, + { + "epoch": 2.38, + "learning_rate": 3.046389273960835e-05, + "loss": 1.4627, + "step": 30255 + }, + { + "epoch": 2.38, + "learning_rate": 3.0456426622310027e-05, + "loss": 1.4084, + "step": 30256 + }, + { + "epoch": 2.38, + "learning_rate": 3.044896131664663e-05, + "loss": 1.4497, + "step": 30257 + }, + { + "epoch": 2.38, + "learning_rate": 3.0441496822668802e-05, + "loss": 1.4871, + "step": 30258 + }, + { + "epoch": 2.38, + "learning_rate": 3.0434033140427238e-05, + "loss": 1.4195, + "step": 30259 + }, + { + "epoch": 2.38, + "learning_rate": 3.0426570269972577e-05, + "loss": 1.4159, + "step": 30260 + }, + { + "epoch": 2.38, + "learning_rate": 3.0419108211355547e-05, + "loss": 1.4809, + "step": 30261 + }, + { + "epoch": 2.38, + "learning_rate": 3.041164696462674e-05, + "loss": 1.4558, + "step": 30262 + }, + { + "epoch": 2.38, + "learning_rate": 3.04041865298369e-05, + "loss": 1.45, + "step": 30263 + }, + { + "epoch": 2.38, + "learning_rate": 3.03967269070366e-05, + "loss": 1.4377, + "step": 30264 + }, + { + "epoch": 2.38, + "learning_rate": 3.0389268096276553e-05, + "loss": 1.4573, + "step": 30265 + }, + { + "epoch": 2.38, + "learning_rate": 3.0381810097607383e-05, + "loss": 1.437, + "step": 30266 + }, + { + "epoch": 2.38, + "learning_rate": 3.0374352911079653e-05, + "loss": 1.4494, + "step": 30267 + }, + { + "epoch": 2.38, + "learning_rate": 3.0366896536744102e-05, + "loss": 1.3863, + "step": 30268 + }, + { + "epoch": 2.38, + "learning_rate": 3.0359440974651304e-05, + "loss": 1.4882, + "step": 30269 + }, + { + "epoch": 2.38, + "learning_rate": 3.0351986224851843e-05, + "loss": 1.4129, + "step": 30270 + }, + { + "epoch": 2.38, + "learning_rate": 3.0344532287396407e-05, + "loss": 1.4676, + "step": 30271 + }, + { + "epoch": 2.38, + "learning_rate": 3.0337079162335552e-05, + "loss": 1.4913, + "step": 30272 + }, + { + "epoch": 2.38, + "learning_rate": 3.0329626849719864e-05, + "loss": 1.3802, + "step": 30273 + }, + { + "epoch": 2.38, + "learning_rate": 3.032217534960001e-05, + "loss": 1.4182, + "step": 30274 + }, + { + "epoch": 2.38, + "learning_rate": 3.031472466202655e-05, + "loss": 1.4951, + "step": 30275 + }, + { + "epoch": 2.38, + "learning_rate": 3.030727478705005e-05, + "loss": 1.4778, + "step": 30276 + }, + { + "epoch": 2.38, + "learning_rate": 3.0299825724721033e-05, + "loss": 1.4363, + "step": 30277 + }, + { + "epoch": 2.38, + "learning_rate": 3.0292377475090208e-05, + "loss": 1.4555, + "step": 30278 + }, + { + "epoch": 2.38, + "learning_rate": 3.028493003820808e-05, + "loss": 1.4448, + "step": 30279 + }, + { + "epoch": 2.38, + "learning_rate": 3.0277483414125236e-05, + "loss": 1.4791, + "step": 30280 + }, + { + "epoch": 2.38, + "learning_rate": 3.0270037602892144e-05, + "loss": 1.4504, + "step": 30281 + }, + { + "epoch": 2.38, + "learning_rate": 3.0262592604559482e-05, + "loss": 1.474, + "step": 30282 + }, + { + "epoch": 2.38, + "learning_rate": 3.0255148419177726e-05, + "loss": 1.4662, + "step": 30283 + }, + { + "epoch": 2.38, + "learning_rate": 3.0247705046797404e-05, + "loss": 1.5009, + "step": 30284 + }, + { + "epoch": 2.38, + "learning_rate": 3.0240262487469123e-05, + "loss": 1.4718, + "step": 30285 + }, + { + "epoch": 2.38, + "learning_rate": 3.0232820741243365e-05, + "loss": 1.4593, + "step": 30286 + }, + { + "epoch": 2.38, + "learning_rate": 3.0225379808170614e-05, + "loss": 1.451, + "step": 30287 + }, + { + "epoch": 2.38, + "learning_rate": 3.0217939688301484e-05, + "loss": 1.4914, + "step": 30288 + }, + { + "epoch": 2.38, + "learning_rate": 3.0210500381686437e-05, + "loss": 1.5017, + "step": 30289 + }, + { + "epoch": 2.38, + "learning_rate": 3.0203061888375947e-05, + "loss": 1.4566, + "step": 30290 + }, + { + "epoch": 2.38, + "learning_rate": 3.0195624208420603e-05, + "loss": 1.4902, + "step": 30291 + }, + { + "epoch": 2.38, + "learning_rate": 3.0188187341870857e-05, + "loss": 1.4375, + "step": 30292 + }, + { + "epoch": 2.38, + "learning_rate": 3.018075128877716e-05, + "loss": 1.4194, + "step": 30293 + }, + { + "epoch": 2.38, + "learning_rate": 3.0173316049190044e-05, + "loss": 1.4392, + "step": 30294 + }, + { + "epoch": 2.38, + "learning_rate": 3.0165881623160015e-05, + "loss": 1.4657, + "step": 30295 + }, + { + "epoch": 2.38, + "learning_rate": 3.0158448010737536e-05, + "loss": 1.4202, + "step": 30296 + }, + { + "epoch": 2.38, + "learning_rate": 3.015101521197301e-05, + "loss": 1.4731, + "step": 30297 + }, + { + "epoch": 2.38, + "learning_rate": 3.014358322691699e-05, + "loss": 1.4498, + "step": 30298 + }, + { + "epoch": 2.38, + "learning_rate": 3.0136152055619893e-05, + "loss": 1.4217, + "step": 30299 + }, + { + "epoch": 2.38, + "learning_rate": 3.01287216981322e-05, + "loss": 1.456, + "step": 30300 + }, + { + "epoch": 2.38, + "learning_rate": 3.0121292154504272e-05, + "loss": 1.4692, + "step": 30301 + }, + { + "epoch": 2.38, + "learning_rate": 3.0113863424786666e-05, + "loss": 1.4788, + "step": 30302 + }, + { + "epoch": 2.38, + "learning_rate": 3.0106435509029775e-05, + "loss": 1.4352, + "step": 30303 + }, + { + "epoch": 2.38, + "learning_rate": 3.0099008407283974e-05, + "loss": 1.4876, + "step": 30304 + }, + { + "epoch": 2.38, + "learning_rate": 3.0091582119599794e-05, + "loss": 1.4741, + "step": 30305 + }, + { + "epoch": 2.38, + "learning_rate": 3.0084156646027576e-05, + "loss": 1.4598, + "step": 30306 + }, + { + "epoch": 2.38, + "learning_rate": 3.007673198661774e-05, + "loss": 1.4078, + "step": 30307 + }, + { + "epoch": 2.38, + "learning_rate": 3.0069308141420738e-05, + "loss": 1.484, + "step": 30308 + }, + { + "epoch": 2.38, + "learning_rate": 3.0061885110486927e-05, + "loss": 1.4521, + "step": 30309 + }, + { + "epoch": 2.38, + "learning_rate": 3.0054462893866765e-05, + "loss": 1.4681, + "step": 30310 + }, + { + "epoch": 2.38, + "learning_rate": 3.004704149161056e-05, + "loss": 1.4473, + "step": 30311 + }, + { + "epoch": 2.38, + "learning_rate": 3.0039620903768797e-05, + "loss": 1.4719, + "step": 30312 + }, + { + "epoch": 2.39, + "learning_rate": 3.0032201130391808e-05, + "loss": 1.4486, + "step": 30313 + }, + { + "epoch": 2.39, + "learning_rate": 3.0024782171529927e-05, + "loss": 1.5076, + "step": 30314 + }, + { + "epoch": 2.39, + "learning_rate": 3.0017364027233593e-05, + "loss": 1.465, + "step": 30315 + }, + { + "epoch": 2.39, + "learning_rate": 3.0009946697553165e-05, + "loss": 1.4656, + "step": 30316 + }, + { + "epoch": 2.39, + "learning_rate": 3.0002530182538976e-05, + "loss": 1.5076, + "step": 30317 + }, + { + "epoch": 2.39, + "learning_rate": 2.9995114482241344e-05, + "loss": 1.462, + "step": 30318 + }, + { + "epoch": 2.39, + "learning_rate": 2.99876995967107e-05, + "loss": 1.471, + "step": 30319 + }, + { + "epoch": 2.39, + "learning_rate": 2.9980285525997354e-05, + "loss": 1.5038, + "step": 30320 + }, + { + "epoch": 2.39, + "learning_rate": 2.99728722701516e-05, + "loss": 1.4427, + "step": 30321 + }, + { + "epoch": 2.39, + "learning_rate": 2.9965459829223843e-05, + "loss": 1.4357, + "step": 30322 + }, + { + "epoch": 2.39, + "learning_rate": 2.9958048203264378e-05, + "loss": 1.4744, + "step": 30323 + }, + { + "epoch": 2.39, + "learning_rate": 2.9950637392323468e-05, + "loss": 1.4726, + "step": 30324 + }, + { + "epoch": 2.39, + "learning_rate": 2.9943227396451486e-05, + "loss": 1.4229, + "step": 30325 + }, + { + "epoch": 2.39, + "learning_rate": 2.9935818215698775e-05, + "loss": 1.417, + "step": 30326 + }, + { + "epoch": 2.39, + "learning_rate": 2.9928409850115613e-05, + "loss": 1.4996, + "step": 30327 + }, + { + "epoch": 2.39, + "learning_rate": 2.9921002299752243e-05, + "loss": 1.4962, + "step": 30328 + }, + { + "epoch": 2.39, + "learning_rate": 2.991359556465904e-05, + "loss": 1.4539, + "step": 30329 + }, + { + "epoch": 2.39, + "learning_rate": 2.9906189644886252e-05, + "loss": 1.4527, + "step": 30330 + }, + { + "epoch": 2.39, + "learning_rate": 2.9898784540484116e-05, + "loss": 1.4056, + "step": 30331 + }, + { + "epoch": 2.39, + "learning_rate": 2.989138025150301e-05, + "loss": 1.4887, + "step": 30332 + }, + { + "epoch": 2.39, + "learning_rate": 2.9883976777993147e-05, + "loss": 1.4742, + "step": 30333 + }, + { + "epoch": 2.39, + "learning_rate": 2.9876574120004782e-05, + "loss": 1.4879, + "step": 30334 + }, + { + "epoch": 2.39, + "learning_rate": 2.986917227758816e-05, + "loss": 1.4542, + "step": 30335 + }, + { + "epoch": 2.39, + "learning_rate": 2.9861771250793608e-05, + "loss": 1.4774, + "step": 30336 + }, + { + "epoch": 2.39, + "learning_rate": 2.9854371039671338e-05, + "loss": 1.4016, + "step": 30337 + }, + { + "epoch": 2.39, + "learning_rate": 2.984697164427154e-05, + "loss": 1.4235, + "step": 30338 + }, + { + "epoch": 2.39, + "learning_rate": 2.9839573064644522e-05, + "loss": 1.465, + "step": 30339 + }, + { + "epoch": 2.39, + "learning_rate": 2.9832175300840482e-05, + "loss": 1.4616, + "step": 30340 + }, + { + "epoch": 2.39, + "learning_rate": 2.982477835290968e-05, + "loss": 1.5043, + "step": 30341 + }, + { + "epoch": 2.39, + "learning_rate": 2.981738222090227e-05, + "loss": 1.4862, + "step": 30342 + }, + { + "epoch": 2.39, + "learning_rate": 2.9809986904868566e-05, + "loss": 1.4828, + "step": 30343 + }, + { + "epoch": 2.39, + "learning_rate": 2.980259240485871e-05, + "loss": 1.4205, + "step": 30344 + }, + { + "epoch": 2.39, + "learning_rate": 2.9795198720922898e-05, + "loss": 1.4295, + "step": 30345 + }, + { + "epoch": 2.39, + "learning_rate": 2.9787805853111384e-05, + "loss": 1.5057, + "step": 30346 + }, + { + "epoch": 2.39, + "learning_rate": 2.9780413801474334e-05, + "loss": 1.4594, + "step": 30347 + }, + { + "epoch": 2.39, + "learning_rate": 2.977302256606187e-05, + "loss": 1.4487, + "step": 30348 + }, + { + "epoch": 2.39, + "learning_rate": 2.9765632146924305e-05, + "loss": 1.4079, + "step": 30349 + }, + { + "epoch": 2.39, + "learning_rate": 2.9758242544111733e-05, + "loss": 1.4711, + "step": 30350 + }, + { + "epoch": 2.39, + "learning_rate": 2.975085375767431e-05, + "loss": 1.4449, + "step": 30351 + }, + { + "epoch": 2.39, + "learning_rate": 2.9743465787662245e-05, + "loss": 1.4578, + "step": 30352 + }, + { + "epoch": 2.39, + "learning_rate": 2.9736078634125705e-05, + "loss": 1.442, + "step": 30353 + }, + { + "epoch": 2.39, + "learning_rate": 2.9728692297114825e-05, + "loss": 1.4858, + "step": 30354 + }, + { + "epoch": 2.39, + "learning_rate": 2.9721306776679705e-05, + "loss": 1.5023, + "step": 30355 + }, + { + "epoch": 2.39, + "learning_rate": 2.971392207287055e-05, + "loss": 1.4644, + "step": 30356 + }, + { + "epoch": 2.39, + "learning_rate": 2.9706538185737505e-05, + "loss": 1.415, + "step": 30357 + }, + { + "epoch": 2.39, + "learning_rate": 2.9699155115330697e-05, + "loss": 1.4656, + "step": 30358 + }, + { + "epoch": 2.39, + "learning_rate": 2.9691772861700203e-05, + "loss": 1.4601, + "step": 30359 + }, + { + "epoch": 2.39, + "learning_rate": 2.9684391424896197e-05, + "loss": 1.4508, + "step": 30360 + }, + { + "epoch": 2.39, + "learning_rate": 2.9677010804968794e-05, + "loss": 1.4218, + "step": 30361 + }, + { + "epoch": 2.39, + "learning_rate": 2.9669631001968047e-05, + "loss": 1.5003, + "step": 30362 + }, + { + "epoch": 2.39, + "learning_rate": 2.966225201594414e-05, + "loss": 1.4119, + "step": 30363 + }, + { + "epoch": 2.39, + "learning_rate": 2.9654873846947142e-05, + "loss": 1.4726, + "step": 30364 + }, + { + "epoch": 2.39, + "learning_rate": 2.9647496495027084e-05, + "loss": 1.4519, + "step": 30365 + }, + { + "epoch": 2.39, + "learning_rate": 2.964011996023416e-05, + "loss": 1.4684, + "step": 30366 + }, + { + "epoch": 2.39, + "learning_rate": 2.9632744242618394e-05, + "loss": 1.4803, + "step": 30367 + }, + { + "epoch": 2.39, + "learning_rate": 2.9625369342229833e-05, + "loss": 1.4258, + "step": 30368 + }, + { + "epoch": 2.39, + "learning_rate": 2.9617995259118617e-05, + "loss": 1.499, + "step": 30369 + }, + { + "epoch": 2.39, + "learning_rate": 2.9610621993334787e-05, + "loss": 1.4105, + "step": 30370 + }, + { + "epoch": 2.39, + "learning_rate": 2.960324954492841e-05, + "loss": 1.4532, + "step": 30371 + }, + { + "epoch": 2.39, + "learning_rate": 2.959587791394944e-05, + "loss": 1.4305, + "step": 30372 + }, + { + "epoch": 2.39, + "learning_rate": 2.9588507100448088e-05, + "loss": 1.4619, + "step": 30373 + }, + { + "epoch": 2.39, + "learning_rate": 2.9581137104474333e-05, + "loss": 1.4742, + "step": 30374 + }, + { + "epoch": 2.39, + "learning_rate": 2.9573767926078202e-05, + "loss": 1.4655, + "step": 30375 + }, + { + "epoch": 2.39, + "learning_rate": 2.9566399565309683e-05, + "loss": 1.4397, + "step": 30376 + }, + { + "epoch": 2.39, + "learning_rate": 2.9559032022218894e-05, + "loss": 1.4046, + "step": 30377 + }, + { + "epoch": 2.39, + "learning_rate": 2.955166529685582e-05, + "loss": 1.4366, + "step": 30378 + }, + { + "epoch": 2.39, + "learning_rate": 2.9544299389270425e-05, + "loss": 1.4539, + "step": 30379 + }, + { + "epoch": 2.39, + "learning_rate": 2.9536934299512803e-05, + "loss": 1.4591, + "step": 30380 + }, + { + "epoch": 2.39, + "learning_rate": 2.9529570027632916e-05, + "loss": 1.4394, + "step": 30381 + }, + { + "epoch": 2.39, + "learning_rate": 2.9522206573680734e-05, + "loss": 1.4477, + "step": 30382 + }, + { + "epoch": 2.39, + "learning_rate": 2.951484393770632e-05, + "loss": 1.4166, + "step": 30383 + }, + { + "epoch": 2.39, + "learning_rate": 2.9507482119759623e-05, + "loss": 1.4958, + "step": 30384 + }, + { + "epoch": 2.39, + "learning_rate": 2.9500121119890595e-05, + "loss": 1.4515, + "step": 30385 + }, + { + "epoch": 2.39, + "learning_rate": 2.9492760938149285e-05, + "loss": 1.4773, + "step": 30386 + }, + { + "epoch": 2.39, + "learning_rate": 2.94854015745856e-05, + "loss": 1.5034, + "step": 30387 + }, + { + "epoch": 2.39, + "learning_rate": 2.9478043029249564e-05, + "loss": 1.4508, + "step": 30388 + }, + { + "epoch": 2.39, + "learning_rate": 2.947068530219106e-05, + "loss": 1.4869, + "step": 30389 + }, + { + "epoch": 2.39, + "learning_rate": 2.946332839346013e-05, + "loss": 1.4703, + "step": 30390 + }, + { + "epoch": 2.39, + "learning_rate": 2.9455972303106695e-05, + "loss": 1.457, + "step": 30391 + }, + { + "epoch": 2.39, + "learning_rate": 2.944861703118067e-05, + "loss": 1.4807, + "step": 30392 + }, + { + "epoch": 2.39, + "learning_rate": 2.9441262577731983e-05, + "loss": 1.4944, + "step": 30393 + }, + { + "epoch": 2.39, + "learning_rate": 2.9433908942810623e-05, + "loss": 1.3712, + "step": 30394 + }, + { + "epoch": 2.39, + "learning_rate": 2.9426556126466488e-05, + "loss": 1.4736, + "step": 30395 + }, + { + "epoch": 2.39, + "learning_rate": 2.9419204128749468e-05, + "loss": 1.4167, + "step": 30396 + }, + { + "epoch": 2.39, + "learning_rate": 2.941185294970954e-05, + "loss": 1.4488, + "step": 30397 + }, + { + "epoch": 2.39, + "learning_rate": 2.9404502589396582e-05, + "loss": 1.3992, + "step": 30398 + }, + { + "epoch": 2.39, + "learning_rate": 2.9397153047860474e-05, + "loss": 1.4851, + "step": 30399 + }, + { + "epoch": 2.39, + "learning_rate": 2.9389804325151183e-05, + "loss": 1.4448, + "step": 30400 + }, + { + "epoch": 2.39, + "learning_rate": 2.9382456421318547e-05, + "loss": 1.4898, + "step": 30401 + }, + { + "epoch": 2.39, + "learning_rate": 2.937510933641245e-05, + "loss": 1.4665, + "step": 30402 + }, + { + "epoch": 2.39, + "learning_rate": 2.9367763070482776e-05, + "loss": 1.4315, + "step": 30403 + }, + { + "epoch": 2.39, + "learning_rate": 2.9360417623579463e-05, + "loss": 1.4354, + "step": 30404 + }, + { + "epoch": 2.39, + "learning_rate": 2.935307299575234e-05, + "loss": 1.4252, + "step": 30405 + }, + { + "epoch": 2.39, + "learning_rate": 2.9345729187051253e-05, + "loss": 1.4477, + "step": 30406 + }, + { + "epoch": 2.39, + "learning_rate": 2.9338386197526093e-05, + "loss": 1.4618, + "step": 30407 + }, + { + "epoch": 2.39, + "learning_rate": 2.933104402722672e-05, + "loss": 1.4468, + "step": 30408 + }, + { + "epoch": 2.39, + "learning_rate": 2.9323702676202926e-05, + "loss": 1.4602, + "step": 30409 + }, + { + "epoch": 2.39, + "learning_rate": 2.931636214450464e-05, + "loss": 1.403, + "step": 30410 + }, + { + "epoch": 2.39, + "learning_rate": 2.9309022432181655e-05, + "loss": 1.4758, + "step": 30411 + }, + { + "epoch": 2.39, + "learning_rate": 2.9301683539283798e-05, + "loss": 1.5021, + "step": 30412 + }, + { + "epoch": 2.39, + "learning_rate": 2.9294345465860862e-05, + "loss": 1.394, + "step": 30413 + }, + { + "epoch": 2.39, + "learning_rate": 2.928700821196276e-05, + "loss": 1.4836, + "step": 30414 + }, + { + "epoch": 2.39, + "learning_rate": 2.9279671777639245e-05, + "loss": 1.4266, + "step": 30415 + }, + { + "epoch": 2.39, + "learning_rate": 2.9272336162940102e-05, + "loss": 1.472, + "step": 30416 + }, + { + "epoch": 2.39, + "learning_rate": 2.926500136791522e-05, + "loss": 1.4872, + "step": 30417 + }, + { + "epoch": 2.39, + "learning_rate": 2.925766739261436e-05, + "loss": 1.4317, + "step": 30418 + }, + { + "epoch": 2.39, + "learning_rate": 2.9250334237087246e-05, + "loss": 1.4295, + "step": 30419 + }, + { + "epoch": 2.39, + "learning_rate": 2.9243001901383745e-05, + "loss": 1.4646, + "step": 30420 + }, + { + "epoch": 2.39, + "learning_rate": 2.9235670385553646e-05, + "loss": 1.4878, + "step": 30421 + }, + { + "epoch": 2.39, + "learning_rate": 2.9228339689646707e-05, + "loss": 1.4529, + "step": 30422 + }, + { + "epoch": 2.39, + "learning_rate": 2.9221009813712658e-05, + "loss": 1.4278, + "step": 30423 + }, + { + "epoch": 2.39, + "learning_rate": 2.9213680757801343e-05, + "loss": 1.407, + "step": 30424 + }, + { + "epoch": 2.39, + "learning_rate": 2.920635252196249e-05, + "loss": 1.4624, + "step": 30425 + }, + { + "epoch": 2.39, + "learning_rate": 2.9199025106245787e-05, + "loss": 1.5043, + "step": 30426 + }, + { + "epoch": 2.39, + "learning_rate": 2.9191698510701085e-05, + "loss": 1.4696, + "step": 30427 + }, + { + "epoch": 2.39, + "learning_rate": 2.918437273537807e-05, + "loss": 1.452, + "step": 30428 + }, + { + "epoch": 2.39, + "learning_rate": 2.9177047780326508e-05, + "loss": 1.444, + "step": 30429 + }, + { + "epoch": 2.39, + "learning_rate": 2.916972364559607e-05, + "loss": 1.4765, + "step": 30430 + }, + { + "epoch": 2.39, + "learning_rate": 2.9162400331236575e-05, + "loss": 1.4924, + "step": 30431 + }, + { + "epoch": 2.39, + "learning_rate": 2.915507783729769e-05, + "loss": 1.4272, + "step": 30432 + }, + { + "epoch": 2.39, + "learning_rate": 2.9147756163829117e-05, + "loss": 1.4844, + "step": 30433 + }, + { + "epoch": 2.39, + "learning_rate": 2.914043531088061e-05, + "loss": 1.4766, + "step": 30434 + }, + { + "epoch": 2.39, + "learning_rate": 2.9133115278501816e-05, + "loss": 1.445, + "step": 30435 + }, + { + "epoch": 2.39, + "learning_rate": 2.9125796066742514e-05, + "loss": 1.4372, + "step": 30436 + }, + { + "epoch": 2.39, + "learning_rate": 2.9118477675652306e-05, + "loss": 1.468, + "step": 30437 + }, + { + "epoch": 2.39, + "learning_rate": 2.911116010528096e-05, + "loss": 1.4169, + "step": 30438 + }, + { + "epoch": 2.39, + "learning_rate": 2.9103843355678135e-05, + "loss": 1.4857, + "step": 30439 + }, + { + "epoch": 2.4, + "learning_rate": 2.9096527426893457e-05, + "loss": 1.42, + "step": 30440 + }, + { + "epoch": 2.4, + "learning_rate": 2.9089212318976686e-05, + "loss": 1.432, + "step": 30441 + }, + { + "epoch": 2.4, + "learning_rate": 2.9081898031977413e-05, + "loss": 1.4483, + "step": 30442 + }, + { + "epoch": 2.4, + "learning_rate": 2.90745845659453e-05, + "loss": 1.4399, + "step": 30443 + }, + { + "epoch": 2.4, + "learning_rate": 2.906727192093008e-05, + "loss": 1.4255, + "step": 30444 + }, + { + "epoch": 2.4, + "learning_rate": 2.9059960096981322e-05, + "loss": 1.4511, + "step": 30445 + }, + { + "epoch": 2.4, + "learning_rate": 2.9052649094148706e-05, + "loss": 1.4347, + "step": 30446 + }, + { + "epoch": 2.4, + "learning_rate": 2.9045338912481826e-05, + "loss": 1.4778, + "step": 30447 + }, + { + "epoch": 2.4, + "learning_rate": 2.9038029552030374e-05, + "loss": 1.4277, + "step": 30448 + }, + { + "epoch": 2.4, + "learning_rate": 2.903072101284396e-05, + "loss": 1.4676, + "step": 30449 + }, + { + "epoch": 2.4, + "learning_rate": 2.9023413294972115e-05, + "loss": 1.4551, + "step": 30450 + }, + { + "epoch": 2.4, + "learning_rate": 2.9016106398464595e-05, + "loss": 1.4734, + "step": 30451 + }, + { + "epoch": 2.4, + "learning_rate": 2.900880032337096e-05, + "loss": 1.4808, + "step": 30452 + }, + { + "epoch": 2.4, + "learning_rate": 2.900149506974081e-05, + "loss": 1.4703, + "step": 30453 + }, + { + "epoch": 2.4, + "learning_rate": 2.8994190637623682e-05, + "loss": 1.4732, + "step": 30454 + }, + { + "epoch": 2.4, + "learning_rate": 2.8986887027069272e-05, + "loss": 1.4564, + "step": 30455 + }, + { + "epoch": 2.4, + "learning_rate": 2.8979584238127124e-05, + "loss": 1.419, + "step": 30456 + }, + { + "epoch": 2.4, + "learning_rate": 2.8972282270846765e-05, + "loss": 1.4336, + "step": 30457 + }, + { + "epoch": 2.4, + "learning_rate": 2.8964981125277853e-05, + "loss": 1.5459, + "step": 30458 + }, + { + "epoch": 2.4, + "learning_rate": 2.8957680801469935e-05, + "loss": 1.4307, + "step": 30459 + }, + { + "epoch": 2.4, + "learning_rate": 2.8950381299472535e-05, + "loss": 1.4369, + "step": 30460 + }, + { + "epoch": 2.4, + "learning_rate": 2.8943082619335283e-05, + "loss": 1.4691, + "step": 30461 + }, + { + "epoch": 2.4, + "learning_rate": 2.893578476110769e-05, + "loss": 1.4393, + "step": 30462 + }, + { + "epoch": 2.4, + "learning_rate": 2.892848772483926e-05, + "loss": 1.4364, + "step": 30463 + }, + { + "epoch": 2.4, + "learning_rate": 2.8921191510579645e-05, + "loss": 1.4459, + "step": 30464 + }, + { + "epoch": 2.4, + "learning_rate": 2.8913896118378316e-05, + "loss": 1.4608, + "step": 30465 + }, + { + "epoch": 2.4, + "learning_rate": 2.890660154828477e-05, + "loss": 1.4085, + "step": 30466 + }, + { + "epoch": 2.4, + "learning_rate": 2.8899307800348566e-05, + "loss": 1.4375, + "step": 30467 + }, + { + "epoch": 2.4, + "learning_rate": 2.8892014874619295e-05, + "loss": 1.4838, + "step": 30468 + }, + { + "epoch": 2.4, + "learning_rate": 2.888472277114639e-05, + "loss": 1.4423, + "step": 30469 + }, + { + "epoch": 2.4, + "learning_rate": 2.8877431489979392e-05, + "loss": 1.4215, + "step": 30470 + }, + { + "epoch": 2.4, + "learning_rate": 2.887014103116774e-05, + "loss": 1.4981, + "step": 30471 + }, + { + "epoch": 2.4, + "learning_rate": 2.8862851394761037e-05, + "loss": 1.4463, + "step": 30472 + }, + { + "epoch": 2.4, + "learning_rate": 2.885556258080872e-05, + "loss": 1.4208, + "step": 30473 + }, + { + "epoch": 2.4, + "learning_rate": 2.8848274589360238e-05, + "loss": 1.3823, + "step": 30474 + }, + { + "epoch": 2.4, + "learning_rate": 2.884098742046516e-05, + "loss": 1.4379, + "step": 30475 + }, + { + "epoch": 2.4, + "learning_rate": 2.8833701074172904e-05, + "loss": 1.4511, + "step": 30476 + }, + { + "epoch": 2.4, + "learning_rate": 2.8826415550532927e-05, + "loss": 1.4458, + "step": 30477 + }, + { + "epoch": 2.4, + "learning_rate": 2.8819130849594756e-05, + "loss": 1.442, + "step": 30478 + }, + { + "epoch": 2.4, + "learning_rate": 2.881184697140782e-05, + "loss": 1.4266, + "step": 30479 + }, + { + "epoch": 2.4, + "learning_rate": 2.880456391602151e-05, + "loss": 1.4637, + "step": 30480 + }, + { + "epoch": 2.4, + "learning_rate": 2.8797281683485374e-05, + "loss": 1.4477, + "step": 30481 + }, + { + "epoch": 2.4, + "learning_rate": 2.8790000273848785e-05, + "loss": 1.4572, + "step": 30482 + }, + { + "epoch": 2.4, + "learning_rate": 2.878271968716122e-05, + "loss": 1.5263, + "step": 30483 + }, + { + "epoch": 2.4, + "learning_rate": 2.8775439923472076e-05, + "loss": 1.4583, + "step": 30484 + }, + { + "epoch": 2.4, + "learning_rate": 2.876816098283083e-05, + "loss": 1.479, + "step": 30485 + }, + { + "epoch": 2.4, + "learning_rate": 2.876088286528687e-05, + "loss": 1.4508, + "step": 30486 + }, + { + "epoch": 2.4, + "learning_rate": 2.8753605570889614e-05, + "loss": 1.4229, + "step": 30487 + }, + { + "epoch": 2.4, + "learning_rate": 2.874632909968842e-05, + "loss": 1.458, + "step": 30488 + }, + { + "epoch": 2.4, + "learning_rate": 2.873905345173278e-05, + "loss": 1.4481, + "step": 30489 + }, + { + "epoch": 2.4, + "learning_rate": 2.8731778627072055e-05, + "loss": 1.4789, + "step": 30490 + }, + { + "epoch": 2.4, + "learning_rate": 2.8724504625755588e-05, + "loss": 1.4518, + "step": 30491 + }, + { + "epoch": 2.4, + "learning_rate": 2.8717231447832846e-05, + "loss": 1.4539, + "step": 30492 + }, + { + "epoch": 2.4, + "learning_rate": 2.870995909335318e-05, + "loss": 1.4156, + "step": 30493 + }, + { + "epoch": 2.4, + "learning_rate": 2.8702687562365906e-05, + "loss": 1.453, + "step": 30494 + }, + { + "epoch": 2.4, + "learning_rate": 2.86954168549205e-05, + "loss": 1.4189, + "step": 30495 + }, + { + "epoch": 2.4, + "learning_rate": 2.8688146971066272e-05, + "loss": 1.4562, + "step": 30496 + }, + { + "epoch": 2.4, + "learning_rate": 2.8680877910852535e-05, + "loss": 1.471, + "step": 30497 + }, + { + "epoch": 2.4, + "learning_rate": 2.867360967432868e-05, + "loss": 1.453, + "step": 30498 + }, + { + "epoch": 2.4, + "learning_rate": 2.8666342261544118e-05, + "loss": 1.4446, + "step": 30499 + }, + { + "epoch": 2.4, + "learning_rate": 2.8659075672548127e-05, + "loss": 1.4464, + "step": 30500 + }, + { + "epoch": 2.4, + "learning_rate": 2.865180990739e-05, + "loss": 1.4788, + "step": 30501 + }, + { + "epoch": 2.4, + "learning_rate": 2.8644544966119166e-05, + "loss": 1.4331, + "step": 30502 + }, + { + "epoch": 2.4, + "learning_rate": 2.8637280848784916e-05, + "loss": 1.4372, + "step": 30503 + }, + { + "epoch": 2.4, + "learning_rate": 2.863001755543653e-05, + "loss": 1.4687, + "step": 30504 + }, + { + "epoch": 2.4, + "learning_rate": 2.8622755086123332e-05, + "loss": 1.4894, + "step": 30505 + }, + { + "epoch": 2.4, + "learning_rate": 2.861549344089467e-05, + "loss": 1.4275, + "step": 30506 + }, + { + "epoch": 2.4, + "learning_rate": 2.860823261979982e-05, + "loss": 1.446, + "step": 30507 + }, + { + "epoch": 2.4, + "learning_rate": 2.860097262288806e-05, + "loss": 1.4142, + "step": 30508 + }, + { + "epoch": 2.4, + "learning_rate": 2.8593713450208727e-05, + "loss": 1.4364, + "step": 30509 + }, + { + "epoch": 2.4, + "learning_rate": 2.858645510181109e-05, + "loss": 1.4162, + "step": 30510 + }, + { + "epoch": 2.4, + "learning_rate": 2.8579197577744372e-05, + "loss": 1.486, + "step": 30511 + }, + { + "epoch": 2.4, + "learning_rate": 2.8571940878057937e-05, + "loss": 1.4476, + "step": 30512 + }, + { + "epoch": 2.4, + "learning_rate": 2.8564685002800975e-05, + "loss": 1.442, + "step": 30513 + }, + { + "epoch": 2.4, + "learning_rate": 2.855742995202283e-05, + "loss": 1.4858, + "step": 30514 + }, + { + "epoch": 2.4, + "learning_rate": 2.8550175725772684e-05, + "loss": 1.4549, + "step": 30515 + }, + { + "epoch": 2.4, + "learning_rate": 2.854292232409986e-05, + "loss": 1.4175, + "step": 30516 + }, + { + "epoch": 2.4, + "learning_rate": 2.853566974705357e-05, + "loss": 1.4777, + "step": 30517 + }, + { + "epoch": 2.4, + "learning_rate": 2.8528417994683007e-05, + "loss": 1.4558, + "step": 30518 + }, + { + "epoch": 2.4, + "learning_rate": 2.8521167067037498e-05, + "loss": 1.4438, + "step": 30519 + }, + { + "epoch": 2.4, + "learning_rate": 2.8513916964166222e-05, + "loss": 1.5148, + "step": 30520 + }, + { + "epoch": 2.4, + "learning_rate": 2.8506667686118374e-05, + "loss": 1.4831, + "step": 30521 + }, + { + "epoch": 2.4, + "learning_rate": 2.8499419232943245e-05, + "loss": 1.4011, + "step": 30522 + }, + { + "epoch": 2.4, + "learning_rate": 2.8492171604690013e-05, + "loss": 1.4635, + "step": 30523 + }, + { + "epoch": 2.4, + "learning_rate": 2.848492480140787e-05, + "loss": 1.4385, + "step": 30524 + }, + { + "epoch": 2.4, + "learning_rate": 2.8477678823145998e-05, + "loss": 1.4525, + "step": 30525 + }, + { + "epoch": 2.4, + "learning_rate": 2.8470433669953657e-05, + "loss": 1.4055, + "step": 30526 + }, + { + "epoch": 2.4, + "learning_rate": 2.8463189341880023e-05, + "loss": 1.444, + "step": 30527 + }, + { + "epoch": 2.4, + "learning_rate": 2.8455945838974204e-05, + "loss": 1.4774, + "step": 30528 + }, + { + "epoch": 2.4, + "learning_rate": 2.8448703161285464e-05, + "loss": 1.4484, + "step": 30529 + }, + { + "epoch": 2.4, + "learning_rate": 2.8441461308862963e-05, + "loss": 1.3987, + "step": 30530 + }, + { + "epoch": 2.4, + "learning_rate": 2.8434220281755875e-05, + "loss": 1.4434, + "step": 30531 + }, + { + "epoch": 2.4, + "learning_rate": 2.84269800800133e-05, + "loss": 1.475, + "step": 30532 + }, + { + "epoch": 2.4, + "learning_rate": 2.8419740703684497e-05, + "loss": 1.5044, + "step": 30533 + }, + { + "epoch": 2.4, + "learning_rate": 2.841250215281854e-05, + "loss": 1.4209, + "step": 30534 + }, + { + "epoch": 2.4, + "learning_rate": 2.8405264427464557e-05, + "loss": 1.4228, + "step": 30535 + }, + { + "epoch": 2.4, + "learning_rate": 2.839802752767178e-05, + "loss": 1.4673, + "step": 30536 + }, + { + "epoch": 2.4, + "learning_rate": 2.839079145348928e-05, + "loss": 1.3593, + "step": 30537 + }, + { + "epoch": 2.4, + "learning_rate": 2.8383556204966174e-05, + "loss": 1.4354, + "step": 30538 + }, + { + "epoch": 2.4, + "learning_rate": 2.8376321782151635e-05, + "loss": 1.4433, + "step": 30539 + }, + { + "epoch": 2.4, + "learning_rate": 2.836908818509474e-05, + "loss": 1.4584, + "step": 30540 + }, + { + "epoch": 2.4, + "learning_rate": 2.8361855413844635e-05, + "loss": 1.4833, + "step": 30541 + }, + { + "epoch": 2.4, + "learning_rate": 2.8354623468450366e-05, + "loss": 1.4343, + "step": 30542 + }, + { + "epoch": 2.4, + "learning_rate": 2.8347392348961105e-05, + "loss": 1.4862, + "step": 30543 + }, + { + "epoch": 2.4, + "learning_rate": 2.834016205542592e-05, + "loss": 1.4772, + "step": 30544 + }, + { + "epoch": 2.4, + "learning_rate": 2.8332932587893848e-05, + "loss": 1.5024, + "step": 30545 + }, + { + "epoch": 2.4, + "learning_rate": 2.8325703946414036e-05, + "loss": 1.4586, + "step": 30546 + }, + { + "epoch": 2.4, + "learning_rate": 2.8318476131035578e-05, + "loss": 1.454, + "step": 30547 + }, + { + "epoch": 2.4, + "learning_rate": 2.8311249141807534e-05, + "loss": 1.4553, + "step": 30548 + }, + { + "epoch": 2.4, + "learning_rate": 2.8304022978778902e-05, + "loss": 1.4515, + "step": 30549 + }, + { + "epoch": 2.4, + "learning_rate": 2.8296797641998836e-05, + "loss": 1.4373, + "step": 30550 + }, + { + "epoch": 2.4, + "learning_rate": 2.8289573131516353e-05, + "loss": 1.4829, + "step": 30551 + }, + { + "epoch": 2.4, + "learning_rate": 2.828234944738046e-05, + "loss": 1.4328, + "step": 30552 + }, + { + "epoch": 2.4, + "learning_rate": 2.82751265896403e-05, + "loss": 1.4444, + "step": 30553 + }, + { + "epoch": 2.4, + "learning_rate": 2.826790455834484e-05, + "loss": 1.4649, + "step": 30554 + }, + { + "epoch": 2.4, + "learning_rate": 2.82606833535431e-05, + "loss": 1.4138, + "step": 30555 + }, + { + "epoch": 2.4, + "learning_rate": 2.825346297528418e-05, + "loss": 1.4992, + "step": 30556 + }, + { + "epoch": 2.4, + "learning_rate": 2.8246243423617055e-05, + "loss": 1.4769, + "step": 30557 + }, + { + "epoch": 2.4, + "learning_rate": 2.823902469859075e-05, + "loss": 1.4317, + "step": 30558 + }, + { + "epoch": 2.4, + "learning_rate": 2.823180680025423e-05, + "loss": 1.4547, + "step": 30559 + }, + { + "epoch": 2.4, + "learning_rate": 2.8224589728656556e-05, + "loss": 1.4087, + "step": 30560 + }, + { + "epoch": 2.4, + "learning_rate": 2.821737348384675e-05, + "loss": 1.4519, + "step": 30561 + }, + { + "epoch": 2.4, + "learning_rate": 2.8210158065873727e-05, + "loss": 1.4751, + "step": 30562 + }, + { + "epoch": 2.4, + "learning_rate": 2.8202943474786566e-05, + "loss": 1.4652, + "step": 30563 + }, + { + "epoch": 2.4, + "learning_rate": 2.8195729710634206e-05, + "loss": 1.4019, + "step": 30564 + }, + { + "epoch": 2.4, + "learning_rate": 2.8188516773465632e-05, + "loss": 1.4359, + "step": 30565 + }, + { + "epoch": 2.4, + "learning_rate": 2.818130466332976e-05, + "loss": 1.4799, + "step": 30566 + }, + { + "epoch": 2.41, + "learning_rate": 2.8174093380275648e-05, + "loss": 1.4196, + "step": 30567 + }, + { + "epoch": 2.41, + "learning_rate": 2.8166882924352212e-05, + "loss": 1.3812, + "step": 30568 + }, + { + "epoch": 2.41, + "learning_rate": 2.8159673295608353e-05, + "loss": 1.4665, + "step": 30569 + }, + { + "epoch": 2.41, + "learning_rate": 2.815246449409313e-05, + "loss": 1.4208, + "step": 30570 + }, + { + "epoch": 2.41, + "learning_rate": 2.8145256519855436e-05, + "loss": 1.5145, + "step": 30571 + }, + { + "epoch": 2.41, + "learning_rate": 2.8138049372944166e-05, + "loss": 1.4498, + "step": 30572 + }, + { + "epoch": 2.41, + "learning_rate": 2.8130843053408313e-05, + "loss": 1.4786, + "step": 30573 + }, + { + "epoch": 2.41, + "learning_rate": 2.812363756129681e-05, + "loss": 1.4135, + "step": 30574 + }, + { + "epoch": 2.41, + "learning_rate": 2.811643289665849e-05, + "loss": 1.4134, + "step": 30575 + }, + { + "epoch": 2.41, + "learning_rate": 2.8109229059542328e-05, + "loss": 1.4274, + "step": 30576 + }, + { + "epoch": 2.41, + "learning_rate": 2.810202604999729e-05, + "loss": 1.465, + "step": 30577 + }, + { + "epoch": 2.41, + "learning_rate": 2.8094823868072226e-05, + "loss": 1.4196, + "step": 30578 + }, + { + "epoch": 2.41, + "learning_rate": 2.8087622513815978e-05, + "loss": 1.4506, + "step": 30579 + }, + { + "epoch": 2.41, + "learning_rate": 2.8080421987277558e-05, + "loss": 1.5027, + "step": 30580 + }, + { + "epoch": 2.41, + "learning_rate": 2.8073222288505776e-05, + "loss": 1.489, + "step": 30581 + }, + { + "epoch": 2.41, + "learning_rate": 2.8066023417549528e-05, + "loss": 1.4914, + "step": 30582 + }, + { + "epoch": 2.41, + "learning_rate": 2.8058825374457672e-05, + "loss": 1.4544, + "step": 30583 + }, + { + "epoch": 2.41, + "learning_rate": 2.8051628159279122e-05, + "loss": 1.4387, + "step": 30584 + }, + { + "epoch": 2.41, + "learning_rate": 2.804443177206272e-05, + "loss": 1.4111, + "step": 30585 + }, + { + "epoch": 2.41, + "learning_rate": 2.8037236212857294e-05, + "loss": 1.455, + "step": 30586 + }, + { + "epoch": 2.41, + "learning_rate": 2.8030041481711757e-05, + "loss": 1.4562, + "step": 30587 + }, + { + "epoch": 2.41, + "learning_rate": 2.8022847578674933e-05, + "loss": 1.5018, + "step": 30588 + }, + { + "epoch": 2.41, + "learning_rate": 2.801565450379564e-05, + "loss": 1.4402, + "step": 30589 + }, + { + "epoch": 2.41, + "learning_rate": 2.800846225712276e-05, + "loss": 1.4319, + "step": 30590 + }, + { + "epoch": 2.41, + "learning_rate": 2.80012708387051e-05, + "loss": 1.4177, + "step": 30591 + }, + { + "epoch": 2.41, + "learning_rate": 2.799408024859146e-05, + "loss": 1.447, + "step": 30592 + }, + { + "epoch": 2.41, + "learning_rate": 2.7986890486830676e-05, + "loss": 1.4312, + "step": 30593 + }, + { + "epoch": 2.41, + "learning_rate": 2.7979701553471608e-05, + "loss": 1.4533, + "step": 30594 + }, + { + "epoch": 2.41, + "learning_rate": 2.7972513448563044e-05, + "loss": 1.4842, + "step": 30595 + }, + { + "epoch": 2.41, + "learning_rate": 2.796532617215372e-05, + "loss": 1.458, + "step": 30596 + }, + { + "epoch": 2.41, + "learning_rate": 2.795813972429254e-05, + "loss": 1.4564, + "step": 30597 + }, + { + "epoch": 2.41, + "learning_rate": 2.7950954105028235e-05, + "loss": 1.4773, + "step": 30598 + }, + { + "epoch": 2.41, + "learning_rate": 2.7943769314409597e-05, + "loss": 1.4494, + "step": 30599 + }, + { + "epoch": 2.41, + "learning_rate": 2.7936585352485373e-05, + "loss": 1.4611, + "step": 30600 + }, + { + "epoch": 2.41, + "learning_rate": 2.792940221930441e-05, + "loss": 1.442, + "step": 30601 + }, + { + "epoch": 2.41, + "learning_rate": 2.7922219914915445e-05, + "loss": 1.4758, + "step": 30602 + }, + { + "epoch": 2.41, + "learning_rate": 2.7915038439367194e-05, + "loss": 1.4665, + "step": 30603 + }, + { + "epoch": 2.41, + "learning_rate": 2.79078577927085e-05, + "loss": 1.5173, + "step": 30604 + }, + { + "epoch": 2.41, + "learning_rate": 2.7900677974988088e-05, + "loss": 1.4482, + "step": 30605 + }, + { + "epoch": 2.41, + "learning_rate": 2.789349898625464e-05, + "loss": 1.4369, + "step": 30606 + }, + { + "epoch": 2.41, + "learning_rate": 2.788632082655695e-05, + "loss": 1.4699, + "step": 30607 + }, + { + "epoch": 2.41, + "learning_rate": 2.787914349594381e-05, + "loss": 1.4669, + "step": 30608 + }, + { + "epoch": 2.41, + "learning_rate": 2.7871966994463884e-05, + "loss": 1.4615, + "step": 30609 + }, + { + "epoch": 2.41, + "learning_rate": 2.7864791322165864e-05, + "loss": 1.4755, + "step": 30610 + }, + { + "epoch": 2.41, + "learning_rate": 2.7857616479098545e-05, + "loss": 1.4699, + "step": 30611 + }, + { + "epoch": 2.41, + "learning_rate": 2.785044246531062e-05, + "loss": 1.4649, + "step": 30612 + }, + { + "epoch": 2.41, + "learning_rate": 2.784326928085073e-05, + "loss": 1.4734, + "step": 30613 + }, + { + "epoch": 2.41, + "learning_rate": 2.783609692576768e-05, + "loss": 1.4047, + "step": 30614 + }, + { + "epoch": 2.41, + "learning_rate": 2.782892540011011e-05, + "loss": 1.4708, + "step": 30615 + }, + { + "epoch": 2.41, + "learning_rate": 2.7821754703926673e-05, + "loss": 1.4758, + "step": 30616 + }, + { + "epoch": 2.41, + "learning_rate": 2.781458483726616e-05, + "loss": 1.4511, + "step": 30617 + }, + { + "epoch": 2.41, + "learning_rate": 2.780741580017717e-05, + "loss": 1.4079, + "step": 30618 + }, + { + "epoch": 2.41, + "learning_rate": 2.7800247592708385e-05, + "loss": 1.4519, + "step": 30619 + }, + { + "epoch": 2.41, + "learning_rate": 2.779308021490847e-05, + "loss": 1.4423, + "step": 30620 + }, + { + "epoch": 2.41, + "learning_rate": 2.7785913666826115e-05, + "loss": 1.4128, + "step": 30621 + }, + { + "epoch": 2.41, + "learning_rate": 2.7778747948509982e-05, + "loss": 1.4786, + "step": 30622 + }, + { + "epoch": 2.41, + "learning_rate": 2.777158306000865e-05, + "loss": 1.4536, + "step": 30623 + }, + { + "epoch": 2.41, + "learning_rate": 2.776441900137083e-05, + "loss": 1.4303, + "step": 30624 + }, + { + "epoch": 2.41, + "learning_rate": 2.7757255772645182e-05, + "loss": 1.4206, + "step": 30625 + }, + { + "epoch": 2.41, + "learning_rate": 2.7750093373880317e-05, + "loss": 1.4224, + "step": 30626 + }, + { + "epoch": 2.41, + "learning_rate": 2.7742931805124813e-05, + "loss": 1.4942, + "step": 30627 + }, + { + "epoch": 2.41, + "learning_rate": 2.7735771066427363e-05, + "loss": 1.4145, + "step": 30628 + }, + { + "epoch": 2.41, + "learning_rate": 2.7728611157836568e-05, + "loss": 1.4412, + "step": 30629 + }, + { + "epoch": 2.41, + "learning_rate": 2.772145207940098e-05, + "loss": 1.5129, + "step": 30630 + }, + { + "epoch": 2.41, + "learning_rate": 2.7714293831169298e-05, + "loss": 1.3949, + "step": 30631 + }, + { + "epoch": 2.41, + "learning_rate": 2.7707136413190084e-05, + "loss": 1.4725, + "step": 30632 + }, + { + "epoch": 2.41, + "learning_rate": 2.769997982551188e-05, + "loss": 1.4354, + "step": 30633 + }, + { + "epoch": 2.41, + "learning_rate": 2.769282406818335e-05, + "loss": 1.452, + "step": 30634 + }, + { + "epoch": 2.41, + "learning_rate": 2.768566914125307e-05, + "loss": 1.4555, + "step": 30635 + }, + { + "epoch": 2.41, + "learning_rate": 2.7678515044769585e-05, + "loss": 1.4562, + "step": 30636 + }, + { + "epoch": 2.41, + "learning_rate": 2.7671361778781452e-05, + "loss": 1.4903, + "step": 30637 + }, + { + "epoch": 2.41, + "learning_rate": 2.766420934333729e-05, + "loss": 1.4553, + "step": 30638 + }, + { + "epoch": 2.41, + "learning_rate": 2.7657057738485623e-05, + "loss": 1.4527, + "step": 30639 + }, + { + "epoch": 2.41, + "learning_rate": 2.7649906964275027e-05, + "loss": 1.4616, + "step": 30640 + }, + { + "epoch": 2.41, + "learning_rate": 2.764275702075403e-05, + "loss": 1.3787, + "step": 30641 + }, + { + "epoch": 2.41, + "learning_rate": 2.7635607907971214e-05, + "loss": 1.4286, + "step": 30642 + }, + { + "epoch": 2.41, + "learning_rate": 2.76284596259751e-05, + "loss": 1.4329, + "step": 30643 + }, + { + "epoch": 2.41, + "learning_rate": 2.7621312174814175e-05, + "loss": 1.4719, + "step": 30644 + }, + { + "epoch": 2.41, + "learning_rate": 2.7614165554537043e-05, + "loss": 1.4157, + "step": 30645 + }, + { + "epoch": 2.41, + "learning_rate": 2.76070197651922e-05, + "loss": 1.4971, + "step": 30646 + }, + { + "epoch": 2.41, + "learning_rate": 2.759987480682811e-05, + "loss": 1.5094, + "step": 30647 + }, + { + "epoch": 2.41, + "learning_rate": 2.7592730679493347e-05, + "loss": 1.4515, + "step": 30648 + }, + { + "epoch": 2.41, + "learning_rate": 2.7585587383236408e-05, + "loss": 1.4472, + "step": 30649 + }, + { + "epoch": 2.41, + "learning_rate": 2.7578444918105734e-05, + "loss": 1.4427, + "step": 30650 + }, + { + "epoch": 2.41, + "learning_rate": 2.7571303284149894e-05, + "loss": 1.493, + "step": 30651 + }, + { + "epoch": 2.41, + "learning_rate": 2.7564162481417358e-05, + "loss": 1.4683, + "step": 30652 + }, + { + "epoch": 2.41, + "learning_rate": 2.7557022509956573e-05, + "loss": 1.4703, + "step": 30653 + }, + { + "epoch": 2.41, + "learning_rate": 2.7549883369816e-05, + "loss": 1.4148, + "step": 30654 + }, + { + "epoch": 2.41, + "learning_rate": 2.7542745061044153e-05, + "loss": 1.4219, + "step": 30655 + }, + { + "epoch": 2.41, + "learning_rate": 2.753560758368954e-05, + "loss": 1.4228, + "step": 30656 + }, + { + "epoch": 2.41, + "learning_rate": 2.7528470937800558e-05, + "loss": 1.4585, + "step": 30657 + }, + { + "epoch": 2.41, + "learning_rate": 2.7521335123425632e-05, + "loss": 1.4268, + "step": 30658 + }, + { + "epoch": 2.41, + "learning_rate": 2.751420014061329e-05, + "loss": 1.4456, + "step": 30659 + }, + { + "epoch": 2.41, + "learning_rate": 2.750706598941193e-05, + "loss": 1.4333, + "step": 30660 + }, + { + "epoch": 2.41, + "learning_rate": 2.749993266986996e-05, + "loss": 1.4381, + "step": 30661 + }, + { + "epoch": 2.41, + "learning_rate": 2.7492800182035897e-05, + "loss": 1.4324, + "step": 30662 + }, + { + "epoch": 2.41, + "learning_rate": 2.748566852595811e-05, + "loss": 1.5095, + "step": 30663 + }, + { + "epoch": 2.41, + "learning_rate": 2.7478537701684983e-05, + "loss": 1.4791, + "step": 30664 + }, + { + "epoch": 2.41, + "learning_rate": 2.747140770926501e-05, + "loss": 1.4368, + "step": 30665 + }, + { + "epoch": 2.41, + "learning_rate": 2.7464278548746548e-05, + "loss": 1.4717, + "step": 30666 + }, + { + "epoch": 2.41, + "learning_rate": 2.7457150220177997e-05, + "loss": 1.444, + "step": 30667 + }, + { + "epoch": 2.41, + "learning_rate": 2.7450022723607802e-05, + "loss": 1.4254, + "step": 30668 + }, + { + "epoch": 2.41, + "learning_rate": 2.744289605908432e-05, + "loss": 1.3697, + "step": 30669 + }, + { + "epoch": 2.41, + "learning_rate": 2.7435770226655914e-05, + "loss": 1.4249, + "step": 30670 + }, + { + "epoch": 2.41, + "learning_rate": 2.7428645226370978e-05, + "loss": 1.4551, + "step": 30671 + }, + { + "epoch": 2.41, + "learning_rate": 2.742152105827794e-05, + "loss": 1.4554, + "step": 30672 + }, + { + "epoch": 2.41, + "learning_rate": 2.7414397722425146e-05, + "loss": 1.4583, + "step": 30673 + }, + { + "epoch": 2.41, + "learning_rate": 2.7407275218860892e-05, + "loss": 1.4061, + "step": 30674 + }, + { + "epoch": 2.41, + "learning_rate": 2.7400153547633618e-05, + "loss": 1.4783, + "step": 30675 + }, + { + "epoch": 2.41, + "learning_rate": 2.7393032708791655e-05, + "loss": 1.5087, + "step": 30676 + }, + { + "epoch": 2.41, + "learning_rate": 2.738591270238335e-05, + "loss": 1.4858, + "step": 30677 + }, + { + "epoch": 2.41, + "learning_rate": 2.7378793528456978e-05, + "loss": 1.4697, + "step": 30678 + }, + { + "epoch": 2.41, + "learning_rate": 2.737167518706098e-05, + "loss": 1.4209, + "step": 30679 + }, + { + "epoch": 2.41, + "learning_rate": 2.7364557678243626e-05, + "loss": 1.4523, + "step": 30680 + }, + { + "epoch": 2.41, + "learning_rate": 2.735744100205322e-05, + "loss": 1.4634, + "step": 30681 + }, + { + "epoch": 2.41, + "learning_rate": 2.7350325158538143e-05, + "loss": 1.4612, + "step": 30682 + }, + { + "epoch": 2.41, + "learning_rate": 2.7343210147746676e-05, + "loss": 1.444, + "step": 30683 + }, + { + "epoch": 2.41, + "learning_rate": 2.733609596972709e-05, + "loss": 1.4694, + "step": 30684 + }, + { + "epoch": 2.41, + "learning_rate": 2.7328982624527752e-05, + "loss": 1.4536, + "step": 30685 + }, + { + "epoch": 2.41, + "learning_rate": 2.7321870112196888e-05, + "loss": 1.4466, + "step": 30686 + }, + { + "epoch": 2.41, + "learning_rate": 2.7314758432782858e-05, + "loss": 1.4196, + "step": 30687 + }, + { + "epoch": 2.41, + "learning_rate": 2.7307647586333893e-05, + "loss": 1.4167, + "step": 30688 + }, + { + "epoch": 2.41, + "learning_rate": 2.730053757289832e-05, + "loss": 1.4294, + "step": 30689 + }, + { + "epoch": 2.41, + "learning_rate": 2.7293428392524397e-05, + "loss": 1.3839, + "step": 30690 + }, + { + "epoch": 2.41, + "learning_rate": 2.728632004526034e-05, + "loss": 1.4387, + "step": 30691 + }, + { + "epoch": 2.41, + "learning_rate": 2.7279212531154477e-05, + "loss": 1.4378, + "step": 30692 + }, + { + "epoch": 2.41, + "learning_rate": 2.727210585025505e-05, + "loss": 1.4461, + "step": 30693 + }, + { + "epoch": 2.42, + "learning_rate": 2.726500000261029e-05, + "loss": 1.4184, + "step": 30694 + }, + { + "epoch": 2.42, + "learning_rate": 2.725789498826842e-05, + "loss": 1.4787, + "step": 30695 + }, + { + "epoch": 2.42, + "learning_rate": 2.725079080727774e-05, + "loss": 1.4232, + "step": 30696 + }, + { + "epoch": 2.42, + "learning_rate": 2.7243687459686443e-05, + "loss": 1.5164, + "step": 30697 + }, + { + "epoch": 2.42, + "learning_rate": 2.723658494554274e-05, + "loss": 1.44, + "step": 30698 + }, + { + "epoch": 2.42, + "learning_rate": 2.7229483264894925e-05, + "loss": 1.4051, + "step": 30699 + }, + { + "epoch": 2.42, + "learning_rate": 2.7222382417791144e-05, + "loss": 1.4184, + "step": 30700 + }, + { + "epoch": 2.42, + "learning_rate": 2.7215282404279608e-05, + "loss": 1.4459, + "step": 30701 + }, + { + "epoch": 2.42, + "learning_rate": 2.7208183224408547e-05, + "loss": 1.4633, + "step": 30702 + }, + { + "epoch": 2.42, + "learning_rate": 2.7201084878226205e-05, + "loss": 1.4461, + "step": 30703 + }, + { + "epoch": 2.42, + "learning_rate": 2.7193987365780724e-05, + "loss": 1.4521, + "step": 30704 + }, + { + "epoch": 2.42, + "learning_rate": 2.718689068712025e-05, + "loss": 1.4431, + "step": 30705 + }, + { + "epoch": 2.42, + "learning_rate": 2.7179794842293063e-05, + "loss": 1.442, + "step": 30706 + }, + { + "epoch": 2.42, + "learning_rate": 2.717269983134729e-05, + "loss": 1.4022, + "step": 30707 + }, + { + "epoch": 2.42, + "learning_rate": 2.7165605654331058e-05, + "loss": 1.4569, + "step": 30708 + }, + { + "epoch": 2.42, + "learning_rate": 2.7158512311292628e-05, + "loss": 1.4566, + "step": 30709 + }, + { + "epoch": 2.42, + "learning_rate": 2.71514198022801e-05, + "loss": 1.4654, + "step": 30710 + }, + { + "epoch": 2.42, + "learning_rate": 2.7144328127341646e-05, + "loss": 1.4136, + "step": 30711 + }, + { + "epoch": 2.42, + "learning_rate": 2.7137237286525364e-05, + "loss": 1.4298, + "step": 30712 + }, + { + "epoch": 2.42, + "learning_rate": 2.7130147279879484e-05, + "loss": 1.4663, + "step": 30713 + }, + { + "epoch": 2.42, + "learning_rate": 2.7123058107452096e-05, + "loss": 1.4805, + "step": 30714 + }, + { + "epoch": 2.42, + "learning_rate": 2.7115969769291295e-05, + "loss": 1.4583, + "step": 30715 + }, + { + "epoch": 2.42, + "learning_rate": 2.710888226544528e-05, + "loss": 1.4694, + "step": 30716 + }, + { + "epoch": 2.42, + "learning_rate": 2.7101795595962094e-05, + "loss": 1.4479, + "step": 30717 + }, + { + "epoch": 2.42, + "learning_rate": 2.709470976088995e-05, + "loss": 1.4355, + "step": 30718 + }, + { + "epoch": 2.42, + "learning_rate": 2.7087624760276855e-05, + "loss": 1.4412, + "step": 30719 + }, + { + "epoch": 2.42, + "learning_rate": 2.7080540594170992e-05, + "loss": 1.4567, + "step": 30720 + }, + { + "epoch": 2.42, + "learning_rate": 2.7073457262620434e-05, + "loss": 1.4526, + "step": 30721 + }, + { + "epoch": 2.42, + "learning_rate": 2.706637476567323e-05, + "loss": 1.4386, + "step": 30722 + }, + { + "epoch": 2.42, + "learning_rate": 2.7059293103377526e-05, + "loss": 1.4826, + "step": 30723 + }, + { + "epoch": 2.42, + "learning_rate": 2.70522122757814e-05, + "loss": 1.443, + "step": 30724 + }, + { + "epoch": 2.42, + "learning_rate": 2.704513228293284e-05, + "loss": 1.4358, + "step": 30725 + }, + { + "epoch": 2.42, + "learning_rate": 2.7038053124880032e-05, + "loss": 1.4655, + "step": 30726 + }, + { + "epoch": 2.42, + "learning_rate": 2.7030974801670984e-05, + "loss": 1.4721, + "step": 30727 + }, + { + "epoch": 2.42, + "learning_rate": 2.7023897313353726e-05, + "loss": 1.4936, + "step": 30728 + }, + { + "epoch": 2.42, + "learning_rate": 2.701682065997637e-05, + "loss": 1.4362, + "step": 30729 + }, + { + "epoch": 2.42, + "learning_rate": 2.700974484158694e-05, + "loss": 1.4714, + "step": 30730 + }, + { + "epoch": 2.42, + "learning_rate": 2.7002669858233467e-05, + "loss": 1.4107, + "step": 30731 + }, + { + "epoch": 2.42, + "learning_rate": 2.6995595709963947e-05, + "loss": 1.4395, + "step": 30732 + }, + { + "epoch": 2.42, + "learning_rate": 2.6988522396826456e-05, + "loss": 1.4494, + "step": 30733 + }, + { + "epoch": 2.42, + "learning_rate": 2.698144991886906e-05, + "loss": 1.4905, + "step": 30734 + }, + { + "epoch": 2.42, + "learning_rate": 2.697437827613973e-05, + "loss": 1.453, + "step": 30735 + }, + { + "epoch": 2.42, + "learning_rate": 2.6967307468686434e-05, + "loss": 1.4689, + "step": 30736 + }, + { + "epoch": 2.42, + "learning_rate": 2.6960237496557264e-05, + "loss": 1.4519, + "step": 30737 + }, + { + "epoch": 2.42, + "learning_rate": 2.69531683598002e-05, + "loss": 1.4325, + "step": 30738 + }, + { + "epoch": 2.42, + "learning_rate": 2.6946100058463165e-05, + "loss": 1.4615, + "step": 30739 + }, + { + "epoch": 2.42, + "learning_rate": 2.6939032592594247e-05, + "loss": 1.4476, + "step": 30740 + }, + { + "epoch": 2.42, + "learning_rate": 2.693196596224138e-05, + "loss": 1.4581, + "step": 30741 + }, + { + "epoch": 2.42, + "learning_rate": 2.692490016745252e-05, + "loss": 1.4335, + "step": 30742 + }, + { + "epoch": 2.42, + "learning_rate": 2.6917835208275702e-05, + "loss": 1.4311, + "step": 30743 + }, + { + "epoch": 2.42, + "learning_rate": 2.6910771084758874e-05, + "loss": 1.4143, + "step": 30744 + }, + { + "epoch": 2.42, + "learning_rate": 2.6903707796949936e-05, + "loss": 1.4478, + "step": 30745 + }, + { + "epoch": 2.42, + "learning_rate": 2.6896645344896928e-05, + "loss": 1.4436, + "step": 30746 + }, + { + "epoch": 2.42, + "learning_rate": 2.688958372864776e-05, + "loss": 1.4843, + "step": 30747 + }, + { + "epoch": 2.42, + "learning_rate": 2.6882522948250385e-05, + "loss": 1.412, + "step": 30748 + }, + { + "epoch": 2.42, + "learning_rate": 2.6875463003752657e-05, + "loss": 1.4528, + "step": 30749 + }, + { + "epoch": 2.42, + "learning_rate": 2.6868403895202674e-05, + "loss": 1.4068, + "step": 30750 + }, + { + "epoch": 2.42, + "learning_rate": 2.6861345622648278e-05, + "loss": 1.479, + "step": 30751 + }, + { + "epoch": 2.42, + "learning_rate": 2.6854288186137386e-05, + "loss": 1.4555, + "step": 30752 + }, + { + "epoch": 2.42, + "learning_rate": 2.6847231585717887e-05, + "loss": 1.4795, + "step": 30753 + }, + { + "epoch": 2.42, + "learning_rate": 2.6840175821437766e-05, + "loss": 1.4581, + "step": 30754 + }, + { + "epoch": 2.42, + "learning_rate": 2.6833120893344877e-05, + "loss": 1.5232, + "step": 30755 + }, + { + "epoch": 2.42, + "learning_rate": 2.682606680148709e-05, + "loss": 1.4888, + "step": 30756 + }, + { + "epoch": 2.42, + "learning_rate": 2.6819013545912376e-05, + "loss": 1.4544, + "step": 30757 + }, + { + "epoch": 2.42, + "learning_rate": 2.6811961126668587e-05, + "loss": 1.4646, + "step": 30758 + }, + { + "epoch": 2.42, + "learning_rate": 2.680490954380356e-05, + "loss": 1.4566, + "step": 30759 + }, + { + "epoch": 2.42, + "learning_rate": 2.679785879736526e-05, + "loss": 1.5003, + "step": 30760 + }, + { + "epoch": 2.42, + "learning_rate": 2.6790808887401504e-05, + "loss": 1.4743, + "step": 30761 + }, + { + "epoch": 2.42, + "learning_rate": 2.6783759813960116e-05, + "loss": 1.4313, + "step": 30762 + }, + { + "epoch": 2.42, + "learning_rate": 2.6776711577089053e-05, + "loss": 1.4617, + "step": 30763 + }, + { + "epoch": 2.42, + "learning_rate": 2.6769664176836102e-05, + "loss": 1.4712, + "step": 30764 + }, + { + "epoch": 2.42, + "learning_rate": 2.6762617613249103e-05, + "loss": 1.4503, + "step": 30765 + }, + { + "epoch": 2.42, + "learning_rate": 2.675557188637592e-05, + "loss": 1.4549, + "step": 30766 + }, + { + "epoch": 2.42, + "learning_rate": 2.674852699626443e-05, + "loss": 1.4734, + "step": 30767 + }, + { + "epoch": 2.42, + "learning_rate": 2.674148294296243e-05, + "loss": 1.4585, + "step": 30768 + }, + { + "epoch": 2.42, + "learning_rate": 2.6734439726517743e-05, + "loss": 1.4416, + "step": 30769 + }, + { + "epoch": 2.42, + "learning_rate": 2.6727397346978135e-05, + "loss": 1.4484, + "step": 30770 + }, + { + "epoch": 2.42, + "learning_rate": 2.672035580439152e-05, + "loss": 1.39, + "step": 30771 + }, + { + "epoch": 2.42, + "learning_rate": 2.6713315098805653e-05, + "loss": 1.4283, + "step": 30772 + }, + { + "epoch": 2.42, + "learning_rate": 2.6706275230268302e-05, + "loss": 1.4667, + "step": 30773 + }, + { + "epoch": 2.42, + "learning_rate": 2.6699236198827346e-05, + "loss": 1.4877, + "step": 30774 + }, + { + "epoch": 2.42, + "learning_rate": 2.6692198004530525e-05, + "loss": 1.4758, + "step": 30775 + }, + { + "epoch": 2.42, + "learning_rate": 2.6685160647425602e-05, + "loss": 1.4785, + "step": 30776 + }, + { + "epoch": 2.42, + "learning_rate": 2.6678124127560424e-05, + "loss": 1.4711, + "step": 30777 + }, + { + "epoch": 2.42, + "learning_rate": 2.6671088444982735e-05, + "loss": 1.4768, + "step": 30778 + }, + { + "epoch": 2.42, + "learning_rate": 2.6664053599740248e-05, + "loss": 1.4744, + "step": 30779 + }, + { + "epoch": 2.42, + "learning_rate": 2.665701959188079e-05, + "loss": 1.4761, + "step": 30780 + }, + { + "epoch": 2.42, + "learning_rate": 2.6649986421452125e-05, + "loss": 1.3917, + "step": 30781 + }, + { + "epoch": 2.42, + "learning_rate": 2.6642954088501976e-05, + "loss": 1.4682, + "step": 30782 + }, + { + "epoch": 2.42, + "learning_rate": 2.663592259307808e-05, + "loss": 1.3911, + "step": 30783 + }, + { + "epoch": 2.42, + "learning_rate": 2.6628891935228207e-05, + "loss": 1.465, + "step": 30784 + }, + { + "epoch": 2.42, + "learning_rate": 2.662186211500009e-05, + "loss": 1.3407, + "step": 30785 + }, + { + "epoch": 2.42, + "learning_rate": 2.661483313244141e-05, + "loss": 1.4565, + "step": 30786 + }, + { + "epoch": 2.42, + "learning_rate": 2.6607804987599956e-05, + "loss": 1.4586, + "step": 30787 + }, + { + "epoch": 2.42, + "learning_rate": 2.6600777680523412e-05, + "loss": 1.4875, + "step": 30788 + }, + { + "epoch": 2.42, + "learning_rate": 2.6593751211259486e-05, + "loss": 1.4156, + "step": 30789 + }, + { + "epoch": 2.42, + "learning_rate": 2.6586725579855837e-05, + "loss": 1.4565, + "step": 30790 + }, + { + "epoch": 2.42, + "learning_rate": 2.657970078636027e-05, + "loss": 1.4205, + "step": 30791 + }, + { + "epoch": 2.42, + "learning_rate": 2.657267683082044e-05, + "loss": 1.449, + "step": 30792 + }, + { + "epoch": 2.42, + "learning_rate": 2.6565653713283958e-05, + "loss": 1.4684, + "step": 30793 + }, + { + "epoch": 2.42, + "learning_rate": 2.6558631433798622e-05, + "loss": 1.3862, + "step": 30794 + }, + { + "epoch": 2.42, + "learning_rate": 2.655160999241206e-05, + "loss": 1.4389, + "step": 30795 + }, + { + "epoch": 2.42, + "learning_rate": 2.65445893891719e-05, + "loss": 1.4373, + "step": 30796 + }, + { + "epoch": 2.42, + "learning_rate": 2.6537569624125836e-05, + "loss": 1.4996, + "step": 30797 + }, + { + "epoch": 2.42, + "learning_rate": 2.65305506973216e-05, + "loss": 1.4785, + "step": 30798 + }, + { + "epoch": 2.42, + "learning_rate": 2.6523532608806786e-05, + "loss": 1.4422, + "step": 30799 + }, + { + "epoch": 2.42, + "learning_rate": 2.6516515358629003e-05, + "loss": 1.4197, + "step": 30800 + }, + { + "epoch": 2.42, + "learning_rate": 2.6509498946835965e-05, + "loss": 1.3727, + "step": 30801 + }, + { + "epoch": 2.42, + "learning_rate": 2.65024833734753e-05, + "loss": 1.4207, + "step": 30802 + }, + { + "epoch": 2.42, + "learning_rate": 2.6495468638594575e-05, + "loss": 1.4327, + "step": 30803 + }, + { + "epoch": 2.42, + "learning_rate": 2.6488454742241493e-05, + "loss": 1.4127, + "step": 30804 + }, + { + "epoch": 2.42, + "learning_rate": 2.6481441684463654e-05, + "loss": 1.4123, + "step": 30805 + }, + { + "epoch": 2.42, + "learning_rate": 2.6474429465308657e-05, + "loss": 1.4364, + "step": 30806 + }, + { + "epoch": 2.42, + "learning_rate": 2.6467418084824088e-05, + "loss": 1.4618, + "step": 30807 + }, + { + "epoch": 2.42, + "learning_rate": 2.6460407543057614e-05, + "loss": 1.4309, + "step": 30808 + }, + { + "epoch": 2.42, + "learning_rate": 2.64533978400568e-05, + "loss": 1.4198, + "step": 30809 + }, + { + "epoch": 2.42, + "learning_rate": 2.6446388975869188e-05, + "loss": 1.4351, + "step": 30810 + }, + { + "epoch": 2.42, + "learning_rate": 2.6439380950542455e-05, + "loss": 1.4382, + "step": 30811 + }, + { + "epoch": 2.42, + "learning_rate": 2.64323737641241e-05, + "loss": 1.4412, + "step": 30812 + }, + { + "epoch": 2.42, + "learning_rate": 2.642536741666178e-05, + "loss": 1.4481, + "step": 30813 + }, + { + "epoch": 2.42, + "learning_rate": 2.6418361908202978e-05, + "loss": 1.4361, + "step": 30814 + }, + { + "epoch": 2.42, + "learning_rate": 2.641135723879534e-05, + "loss": 1.4628, + "step": 30815 + }, + { + "epoch": 2.42, + "learning_rate": 2.6404353408486388e-05, + "loss": 1.4628, + "step": 30816 + }, + { + "epoch": 2.42, + "learning_rate": 2.6397350417323625e-05, + "loss": 1.4278, + "step": 30817 + }, + { + "epoch": 2.42, + "learning_rate": 2.639034826535468e-05, + "loss": 1.4644, + "step": 30818 + }, + { + "epoch": 2.42, + "learning_rate": 2.638334695262707e-05, + "loss": 1.4848, + "step": 30819 + }, + { + "epoch": 2.42, + "learning_rate": 2.637634647918827e-05, + "loss": 1.4917, + "step": 30820 + }, + { + "epoch": 2.43, + "learning_rate": 2.6369346845085887e-05, + "loss": 1.4211, + "step": 30821 + }, + { + "epoch": 2.43, + "learning_rate": 2.6362348050367433e-05, + "loss": 1.4245, + "step": 30822 + }, + { + "epoch": 2.43, + "learning_rate": 2.6355350095080385e-05, + "loss": 1.433, + "step": 30823 + }, + { + "epoch": 2.43, + "learning_rate": 2.6348352979272258e-05, + "loss": 1.4539, + "step": 30824 + }, + { + "epoch": 2.43, + "learning_rate": 2.634135670299061e-05, + "loss": 1.4815, + "step": 30825 + }, + { + "epoch": 2.43, + "learning_rate": 2.633436126628291e-05, + "loss": 1.44, + "step": 30826 + }, + { + "epoch": 2.43, + "learning_rate": 2.6327366669196566e-05, + "loss": 1.4812, + "step": 30827 + }, + { + "epoch": 2.43, + "learning_rate": 2.6320372911779237e-05, + "loss": 1.4393, + "step": 30828 + }, + { + "epoch": 2.43, + "learning_rate": 2.6313379994078338e-05, + "loss": 1.4674, + "step": 30829 + }, + { + "epoch": 2.43, + "learning_rate": 2.6306387916141312e-05, + "loss": 1.4176, + "step": 30830 + }, + { + "epoch": 2.43, + "learning_rate": 2.6299396678015627e-05, + "loss": 1.452, + "step": 30831 + }, + { + "epoch": 2.43, + "learning_rate": 2.6292406279748808e-05, + "loss": 1.459, + "step": 30832 + }, + { + "epoch": 2.43, + "learning_rate": 2.628541672138828e-05, + "loss": 1.4337, + "step": 30833 + }, + { + "epoch": 2.43, + "learning_rate": 2.627842800298146e-05, + "loss": 1.4367, + "step": 30834 + }, + { + "epoch": 2.43, + "learning_rate": 2.6271440124575893e-05, + "loss": 1.4754, + "step": 30835 + }, + { + "epoch": 2.43, + "learning_rate": 2.6264453086218956e-05, + "loss": 1.4073, + "step": 30836 + }, + { + "epoch": 2.43, + "learning_rate": 2.6257466887958063e-05, + "loss": 1.43, + "step": 30837 + }, + { + "epoch": 2.43, + "learning_rate": 2.625048152984072e-05, + "loss": 1.434, + "step": 30838 + }, + { + "epoch": 2.43, + "learning_rate": 2.6243497011914317e-05, + "loss": 1.4319, + "step": 30839 + }, + { + "epoch": 2.43, + "learning_rate": 2.623651333422624e-05, + "loss": 1.4383, + "step": 30840 + }, + { + "epoch": 2.43, + "learning_rate": 2.622953049682397e-05, + "loss": 1.4613, + "step": 30841 + }, + { + "epoch": 2.43, + "learning_rate": 2.6222548499754904e-05, + "loss": 1.4486, + "step": 30842 + }, + { + "epoch": 2.43, + "learning_rate": 2.621556734306637e-05, + "loss": 1.4405, + "step": 30843 + }, + { + "epoch": 2.43, + "learning_rate": 2.6208587026805828e-05, + "loss": 1.5096, + "step": 30844 + }, + { + "epoch": 2.43, + "learning_rate": 2.6201607551020708e-05, + "loss": 1.4097, + "step": 30845 + }, + { + "epoch": 2.43, + "learning_rate": 2.619462891575836e-05, + "loss": 1.4683, + "step": 30846 + }, + { + "epoch": 2.43, + "learning_rate": 2.6187651121066154e-05, + "loss": 1.4101, + "step": 30847 + }, + { + "epoch": 2.43, + "learning_rate": 2.6180674166991428e-05, + "loss": 1.4715, + "step": 30848 + }, + { + "epoch": 2.43, + "learning_rate": 2.6173698053581638e-05, + "loss": 1.413, + "step": 30849 + }, + { + "epoch": 2.43, + "learning_rate": 2.6166722780884114e-05, + "loss": 1.4706, + "step": 30850 + }, + { + "epoch": 2.43, + "learning_rate": 2.6159748348946154e-05, + "loss": 1.4816, + "step": 30851 + }, + { + "epoch": 2.43, + "learning_rate": 2.6152774757815215e-05, + "loss": 1.4639, + "step": 30852 + }, + { + "epoch": 2.43, + "learning_rate": 2.614580200753858e-05, + "loss": 1.482, + "step": 30853 + }, + { + "epoch": 2.43, + "learning_rate": 2.613883009816356e-05, + "loss": 1.4868, + "step": 30854 + }, + { + "epoch": 2.43, + "learning_rate": 2.6131859029737566e-05, + "loss": 1.4247, + "step": 30855 + }, + { + "epoch": 2.43, + "learning_rate": 2.6124888802307915e-05, + "loss": 1.4353, + "step": 30856 + }, + { + "epoch": 2.43, + "learning_rate": 2.6117919415921846e-05, + "loss": 1.4219, + "step": 30857 + }, + { + "epoch": 2.43, + "learning_rate": 2.611095087062679e-05, + "loss": 1.4067, + "step": 30858 + }, + { + "epoch": 2.43, + "learning_rate": 2.6103983166469977e-05, + "loss": 1.4386, + "step": 30859 + }, + { + "epoch": 2.43, + "learning_rate": 2.6097016303498784e-05, + "loss": 1.4815, + "step": 30860 + }, + { + "epoch": 2.43, + "learning_rate": 2.6090050281760427e-05, + "loss": 1.4754, + "step": 30861 + }, + { + "epoch": 2.43, + "learning_rate": 2.6083085101302298e-05, + "loss": 1.4668, + "step": 30862 + }, + { + "epoch": 2.43, + "learning_rate": 2.6076120762171627e-05, + "loss": 1.4579, + "step": 30863 + }, + { + "epoch": 2.43, + "learning_rate": 2.6069157264415724e-05, + "loss": 1.4457, + "step": 30864 + }, + { + "epoch": 2.43, + "learning_rate": 2.6062194608081805e-05, + "loss": 1.49, + "step": 30865 + }, + { + "epoch": 2.43, + "learning_rate": 2.605523279321723e-05, + "loss": 1.4372, + "step": 30866 + }, + { + "epoch": 2.43, + "learning_rate": 2.6048271819869227e-05, + "loss": 1.4756, + "step": 30867 + }, + { + "epoch": 2.43, + "learning_rate": 2.604131168808501e-05, + "loss": 1.4803, + "step": 30868 + }, + { + "epoch": 2.43, + "learning_rate": 2.6034352397911923e-05, + "loss": 1.4304, + "step": 30869 + }, + { + "epoch": 2.43, + "learning_rate": 2.602739394939718e-05, + "loss": 1.4427, + "step": 30870 + }, + { + "epoch": 2.43, + "learning_rate": 2.6020436342587975e-05, + "loss": 1.4236, + "step": 30871 + }, + { + "epoch": 2.43, + "learning_rate": 2.601347957753162e-05, + "loss": 1.4352, + "step": 30872 + }, + { + "epoch": 2.43, + "learning_rate": 2.600652365427533e-05, + "loss": 1.4088, + "step": 30873 + }, + { + "epoch": 2.43, + "learning_rate": 2.5999568572866282e-05, + "loss": 1.4448, + "step": 30874 + }, + { + "epoch": 2.43, + "learning_rate": 2.5992614333351718e-05, + "loss": 1.4595, + "step": 30875 + }, + { + "epoch": 2.43, + "learning_rate": 2.5985660935778925e-05, + "loss": 1.4548, + "step": 30876 + }, + { + "epoch": 2.43, + "learning_rate": 2.597870838019504e-05, + "loss": 1.4454, + "step": 30877 + }, + { + "epoch": 2.43, + "learning_rate": 2.5971756666647263e-05, + "loss": 1.4429, + "step": 30878 + }, + { + "epoch": 2.43, + "learning_rate": 2.596480579518284e-05, + "loss": 1.4544, + "step": 30879 + }, + { + "epoch": 2.43, + "learning_rate": 2.595785576584895e-05, + "loss": 1.4191, + "step": 30880 + }, + { + "epoch": 2.43, + "learning_rate": 2.5950906578692753e-05, + "loss": 1.4506, + "step": 30881 + }, + { + "epoch": 2.43, + "learning_rate": 2.5943958233761415e-05, + "loss": 1.4743, + "step": 30882 + }, + { + "epoch": 2.43, + "learning_rate": 2.5937010731102177e-05, + "loss": 1.4595, + "step": 30883 + }, + { + "epoch": 2.43, + "learning_rate": 2.5930064070762185e-05, + "loss": 1.4246, + "step": 30884 + }, + { + "epoch": 2.43, + "learning_rate": 2.5923118252788538e-05, + "loss": 1.4545, + "step": 30885 + }, + { + "epoch": 2.43, + "learning_rate": 2.591617327722848e-05, + "loss": 1.4829, + "step": 30886 + }, + { + "epoch": 2.43, + "learning_rate": 2.590922914412914e-05, + "loss": 1.4258, + "step": 30887 + }, + { + "epoch": 2.43, + "learning_rate": 2.5902285853537615e-05, + "loss": 1.3898, + "step": 30888 + }, + { + "epoch": 2.43, + "learning_rate": 2.589534340550113e-05, + "loss": 1.4437, + "step": 30889 + }, + { + "epoch": 2.43, + "learning_rate": 2.5888401800066733e-05, + "loss": 1.4751, + "step": 30890 + }, + { + "epoch": 2.43, + "learning_rate": 2.5881461037281636e-05, + "loss": 1.5045, + "step": 30891 + }, + { + "epoch": 2.43, + "learning_rate": 2.5874521117192885e-05, + "loss": 1.4538, + "step": 30892 + }, + { + "epoch": 2.43, + "learning_rate": 2.586758203984768e-05, + "loss": 1.4576, + "step": 30893 + }, + { + "epoch": 2.43, + "learning_rate": 2.5860643805293073e-05, + "loss": 1.4926, + "step": 30894 + }, + { + "epoch": 2.43, + "learning_rate": 2.585370641357617e-05, + "loss": 1.4118, + "step": 30895 + }, + { + "epoch": 2.43, + "learning_rate": 2.5846769864744128e-05, + "loss": 1.4378, + "step": 30896 + }, + { + "epoch": 2.43, + "learning_rate": 2.583983415884401e-05, + "loss": 1.4555, + "step": 30897 + }, + { + "epoch": 2.43, + "learning_rate": 2.5832899295922844e-05, + "loss": 1.4351, + "step": 30898 + }, + { + "epoch": 2.43, + "learning_rate": 2.5825965276027828e-05, + "loss": 1.4262, + "step": 30899 + }, + { + "epoch": 2.43, + "learning_rate": 2.581903209920597e-05, + "loss": 1.482, + "step": 30900 + }, + { + "epoch": 2.43, + "learning_rate": 2.5812099765504356e-05, + "loss": 1.5204, + "step": 30901 + }, + { + "epoch": 2.43, + "learning_rate": 2.5805168274970013e-05, + "loss": 1.4415, + "step": 30902 + }, + { + "epoch": 2.43, + "learning_rate": 2.579823762765008e-05, + "loss": 1.4751, + "step": 30903 + }, + { + "epoch": 2.43, + "learning_rate": 2.579130782359158e-05, + "loss": 1.4701, + "step": 30904 + }, + { + "epoch": 2.43, + "learning_rate": 2.5784378862841516e-05, + "loss": 1.4334, + "step": 30905 + }, + { + "epoch": 2.43, + "learning_rate": 2.577745074544697e-05, + "loss": 1.4705, + "step": 30906 + }, + { + "epoch": 2.43, + "learning_rate": 2.5770523471455025e-05, + "loss": 1.461, + "step": 30907 + }, + { + "epoch": 2.43, + "learning_rate": 2.5763597040912654e-05, + "loss": 1.4641, + "step": 30908 + }, + { + "epoch": 2.43, + "learning_rate": 2.575667145386687e-05, + "loss": 1.4868, + "step": 30909 + }, + { + "epoch": 2.43, + "learning_rate": 2.574974671036478e-05, + "loss": 1.4182, + "step": 30910 + }, + { + "epoch": 2.43, + "learning_rate": 2.574282281045331e-05, + "loss": 1.4752, + "step": 30911 + }, + { + "epoch": 2.43, + "learning_rate": 2.573589975417949e-05, + "loss": 1.4199, + "step": 30912 + }, + { + "epoch": 2.43, + "learning_rate": 2.5728977541590357e-05, + "loss": 1.4746, + "step": 30913 + }, + { + "epoch": 2.43, + "learning_rate": 2.5722056172732907e-05, + "loss": 1.4059, + "step": 30914 + }, + { + "epoch": 2.43, + "learning_rate": 2.5715135647654056e-05, + "loss": 1.431, + "step": 30915 + }, + { + "epoch": 2.43, + "learning_rate": 2.5708215966400896e-05, + "loss": 1.4213, + "step": 30916 + }, + { + "epoch": 2.43, + "learning_rate": 2.570129712902036e-05, + "loss": 1.5146, + "step": 30917 + }, + { + "epoch": 2.43, + "learning_rate": 2.5694379135559422e-05, + "loss": 1.4754, + "step": 30918 + }, + { + "epoch": 2.43, + "learning_rate": 2.5687461986065017e-05, + "loss": 1.4885, + "step": 30919 + }, + { + "epoch": 2.43, + "learning_rate": 2.568054568058417e-05, + "loss": 1.4443, + "step": 30920 + }, + { + "epoch": 2.43, + "learning_rate": 2.5673630219163825e-05, + "loss": 1.454, + "step": 30921 + }, + { + "epoch": 2.43, + "learning_rate": 2.5666715601850886e-05, + "loss": 1.4652, + "step": 30922 + }, + { + "epoch": 2.43, + "learning_rate": 2.5659801828692323e-05, + "loss": 1.4477, + "step": 30923 + }, + { + "epoch": 2.43, + "learning_rate": 2.5652888899735134e-05, + "loss": 1.4224, + "step": 30924 + }, + { + "epoch": 2.43, + "learning_rate": 2.5645976815026204e-05, + "loss": 1.4938, + "step": 30925 + }, + { + "epoch": 2.43, + "learning_rate": 2.5639065574612438e-05, + "loss": 1.4419, + "step": 30926 + }, + { + "epoch": 2.43, + "learning_rate": 2.563215517854082e-05, + "loss": 1.4303, + "step": 30927 + }, + { + "epoch": 2.43, + "learning_rate": 2.5625245626858242e-05, + "loss": 1.4482, + "step": 30928 + }, + { + "epoch": 2.43, + "learning_rate": 2.5618336919611572e-05, + "loss": 1.4815, + "step": 30929 + }, + { + "epoch": 2.43, + "learning_rate": 2.5611429056847782e-05, + "loss": 1.4437, + "step": 30930 + }, + { + "epoch": 2.43, + "learning_rate": 2.5604522038613757e-05, + "loss": 1.4765, + "step": 30931 + }, + { + "epoch": 2.43, + "learning_rate": 2.559761586495634e-05, + "loss": 1.4707, + "step": 30932 + }, + { + "epoch": 2.43, + "learning_rate": 2.5590710535922492e-05, + "loss": 1.4883, + "step": 30933 + }, + { + "epoch": 2.43, + "learning_rate": 2.5583806051559065e-05, + "loss": 1.44, + "step": 30934 + }, + { + "epoch": 2.43, + "learning_rate": 2.5576902411912947e-05, + "loss": 1.4357, + "step": 30935 + }, + { + "epoch": 2.43, + "learning_rate": 2.5569999617030957e-05, + "loss": 1.4241, + "step": 30936 + }, + { + "epoch": 2.43, + "learning_rate": 2.556309766696e-05, + "loss": 1.435, + "step": 30937 + }, + { + "epoch": 2.43, + "learning_rate": 2.5556196561746982e-05, + "loss": 1.4677, + "step": 30938 + }, + { + "epoch": 2.43, + "learning_rate": 2.5549296301438675e-05, + "loss": 1.5214, + "step": 30939 + }, + { + "epoch": 2.43, + "learning_rate": 2.5542396886081997e-05, + "loss": 1.498, + "step": 30940 + }, + { + "epoch": 2.43, + "learning_rate": 2.5535498315723783e-05, + "loss": 1.4667, + "step": 30941 + }, + { + "epoch": 2.43, + "learning_rate": 2.5528600590410843e-05, + "loss": 1.4427, + "step": 30942 + }, + { + "epoch": 2.43, + "learning_rate": 2.552170371018996e-05, + "loss": 1.4534, + "step": 30943 + }, + { + "epoch": 2.43, + "learning_rate": 2.5514807675108072e-05, + "loss": 1.4458, + "step": 30944 + }, + { + "epoch": 2.43, + "learning_rate": 2.550791248521194e-05, + "loss": 1.3844, + "step": 30945 + }, + { + "epoch": 2.43, + "learning_rate": 2.550101814054834e-05, + "loss": 1.4548, + "step": 30946 + }, + { + "epoch": 2.43, + "learning_rate": 2.549412464116417e-05, + "loss": 1.4655, + "step": 30947 + }, + { + "epoch": 2.44, + "learning_rate": 2.5487231987106176e-05, + "loss": 1.4249, + "step": 30948 + }, + { + "epoch": 2.44, + "learning_rate": 2.5480340178421138e-05, + "loss": 1.4169, + "step": 30949 + }, + { + "epoch": 2.44, + "learning_rate": 2.54734492151559e-05, + "loss": 1.384, + "step": 30950 + }, + { + "epoch": 2.44, + "learning_rate": 2.5466559097357224e-05, + "loss": 1.4382, + "step": 30951 + }, + { + "epoch": 2.44, + "learning_rate": 2.545966982507186e-05, + "loss": 1.4267, + "step": 30952 + }, + { + "epoch": 2.44, + "learning_rate": 2.54527813983466e-05, + "loss": 1.4671, + "step": 30953 + }, + { + "epoch": 2.44, + "learning_rate": 2.5445893817228274e-05, + "loss": 1.4529, + "step": 30954 + }, + { + "epoch": 2.44, + "learning_rate": 2.543900708176358e-05, + "loss": 1.3741, + "step": 30955 + }, + { + "epoch": 2.44, + "learning_rate": 2.543212119199926e-05, + "loss": 1.4963, + "step": 30956 + }, + { + "epoch": 2.44, + "learning_rate": 2.542523614798213e-05, + "loss": 1.4821, + "step": 30957 + }, + { + "epoch": 2.44, + "learning_rate": 2.5418351949758904e-05, + "loss": 1.4846, + "step": 30958 + }, + { + "epoch": 2.44, + "learning_rate": 2.5411468597376323e-05, + "loss": 1.4329, + "step": 30959 + }, + { + "epoch": 2.44, + "learning_rate": 2.5404586090881068e-05, + "loss": 1.447, + "step": 30960 + }, + { + "epoch": 2.44, + "learning_rate": 2.5397704430319954e-05, + "loss": 1.4909, + "step": 30961 + }, + { + "epoch": 2.44, + "learning_rate": 2.5390823615739675e-05, + "loss": 1.4395, + "step": 30962 + }, + { + "epoch": 2.44, + "learning_rate": 2.5383943647186894e-05, + "loss": 1.4389, + "step": 30963 + }, + { + "epoch": 2.44, + "learning_rate": 2.5377064524708406e-05, + "loss": 1.4117, + "step": 30964 + }, + { + "epoch": 2.44, + "learning_rate": 2.5370186248350878e-05, + "loss": 1.4535, + "step": 30965 + }, + { + "epoch": 2.44, + "learning_rate": 2.5363308818160965e-05, + "loss": 1.4471, + "step": 30966 + }, + { + "epoch": 2.44, + "learning_rate": 2.5356432234185454e-05, + "loss": 1.4746, + "step": 30967 + }, + { + "epoch": 2.44, + "learning_rate": 2.534955649647097e-05, + "loss": 1.4278, + "step": 30968 + }, + { + "epoch": 2.44, + "learning_rate": 2.534268160506419e-05, + "loss": 1.4178, + "step": 30969 + }, + { + "epoch": 2.44, + "learning_rate": 2.53358075600118e-05, + "loss": 1.4324, + "step": 30970 + }, + { + "epoch": 2.44, + "learning_rate": 2.532893436136051e-05, + "loss": 1.4247, + "step": 30971 + }, + { + "epoch": 2.44, + "learning_rate": 2.5322062009156964e-05, + "loss": 1.4324, + "step": 30972 + }, + { + "epoch": 2.44, + "learning_rate": 2.5315190503447792e-05, + "loss": 1.3696, + "step": 30973 + }, + { + "epoch": 2.44, + "learning_rate": 2.530831984427969e-05, + "loss": 1.4624, + "step": 30974 + }, + { + "epoch": 2.44, + "learning_rate": 2.5301450031699288e-05, + "loss": 1.4522, + "step": 30975 + }, + { + "epoch": 2.44, + "learning_rate": 2.5294581065753218e-05, + "loss": 1.4471, + "step": 30976 + }, + { + "epoch": 2.44, + "learning_rate": 2.5287712946488105e-05, + "loss": 1.4429, + "step": 30977 + }, + { + "epoch": 2.44, + "learning_rate": 2.5280845673950628e-05, + "loss": 1.4567, + "step": 30978 + }, + { + "epoch": 2.44, + "learning_rate": 2.5273979248187387e-05, + "loss": 1.4604, + "step": 30979 + }, + { + "epoch": 2.44, + "learning_rate": 2.5267113669244943e-05, + "loss": 1.4744, + "step": 30980 + }, + { + "epoch": 2.44, + "learning_rate": 2.5260248937170023e-05, + "loss": 1.4235, + "step": 30981 + }, + { + "epoch": 2.44, + "learning_rate": 2.525338505200916e-05, + "loss": 1.4676, + "step": 30982 + }, + { + "epoch": 2.44, + "learning_rate": 2.524652201380895e-05, + "loss": 1.4656, + "step": 30983 + }, + { + "epoch": 2.44, + "learning_rate": 2.5239659822616036e-05, + "loss": 1.4951, + "step": 30984 + }, + { + "epoch": 2.44, + "learning_rate": 2.523279847847695e-05, + "loss": 1.4384, + "step": 30985 + }, + { + "epoch": 2.44, + "learning_rate": 2.522593798143834e-05, + "loss": 1.4574, + "step": 30986 + }, + { + "epoch": 2.44, + "learning_rate": 2.5219078331546728e-05, + "loss": 1.4261, + "step": 30987 + }, + { + "epoch": 2.44, + "learning_rate": 2.521221952884875e-05, + "loss": 1.4841, + "step": 30988 + }, + { + "epoch": 2.44, + "learning_rate": 2.520536157339093e-05, + "loss": 1.4591, + "step": 30989 + }, + { + "epoch": 2.44, + "learning_rate": 2.5198504465219806e-05, + "loss": 1.4249, + "step": 30990 + }, + { + "epoch": 2.44, + "learning_rate": 2.5191648204382e-05, + "loss": 1.4877, + "step": 30991 + }, + { + "epoch": 2.44, + "learning_rate": 2.518479279092404e-05, + "loss": 1.4322, + "step": 30992 + }, + { + "epoch": 2.44, + "learning_rate": 2.5177938224892413e-05, + "loss": 1.5093, + "step": 30993 + }, + { + "epoch": 2.44, + "learning_rate": 2.5171084506333727e-05, + "loss": 1.4259, + "step": 30994 + }, + { + "epoch": 2.44, + "learning_rate": 2.5164231635294514e-05, + "loss": 1.4517, + "step": 30995 + }, + { + "epoch": 2.44, + "learning_rate": 2.5157379611821266e-05, + "loss": 1.4154, + "step": 30996 + }, + { + "epoch": 2.44, + "learning_rate": 2.515052843596048e-05, + "loss": 1.4686, + "step": 30997 + }, + { + "epoch": 2.44, + "learning_rate": 2.514367810775874e-05, + "loss": 1.477, + "step": 30998 + }, + { + "epoch": 2.44, + "learning_rate": 2.513682862726254e-05, + "loss": 1.4516, + "step": 30999 + }, + { + "epoch": 2.44, + "learning_rate": 2.5129979994518308e-05, + "loss": 1.4581, + "step": 31000 + }, + { + "epoch": 2.44, + "learning_rate": 2.5123132209572622e-05, + "loss": 1.4445, + "step": 31001 + }, + { + "epoch": 2.44, + "learning_rate": 2.511628527247198e-05, + "loss": 1.4978, + "step": 31002 + }, + { + "epoch": 2.44, + "learning_rate": 2.5109439183262863e-05, + "loss": 1.4505, + "step": 31003 + }, + { + "epoch": 2.44, + "learning_rate": 2.5102593941991683e-05, + "loss": 1.463, + "step": 31004 + }, + { + "epoch": 2.44, + "learning_rate": 2.5095749548705e-05, + "loss": 1.4579, + "step": 31005 + }, + { + "epoch": 2.44, + "learning_rate": 2.508890600344925e-05, + "loss": 1.4673, + "step": 31006 + }, + { + "epoch": 2.44, + "learning_rate": 2.508206330627087e-05, + "loss": 1.3552, + "step": 31007 + }, + { + "epoch": 2.44, + "learning_rate": 2.507522145721638e-05, + "loss": 1.4734, + "step": 31008 + }, + { + "epoch": 2.44, + "learning_rate": 2.5068380456332194e-05, + "loss": 1.4252, + "step": 31009 + }, + { + "epoch": 2.44, + "learning_rate": 2.5061540303664717e-05, + "loss": 1.4531, + "step": 31010 + }, + { + "epoch": 2.44, + "learning_rate": 2.5054700999260485e-05, + "loss": 1.4635, + "step": 31011 + }, + { + "epoch": 2.44, + "learning_rate": 2.5047862543165875e-05, + "loss": 1.4349, + "step": 31012 + }, + { + "epoch": 2.44, + "learning_rate": 2.504102493542732e-05, + "loss": 1.4157, + "step": 31013 + }, + { + "epoch": 2.44, + "learning_rate": 2.5034188176091206e-05, + "loss": 1.4418, + "step": 31014 + }, + { + "epoch": 2.44, + "learning_rate": 2.5027352265204043e-05, + "loss": 1.4746, + "step": 31015 + }, + { + "epoch": 2.44, + "learning_rate": 2.502051720281215e-05, + "loss": 1.4889, + "step": 31016 + }, + { + "epoch": 2.44, + "learning_rate": 2.5013682988962013e-05, + "loss": 1.4645, + "step": 31017 + }, + { + "epoch": 2.44, + "learning_rate": 2.500684962369996e-05, + "loss": 1.4777, + "step": 31018 + }, + { + "epoch": 2.44, + "learning_rate": 2.5000017107072467e-05, + "loss": 1.4437, + "step": 31019 + }, + { + "epoch": 2.44, + "learning_rate": 2.4993185439125867e-05, + "loss": 1.4113, + "step": 31020 + }, + { + "epoch": 2.44, + "learning_rate": 2.4986354619906523e-05, + "loss": 1.4528, + "step": 31021 + }, + { + "epoch": 2.44, + "learning_rate": 2.4979524649460865e-05, + "loss": 1.4284, + "step": 31022 + }, + { + "epoch": 2.44, + "learning_rate": 2.497269552783525e-05, + "loss": 1.4583, + "step": 31023 + }, + { + "epoch": 2.44, + "learning_rate": 2.4965867255076e-05, + "loss": 1.4366, + "step": 31024 + }, + { + "epoch": 2.44, + "learning_rate": 2.4959039831229555e-05, + "loss": 1.4794, + "step": 31025 + }, + { + "epoch": 2.44, + "learning_rate": 2.495221325634223e-05, + "loss": 1.4681, + "step": 31026 + }, + { + "epoch": 2.44, + "learning_rate": 2.494538753046032e-05, + "loss": 1.4151, + "step": 31027 + }, + { + "epoch": 2.44, + "learning_rate": 2.4938562653630255e-05, + "loss": 1.4599, + "step": 31028 + }, + { + "epoch": 2.44, + "learning_rate": 2.4931738625898335e-05, + "loss": 1.464, + "step": 31029 + }, + { + "epoch": 2.44, + "learning_rate": 2.49249154473109e-05, + "loss": 1.4293, + "step": 31030 + }, + { + "epoch": 2.44, + "learning_rate": 2.4918093117914236e-05, + "loss": 1.4848, + "step": 31031 + }, + { + "epoch": 2.44, + "learning_rate": 2.491127163775468e-05, + "loss": 1.4835, + "step": 31032 + }, + { + "epoch": 2.44, + "learning_rate": 2.490445100687859e-05, + "loss": 1.5074, + "step": 31033 + }, + { + "epoch": 2.44, + "learning_rate": 2.4897631225332253e-05, + "loss": 1.4676, + "step": 31034 + }, + { + "epoch": 2.44, + "learning_rate": 2.4890812293161937e-05, + "loss": 1.4467, + "step": 31035 + }, + { + "epoch": 2.44, + "learning_rate": 2.4883994210413987e-05, + "loss": 1.4401, + "step": 31036 + }, + { + "epoch": 2.44, + "learning_rate": 2.4877176977134684e-05, + "loss": 1.4341, + "step": 31037 + }, + { + "epoch": 2.44, + "learning_rate": 2.4870360593370255e-05, + "loss": 1.4895, + "step": 31038 + }, + { + "epoch": 2.44, + "learning_rate": 2.486354505916706e-05, + "loss": 1.4766, + "step": 31039 + }, + { + "epoch": 2.44, + "learning_rate": 2.4856730374571336e-05, + "loss": 1.4426, + "step": 31040 + }, + { + "epoch": 2.44, + "learning_rate": 2.4849916539629327e-05, + "loss": 1.4208, + "step": 31041 + }, + { + "epoch": 2.44, + "learning_rate": 2.4843103554387344e-05, + "loss": 1.4267, + "step": 31042 + }, + { + "epoch": 2.44, + "learning_rate": 2.4836291418891637e-05, + "loss": 1.5063, + "step": 31043 + }, + { + "epoch": 2.44, + "learning_rate": 2.4829480133188394e-05, + "loss": 1.4997, + "step": 31044 + }, + { + "epoch": 2.44, + "learning_rate": 2.4822669697323954e-05, + "loss": 1.461, + "step": 31045 + }, + { + "epoch": 2.44, + "learning_rate": 2.4815860111344495e-05, + "loss": 1.4677, + "step": 31046 + }, + { + "epoch": 2.44, + "learning_rate": 2.4809051375296225e-05, + "loss": 1.4515, + "step": 31047 + }, + { + "epoch": 2.44, + "learning_rate": 2.4802243489225426e-05, + "loss": 1.4607, + "step": 31048 + }, + { + "epoch": 2.44, + "learning_rate": 2.479543645317833e-05, + "loss": 1.4816, + "step": 31049 + }, + { + "epoch": 2.44, + "learning_rate": 2.4788630267201114e-05, + "loss": 1.4487, + "step": 31050 + }, + { + "epoch": 2.44, + "learning_rate": 2.478182493133998e-05, + "loss": 1.4752, + "step": 31051 + }, + { + "epoch": 2.44, + "learning_rate": 2.47750204456412e-05, + "loss": 1.4499, + "step": 31052 + }, + { + "epoch": 2.44, + "learning_rate": 2.4768216810150905e-05, + "loss": 1.4564, + "step": 31053 + }, + { + "epoch": 2.44, + "learning_rate": 2.4761414024915327e-05, + "loss": 1.4563, + "step": 31054 + }, + { + "epoch": 2.44, + "learning_rate": 2.475461208998058e-05, + "loss": 1.439, + "step": 31055 + }, + { + "epoch": 2.44, + "learning_rate": 2.474781100539294e-05, + "loss": 1.4576, + "step": 31056 + }, + { + "epoch": 2.44, + "learning_rate": 2.474101077119856e-05, + "loss": 1.4357, + "step": 31057 + }, + { + "epoch": 2.44, + "learning_rate": 2.4734211387443547e-05, + "loss": 1.4416, + "step": 31058 + }, + { + "epoch": 2.44, + "learning_rate": 2.472741285417415e-05, + "loss": 1.4702, + "step": 31059 + }, + { + "epoch": 2.44, + "learning_rate": 2.472061517143648e-05, + "loss": 1.4213, + "step": 31060 + }, + { + "epoch": 2.44, + "learning_rate": 2.4713818339276668e-05, + "loss": 1.4458, + "step": 31061 + }, + { + "epoch": 2.44, + "learning_rate": 2.470702235774093e-05, + "loss": 1.4537, + "step": 31062 + }, + { + "epoch": 2.44, + "learning_rate": 2.470022722687534e-05, + "loss": 1.4429, + "step": 31063 + }, + { + "epoch": 2.44, + "learning_rate": 2.4693432946726083e-05, + "loss": 1.3762, + "step": 31064 + }, + { + "epoch": 2.44, + "learning_rate": 2.4686639517339235e-05, + "loss": 1.4444, + "step": 31065 + }, + { + "epoch": 2.44, + "learning_rate": 2.4679846938760977e-05, + "loss": 1.4428, + "step": 31066 + }, + { + "epoch": 2.44, + "learning_rate": 2.4673055211037425e-05, + "loss": 1.4566, + "step": 31067 + }, + { + "epoch": 2.44, + "learning_rate": 2.4666264334214603e-05, + "loss": 1.4824, + "step": 31068 + }, + { + "epoch": 2.44, + "learning_rate": 2.4659474308338745e-05, + "loss": 1.5117, + "step": 31069 + }, + { + "epoch": 2.44, + "learning_rate": 2.4652685133455863e-05, + "loss": 1.4178, + "step": 31070 + }, + { + "epoch": 2.44, + "learning_rate": 2.464589680961209e-05, + "loss": 1.4635, + "step": 31071 + }, + { + "epoch": 2.44, + "learning_rate": 2.4639109336853464e-05, + "loss": 1.4534, + "step": 31072 + }, + { + "epoch": 2.44, + "learning_rate": 2.4632322715226138e-05, + "loss": 1.4089, + "step": 31073 + }, + { + "epoch": 2.44, + "learning_rate": 2.462553694477616e-05, + "loss": 1.4325, + "step": 31074 + }, + { + "epoch": 2.45, + "learning_rate": 2.4618752025549554e-05, + "loss": 1.4531, + "step": 31075 + }, + { + "epoch": 2.45, + "learning_rate": 2.461196795759249e-05, + "loss": 1.3969, + "step": 31076 + }, + { + "epoch": 2.45, + "learning_rate": 2.460518474095094e-05, + "loss": 1.4551, + "step": 31077 + }, + { + "epoch": 2.45, + "learning_rate": 2.459840237567097e-05, + "loss": 1.4404, + "step": 31078 + }, + { + "epoch": 2.45, + "learning_rate": 2.4591620861798634e-05, + "loss": 1.4121, + "step": 31079 + }, + { + "epoch": 2.45, + "learning_rate": 2.4584840199380034e-05, + "loss": 1.4009, + "step": 31080 + }, + { + "epoch": 2.45, + "learning_rate": 2.4578060388461156e-05, + "loss": 1.4596, + "step": 31081 + }, + { + "epoch": 2.45, + "learning_rate": 2.4571281429087997e-05, + "loss": 1.418, + "step": 31082 + }, + { + "epoch": 2.45, + "learning_rate": 2.456450332130665e-05, + "loss": 1.437, + "step": 31083 + }, + { + "epoch": 2.45, + "learning_rate": 2.4557726065163114e-05, + "loss": 1.4418, + "step": 31084 + }, + { + "epoch": 2.45, + "learning_rate": 2.455094966070335e-05, + "loss": 1.4463, + "step": 31085 + }, + { + "epoch": 2.45, + "learning_rate": 2.454417410797344e-05, + "loss": 1.4751, + "step": 31086 + }, + { + "epoch": 2.45, + "learning_rate": 2.4537399407019366e-05, + "loss": 1.4386, + "step": 31087 + }, + { + "epoch": 2.45, + "learning_rate": 2.4530625557887118e-05, + "loss": 1.4884, + "step": 31088 + }, + { + "epoch": 2.45, + "learning_rate": 2.452385256062263e-05, + "loss": 1.4076, + "step": 31089 + }, + { + "epoch": 2.45, + "learning_rate": 2.4517080415272002e-05, + "loss": 1.4693, + "step": 31090 + }, + { + "epoch": 2.45, + "learning_rate": 2.4510309121881122e-05, + "loss": 1.4318, + "step": 31091 + }, + { + "epoch": 2.45, + "learning_rate": 2.4503538680495977e-05, + "loss": 1.4541, + "step": 31092 + }, + { + "epoch": 2.45, + "learning_rate": 2.4496769091162576e-05, + "loss": 1.4544, + "step": 31093 + }, + { + "epoch": 2.45, + "learning_rate": 2.4490000353926853e-05, + "loss": 1.401, + "step": 31094 + }, + { + "epoch": 2.45, + "learning_rate": 2.4483232468834736e-05, + "loss": 1.4023, + "step": 31095 + }, + { + "epoch": 2.45, + "learning_rate": 2.44764654359322e-05, + "loss": 1.4569, + "step": 31096 + }, + { + "epoch": 2.45, + "learning_rate": 2.4469699255265235e-05, + "loss": 1.4696, + "step": 31097 + }, + { + "epoch": 2.45, + "learning_rate": 2.446293392687973e-05, + "loss": 1.445, + "step": 31098 + }, + { + "epoch": 2.45, + "learning_rate": 2.4456169450821584e-05, + "loss": 1.4534, + "step": 31099 + }, + { + "epoch": 2.45, + "learning_rate": 2.4449405827136825e-05, + "loss": 1.461, + "step": 31100 + }, + { + "epoch": 2.45, + "learning_rate": 2.4442643055871303e-05, + "loss": 1.4793, + "step": 31101 + }, + { + "epoch": 2.45, + "learning_rate": 2.4435881137070913e-05, + "loss": 1.4723, + "step": 31102 + }, + { + "epoch": 2.45, + "learning_rate": 2.442912007078163e-05, + "loss": 1.4069, + "step": 31103 + }, + { + "epoch": 2.45, + "learning_rate": 2.442235985704933e-05, + "loss": 1.4546, + "step": 31104 + }, + { + "epoch": 2.45, + "learning_rate": 2.441560049591986e-05, + "loss": 1.4421, + "step": 31105 + }, + { + "epoch": 2.45, + "learning_rate": 2.4408841987439214e-05, + "loss": 1.4769, + "step": 31106 + }, + { + "epoch": 2.45, + "learning_rate": 2.4402084331653217e-05, + "loss": 1.4279, + "step": 31107 + }, + { + "epoch": 2.45, + "learning_rate": 2.439532752860776e-05, + "loss": 1.4573, + "step": 31108 + }, + { + "epoch": 2.45, + "learning_rate": 2.4388571578348665e-05, + "loss": 1.4767, + "step": 31109 + }, + { + "epoch": 2.45, + "learning_rate": 2.4381816480921856e-05, + "loss": 1.4604, + "step": 31110 + }, + { + "epoch": 2.45, + "learning_rate": 2.4375062236373234e-05, + "loss": 1.4026, + "step": 31111 + }, + { + "epoch": 2.45, + "learning_rate": 2.4368308844748625e-05, + "loss": 1.4333, + "step": 31112 + }, + { + "epoch": 2.45, + "learning_rate": 2.436155630609381e-05, + "loss": 1.4537, + "step": 31113 + }, + { + "epoch": 2.45, + "learning_rate": 2.4354804620454738e-05, + "loss": 1.4116, + "step": 31114 + }, + { + "epoch": 2.45, + "learning_rate": 2.434805378787722e-05, + "loss": 1.4354, + "step": 31115 + }, + { + "epoch": 2.45, + "learning_rate": 2.434130380840702e-05, + "loss": 1.4148, + "step": 31116 + }, + { + "epoch": 2.45, + "learning_rate": 2.433455468209007e-05, + "loss": 1.5019, + "step": 31117 + }, + { + "epoch": 2.45, + "learning_rate": 2.4327806408972146e-05, + "loss": 1.457, + "step": 31118 + }, + { + "epoch": 2.45, + "learning_rate": 2.4321058989099012e-05, + "loss": 1.4415, + "step": 31119 + }, + { + "epoch": 2.45, + "learning_rate": 2.4314312422516587e-05, + "loss": 1.4831, + "step": 31120 + }, + { + "epoch": 2.45, + "learning_rate": 2.4307566709270626e-05, + "loss": 1.4729, + "step": 31121 + }, + { + "epoch": 2.45, + "learning_rate": 2.4300821849406866e-05, + "loss": 1.4277, + "step": 31122 + }, + { + "epoch": 2.45, + "learning_rate": 2.4294077842971216e-05, + "loss": 1.4618, + "step": 31123 + }, + { + "epoch": 2.45, + "learning_rate": 2.428733469000939e-05, + "loss": 1.4431, + "step": 31124 + }, + { + "epoch": 2.45, + "learning_rate": 2.4280592390567204e-05, + "loss": 1.4488, + "step": 31125 + }, + { + "epoch": 2.45, + "learning_rate": 2.427385094469034e-05, + "loss": 1.4629, + "step": 31126 + }, + { + "epoch": 2.45, + "learning_rate": 2.4267110352424718e-05, + "loss": 1.4248, + "step": 31127 + }, + { + "epoch": 2.45, + "learning_rate": 2.4260370613816025e-05, + "loss": 1.4445, + "step": 31128 + }, + { + "epoch": 2.45, + "learning_rate": 2.4253631728910045e-05, + "loss": 1.4406, + "step": 31129 + }, + { + "epoch": 2.45, + "learning_rate": 2.424689369775245e-05, + "loss": 1.4342, + "step": 31130 + }, + { + "epoch": 2.45, + "learning_rate": 2.424015652038911e-05, + "loss": 1.3804, + "step": 31131 + }, + { + "epoch": 2.45, + "learning_rate": 2.42334201968657e-05, + "loss": 1.4492, + "step": 31132 + }, + { + "epoch": 2.45, + "learning_rate": 2.422668472722792e-05, + "loss": 1.5045, + "step": 31133 + }, + { + "epoch": 2.45, + "learning_rate": 2.421995011152158e-05, + "loss": 1.535, + "step": 31134 + }, + { + "epoch": 2.45, + "learning_rate": 2.421321634979238e-05, + "loss": 1.4892, + "step": 31135 + }, + { + "epoch": 2.45, + "learning_rate": 2.4206483442085983e-05, + "loss": 1.4522, + "step": 31136 + }, + { + "epoch": 2.45, + "learning_rate": 2.4199751388448186e-05, + "loss": 1.4347, + "step": 31137 + }, + { + "epoch": 2.45, + "learning_rate": 2.4193020188924632e-05, + "loss": 1.4378, + "step": 31138 + }, + { + "epoch": 2.45, + "learning_rate": 2.418628984356104e-05, + "loss": 1.4444, + "step": 31139 + }, + { + "epoch": 2.45, + "learning_rate": 2.417956035240312e-05, + "loss": 1.4625, + "step": 31140 + }, + { + "epoch": 2.45, + "learning_rate": 2.4172831715496572e-05, + "loss": 1.4585, + "step": 31141 + }, + { + "epoch": 2.45, + "learning_rate": 2.4166103932887004e-05, + "loss": 1.4234, + "step": 31142 + }, + { + "epoch": 2.45, + "learning_rate": 2.4159377004620167e-05, + "loss": 1.4099, + "step": 31143 + }, + { + "epoch": 2.45, + "learning_rate": 2.415265093074174e-05, + "loss": 1.4721, + "step": 31144 + }, + { + "epoch": 2.45, + "learning_rate": 2.414592571129737e-05, + "loss": 1.4552, + "step": 31145 + }, + { + "epoch": 2.45, + "learning_rate": 2.413920134633272e-05, + "loss": 1.4444, + "step": 31146 + }, + { + "epoch": 2.45, + "learning_rate": 2.4132477835893387e-05, + "loss": 1.5256, + "step": 31147 + }, + { + "epoch": 2.45, + "learning_rate": 2.412575518002512e-05, + "loss": 1.4059, + "step": 31148 + }, + { + "epoch": 2.45, + "learning_rate": 2.4119033378773494e-05, + "loss": 1.4617, + "step": 31149 + }, + { + "epoch": 2.45, + "learning_rate": 2.4112312432184144e-05, + "loss": 1.4292, + "step": 31150 + }, + { + "epoch": 2.45, + "learning_rate": 2.4105592340302764e-05, + "loss": 1.4498, + "step": 31151 + }, + { + "epoch": 2.45, + "learning_rate": 2.4098873103174922e-05, + "loss": 1.4317, + "step": 31152 + }, + { + "epoch": 2.45, + "learning_rate": 2.4092154720846224e-05, + "loss": 1.451, + "step": 31153 + }, + { + "epoch": 2.45, + "learning_rate": 2.408543719336234e-05, + "loss": 1.4842, + "step": 31154 + }, + { + "epoch": 2.45, + "learning_rate": 2.407872052076886e-05, + "loss": 1.4408, + "step": 31155 + }, + { + "epoch": 2.45, + "learning_rate": 2.4072004703111343e-05, + "loss": 1.4382, + "step": 31156 + }, + { + "epoch": 2.45, + "learning_rate": 2.4065289740435424e-05, + "loss": 1.4703, + "step": 31157 + }, + { + "epoch": 2.45, + "learning_rate": 2.405857563278672e-05, + "loss": 1.4315, + "step": 31158 + }, + { + "epoch": 2.45, + "learning_rate": 2.4051862380210795e-05, + "loss": 1.4623, + "step": 31159 + }, + { + "epoch": 2.45, + "learning_rate": 2.404514998275318e-05, + "loss": 1.4865, + "step": 31160 + }, + { + "epoch": 2.45, + "learning_rate": 2.4038438440459522e-05, + "loss": 1.4754, + "step": 31161 + }, + { + "epoch": 2.45, + "learning_rate": 2.403172775337537e-05, + "loss": 1.4601, + "step": 31162 + }, + { + "epoch": 2.45, + "learning_rate": 2.402501792154623e-05, + "loss": 1.4995, + "step": 31163 + }, + { + "epoch": 2.45, + "learning_rate": 2.4018308945017724e-05, + "loss": 1.4896, + "step": 31164 + }, + { + "epoch": 2.45, + "learning_rate": 2.401160082383539e-05, + "loss": 1.4523, + "step": 31165 + }, + { + "epoch": 2.45, + "learning_rate": 2.4004893558044752e-05, + "loss": 1.446, + "step": 31166 + }, + { + "epoch": 2.45, + "learning_rate": 2.3998187147691315e-05, + "loss": 1.3967, + "step": 31167 + }, + { + "epoch": 2.45, + "learning_rate": 2.3991481592820698e-05, + "loss": 1.3914, + "step": 31168 + }, + { + "epoch": 2.45, + "learning_rate": 2.3984776893478395e-05, + "loss": 1.4424, + "step": 31169 + }, + { + "epoch": 2.45, + "learning_rate": 2.3978073049709873e-05, + "loss": 1.4604, + "step": 31170 + }, + { + "epoch": 2.45, + "learning_rate": 2.3971370061560708e-05, + "loss": 1.4714, + "step": 31171 + }, + { + "epoch": 2.45, + "learning_rate": 2.3964667929076414e-05, + "loss": 1.4017, + "step": 31172 + }, + { + "epoch": 2.45, + "learning_rate": 2.3957966652302424e-05, + "loss": 1.4378, + "step": 31173 + }, + { + "epoch": 2.45, + "learning_rate": 2.39512662312843e-05, + "loss": 1.4352, + "step": 31174 + }, + { + "epoch": 2.45, + "learning_rate": 2.3944566666067538e-05, + "loss": 1.3578, + "step": 31175 + }, + { + "epoch": 2.45, + "learning_rate": 2.393786795669762e-05, + "loss": 1.464, + "step": 31176 + }, + { + "epoch": 2.45, + "learning_rate": 2.393117010321996e-05, + "loss": 1.4586, + "step": 31177 + }, + { + "epoch": 2.45, + "learning_rate": 2.3924473105680137e-05, + "loss": 1.4205, + "step": 31178 + }, + { + "epoch": 2.45, + "learning_rate": 2.3917776964123547e-05, + "loss": 1.4878, + "step": 31179 + }, + { + "epoch": 2.45, + "learning_rate": 2.3911081678595655e-05, + "loss": 1.5079, + "step": 31180 + }, + { + "epoch": 2.45, + "learning_rate": 2.390438724914196e-05, + "loss": 1.4287, + "step": 31181 + }, + { + "epoch": 2.45, + "learning_rate": 2.3897693675807904e-05, + "loss": 1.377, + "step": 31182 + }, + { + "epoch": 2.45, + "learning_rate": 2.3891000958638905e-05, + "loss": 1.48, + "step": 31183 + }, + { + "epoch": 2.45, + "learning_rate": 2.3884309097680394e-05, + "loss": 1.4446, + "step": 31184 + }, + { + "epoch": 2.45, + "learning_rate": 2.3877618092977864e-05, + "loss": 1.4572, + "step": 31185 + }, + { + "epoch": 2.45, + "learning_rate": 2.3870927944576695e-05, + "loss": 1.4076, + "step": 31186 + }, + { + "epoch": 2.45, + "learning_rate": 2.386423865252229e-05, + "loss": 1.429, + "step": 31187 + }, + { + "epoch": 2.45, + "learning_rate": 2.385755021686014e-05, + "loss": 1.46, + "step": 31188 + }, + { + "epoch": 2.45, + "learning_rate": 2.385086263763556e-05, + "loss": 1.4844, + "step": 31189 + }, + { + "epoch": 2.45, + "learning_rate": 2.3844175914894065e-05, + "loss": 1.4016, + "step": 31190 + }, + { + "epoch": 2.45, + "learning_rate": 2.383749004868095e-05, + "loss": 1.4753, + "step": 31191 + }, + { + "epoch": 2.45, + "learning_rate": 2.3830805039041682e-05, + "loss": 1.4942, + "step": 31192 + }, + { + "epoch": 2.45, + "learning_rate": 2.3824120886021643e-05, + "loss": 1.4451, + "step": 31193 + }, + { + "epoch": 2.45, + "learning_rate": 2.3817437589666138e-05, + "loss": 1.4295, + "step": 31194 + }, + { + "epoch": 2.45, + "learning_rate": 2.3810755150020637e-05, + "loss": 1.4035, + "step": 31195 + }, + { + "epoch": 2.45, + "learning_rate": 2.3804073567130487e-05, + "loss": 1.4272, + "step": 31196 + }, + { + "epoch": 2.45, + "learning_rate": 2.3797392841040984e-05, + "loss": 1.4546, + "step": 31197 + }, + { + "epoch": 2.45, + "learning_rate": 2.3790712971797592e-05, + "loss": 1.3829, + "step": 31198 + }, + { + "epoch": 2.45, + "learning_rate": 2.378403395944559e-05, + "loss": 1.4444, + "step": 31199 + }, + { + "epoch": 2.45, + "learning_rate": 2.3777355804030362e-05, + "loss": 1.4131, + "step": 31200 + }, + { + "epoch": 2.45, + "learning_rate": 2.37706785055972e-05, + "loss": 1.4353, + "step": 31201 + }, + { + "epoch": 2.46, + "learning_rate": 2.376400206419149e-05, + "loss": 1.4052, + "step": 31202 + }, + { + "epoch": 2.46, + "learning_rate": 2.3757326479858556e-05, + "loss": 1.4955, + "step": 31203 + }, + { + "epoch": 2.46, + "learning_rate": 2.3750651752643667e-05, + "loss": 1.435, + "step": 31204 + }, + { + "epoch": 2.46, + "learning_rate": 2.3743977882592185e-05, + "loss": 1.4441, + "step": 31205 + }, + { + "epoch": 2.46, + "learning_rate": 2.3737304869749458e-05, + "loss": 1.3819, + "step": 31206 + }, + { + "epoch": 2.46, + "learning_rate": 2.3730632714160746e-05, + "loss": 1.4665, + "step": 31207 + }, + { + "epoch": 2.46, + "learning_rate": 2.3723961415871336e-05, + "loss": 1.4526, + "step": 31208 + }, + { + "epoch": 2.46, + "learning_rate": 2.3717290974926567e-05, + "loss": 1.4552, + "step": 31209 + }, + { + "epoch": 2.46, + "learning_rate": 2.371062139137171e-05, + "loss": 1.4796, + "step": 31210 + }, + { + "epoch": 2.46, + "learning_rate": 2.370395266525199e-05, + "loss": 1.5206, + "step": 31211 + }, + { + "epoch": 2.46, + "learning_rate": 2.3697284796612793e-05, + "loss": 1.4784, + "step": 31212 + }, + { + "epoch": 2.46, + "learning_rate": 2.369061778549931e-05, + "loss": 1.4701, + "step": 31213 + }, + { + "epoch": 2.46, + "learning_rate": 2.368395163195681e-05, + "loss": 1.4006, + "step": 31214 + }, + { + "epoch": 2.46, + "learning_rate": 2.3677286336030604e-05, + "loss": 1.4659, + "step": 31215 + }, + { + "epoch": 2.46, + "learning_rate": 2.3670621897765905e-05, + "loss": 1.4319, + "step": 31216 + }, + { + "epoch": 2.46, + "learning_rate": 2.3663958317207948e-05, + "loss": 1.4842, + "step": 31217 + }, + { + "epoch": 2.46, + "learning_rate": 2.3657295594402024e-05, + "loss": 1.457, + "step": 31218 + }, + { + "epoch": 2.46, + "learning_rate": 2.3650633729393336e-05, + "loss": 1.4688, + "step": 31219 + }, + { + "epoch": 2.46, + "learning_rate": 2.3643972722227094e-05, + "loss": 1.438, + "step": 31220 + }, + { + "epoch": 2.46, + "learning_rate": 2.3637312572948547e-05, + "loss": 1.4195, + "step": 31221 + }, + { + "epoch": 2.46, + "learning_rate": 2.363065328160294e-05, + "loss": 1.4234, + "step": 31222 + }, + { + "epoch": 2.46, + "learning_rate": 2.3623994848235473e-05, + "loss": 1.4118, + "step": 31223 + }, + { + "epoch": 2.46, + "learning_rate": 2.3617337272891325e-05, + "loss": 1.4733, + "step": 31224 + }, + { + "epoch": 2.46, + "learning_rate": 2.361068055561569e-05, + "loss": 1.4802, + "step": 31225 + }, + { + "epoch": 2.46, + "learning_rate": 2.3604024696453822e-05, + "loss": 1.4538, + "step": 31226 + }, + { + "epoch": 2.46, + "learning_rate": 2.359736969545088e-05, + "loss": 1.4308, + "step": 31227 + }, + { + "epoch": 2.46, + "learning_rate": 2.3590715552651995e-05, + "loss": 1.4748, + "step": 31228 + }, + { + "epoch": 2.46, + "learning_rate": 2.3584062268102434e-05, + "loss": 1.4201, + "step": 31229 + }, + { + "epoch": 2.46, + "learning_rate": 2.3577409841847324e-05, + "loss": 1.4184, + "step": 31230 + }, + { + "epoch": 2.46, + "learning_rate": 2.357075827393181e-05, + "loss": 1.4058, + "step": 31231 + }, + { + "epoch": 2.46, + "learning_rate": 2.3564107564401115e-05, + "loss": 1.4445, + "step": 31232 + }, + { + "epoch": 2.46, + "learning_rate": 2.355745771330034e-05, + "loss": 1.468, + "step": 31233 + }, + { + "epoch": 2.46, + "learning_rate": 2.355080872067463e-05, + "loss": 1.4186, + "step": 31234 + }, + { + "epoch": 2.46, + "learning_rate": 2.3544160586569172e-05, + "loss": 1.5129, + "step": 31235 + }, + { + "epoch": 2.46, + "learning_rate": 2.353751331102905e-05, + "loss": 1.4643, + "step": 31236 + }, + { + "epoch": 2.46, + "learning_rate": 2.353086689409946e-05, + "loss": 1.4384, + "step": 31237 + }, + { + "epoch": 2.46, + "learning_rate": 2.3524221335825465e-05, + "loss": 1.4278, + "step": 31238 + }, + { + "epoch": 2.46, + "learning_rate": 2.3517576636252235e-05, + "loss": 1.4622, + "step": 31239 + }, + { + "epoch": 2.46, + "learning_rate": 2.351093279542486e-05, + "loss": 1.4463, + "step": 31240 + }, + { + "epoch": 2.46, + "learning_rate": 2.3504289813388454e-05, + "loss": 1.4627, + "step": 31241 + }, + { + "epoch": 2.46, + "learning_rate": 2.349764769018809e-05, + "loss": 1.4293, + "step": 31242 + }, + { + "epoch": 2.46, + "learning_rate": 2.3491006425868903e-05, + "loss": 1.4729, + "step": 31243 + }, + { + "epoch": 2.46, + "learning_rate": 2.348436602047598e-05, + "loss": 1.4093, + "step": 31244 + }, + { + "epoch": 2.46, + "learning_rate": 2.347772647405437e-05, + "loss": 1.4021, + "step": 31245 + }, + { + "epoch": 2.46, + "learning_rate": 2.3471087786649202e-05, + "loss": 1.4208, + "step": 31246 + }, + { + "epoch": 2.46, + "learning_rate": 2.346444995830552e-05, + "loss": 1.4934, + "step": 31247 + }, + { + "epoch": 2.46, + "learning_rate": 2.345781298906836e-05, + "loss": 1.4185, + "step": 31248 + }, + { + "epoch": 2.46, + "learning_rate": 2.3451176878982848e-05, + "loss": 1.4092, + "step": 31249 + }, + { + "epoch": 2.46, + "learning_rate": 2.3444541628094017e-05, + "loss": 1.4601, + "step": 31250 + }, + { + "epoch": 2.46, + "learning_rate": 2.343790723644688e-05, + "loss": 1.4554, + "step": 31251 + }, + { + "epoch": 2.46, + "learning_rate": 2.34312737040865e-05, + "loss": 1.4647, + "step": 31252 + }, + { + "epoch": 2.46, + "learning_rate": 2.3424641031057962e-05, + "loss": 1.4115, + "step": 31253 + }, + { + "epoch": 2.46, + "learning_rate": 2.341800921740626e-05, + "loss": 1.438, + "step": 31254 + }, + { + "epoch": 2.46, + "learning_rate": 2.341137826317639e-05, + "loss": 1.4265, + "step": 31255 + }, + { + "epoch": 2.46, + "learning_rate": 2.3404748168413434e-05, + "loss": 1.411, + "step": 31256 + }, + { + "epoch": 2.46, + "learning_rate": 2.339811893316239e-05, + "loss": 1.4131, + "step": 31257 + }, + { + "epoch": 2.46, + "learning_rate": 2.339149055746824e-05, + "loss": 1.438, + "step": 31258 + }, + { + "epoch": 2.46, + "learning_rate": 2.3384863041375963e-05, + "loss": 1.447, + "step": 31259 + }, + { + "epoch": 2.46, + "learning_rate": 2.3378236384930638e-05, + "loss": 1.5095, + "step": 31260 + }, + { + "epoch": 2.46, + "learning_rate": 2.3371610588177214e-05, + "loss": 1.4418, + "step": 31261 + }, + { + "epoch": 2.46, + "learning_rate": 2.336498565116064e-05, + "loss": 1.4122, + "step": 31262 + }, + { + "epoch": 2.46, + "learning_rate": 2.335836157392596e-05, + "loss": 1.4596, + "step": 31263 + }, + { + "epoch": 2.46, + "learning_rate": 2.3351738356518125e-05, + "loss": 1.4458, + "step": 31264 + }, + { + "epoch": 2.46, + "learning_rate": 2.334511599898206e-05, + "loss": 1.443, + "step": 31265 + }, + { + "epoch": 2.46, + "learning_rate": 2.3338494501362786e-05, + "loss": 1.4224, + "step": 31266 + }, + { + "epoch": 2.46, + "learning_rate": 2.3331873863705214e-05, + "loss": 1.4263, + "step": 31267 + }, + { + "epoch": 2.46, + "learning_rate": 2.3325254086054356e-05, + "loss": 1.4392, + "step": 31268 + }, + { + "epoch": 2.46, + "learning_rate": 2.3318635168455063e-05, + "loss": 1.4394, + "step": 31269 + }, + { + "epoch": 2.46, + "learning_rate": 2.331201711095238e-05, + "loss": 1.5033, + "step": 31270 + }, + { + "epoch": 2.46, + "learning_rate": 2.330539991359119e-05, + "loss": 1.4304, + "step": 31271 + }, + { + "epoch": 2.46, + "learning_rate": 2.3298783576416385e-05, + "loss": 1.4192, + "step": 31272 + }, + { + "epoch": 2.46, + "learning_rate": 2.3292168099472937e-05, + "loss": 1.4043, + "step": 31273 + }, + { + "epoch": 2.46, + "learning_rate": 2.328555348280577e-05, + "loss": 1.4287, + "step": 31274 + }, + { + "epoch": 2.46, + "learning_rate": 2.3278939726459716e-05, + "loss": 1.4253, + "step": 31275 + }, + { + "epoch": 2.46, + "learning_rate": 2.327232683047976e-05, + "loss": 1.4808, + "step": 31276 + }, + { + "epoch": 2.46, + "learning_rate": 2.3265714794910776e-05, + "loss": 1.4615, + "step": 31277 + }, + { + "epoch": 2.46, + "learning_rate": 2.325910361979767e-05, + "loss": 1.4306, + "step": 31278 + }, + { + "epoch": 2.46, + "learning_rate": 2.3252493305185248e-05, + "loss": 1.4141, + "step": 31279 + }, + { + "epoch": 2.46, + "learning_rate": 2.3245883851118496e-05, + "loss": 1.4562, + "step": 31280 + }, + { + "epoch": 2.46, + "learning_rate": 2.323927525764226e-05, + "loss": 1.4225, + "step": 31281 + }, + { + "epoch": 2.46, + "learning_rate": 2.3232667524801335e-05, + "loss": 1.4491, + "step": 31282 + }, + { + "epoch": 2.46, + "learning_rate": 2.3226060652640656e-05, + "loss": 1.4224, + "step": 31283 + }, + { + "epoch": 2.46, + "learning_rate": 2.321945464120508e-05, + "loss": 1.4639, + "step": 31284 + }, + { + "epoch": 2.46, + "learning_rate": 2.3212849490539463e-05, + "loss": 1.4592, + "step": 31285 + }, + { + "epoch": 2.46, + "learning_rate": 2.32062452006886e-05, + "loss": 1.4645, + "step": 31286 + }, + { + "epoch": 2.46, + "learning_rate": 2.3199641771697386e-05, + "loss": 1.4779, + "step": 31287 + }, + { + "epoch": 2.46, + "learning_rate": 2.319303920361062e-05, + "loss": 1.4229, + "step": 31288 + }, + { + "epoch": 2.46, + "learning_rate": 2.3186437496473115e-05, + "loss": 1.4488, + "step": 31289 + }, + { + "epoch": 2.46, + "learning_rate": 2.3179836650329752e-05, + "loss": 1.46, + "step": 31290 + }, + { + "epoch": 2.46, + "learning_rate": 2.317323666522533e-05, + "loss": 1.4377, + "step": 31291 + }, + { + "epoch": 2.46, + "learning_rate": 2.316663754120458e-05, + "loss": 1.4836, + "step": 31292 + }, + { + "epoch": 2.46, + "learning_rate": 2.3160039278312416e-05, + "loss": 1.4488, + "step": 31293 + }, + { + "epoch": 2.46, + "learning_rate": 2.3153441876593597e-05, + "loss": 1.4797, + "step": 31294 + }, + { + "epoch": 2.46, + "learning_rate": 2.3146845336092895e-05, + "loss": 1.4706, + "step": 31295 + }, + { + "epoch": 2.46, + "learning_rate": 2.3140249656855087e-05, + "loss": 1.4348, + "step": 31296 + }, + { + "epoch": 2.46, + "learning_rate": 2.3133654838925005e-05, + "loss": 1.4942, + "step": 31297 + }, + { + "epoch": 2.46, + "learning_rate": 2.3127060882347392e-05, + "loss": 1.4773, + "step": 31298 + }, + { + "epoch": 2.46, + "learning_rate": 2.3120467787166986e-05, + "loss": 1.4479, + "step": 31299 + }, + { + "epoch": 2.46, + "learning_rate": 2.3113875553428597e-05, + "loss": 1.4149, + "step": 31300 + }, + { + "epoch": 2.46, + "learning_rate": 2.3107284181176987e-05, + "loss": 1.4218, + "step": 31301 + }, + { + "epoch": 2.46, + "learning_rate": 2.310069367045691e-05, + "loss": 1.4829, + "step": 31302 + }, + { + "epoch": 2.46, + "learning_rate": 2.309410402131306e-05, + "loss": 1.4999, + "step": 31303 + }, + { + "epoch": 2.46, + "learning_rate": 2.308751523379023e-05, + "loss": 1.4297, + "step": 31304 + }, + { + "epoch": 2.46, + "learning_rate": 2.308092730793316e-05, + "loss": 1.3891, + "step": 31305 + }, + { + "epoch": 2.46, + "learning_rate": 2.3074340243786494e-05, + "loss": 1.4166, + "step": 31306 + }, + { + "epoch": 2.46, + "learning_rate": 2.306775404139506e-05, + "loss": 1.4152, + "step": 31307 + }, + { + "epoch": 2.46, + "learning_rate": 2.306116870080354e-05, + "loss": 1.4152, + "step": 31308 + }, + { + "epoch": 2.46, + "learning_rate": 2.3054584222056583e-05, + "loss": 1.4906, + "step": 31309 + }, + { + "epoch": 2.46, + "learning_rate": 2.3048000605198986e-05, + "loss": 1.4997, + "step": 31310 + }, + { + "epoch": 2.46, + "learning_rate": 2.3041417850275395e-05, + "loss": 1.42, + "step": 31311 + }, + { + "epoch": 2.46, + "learning_rate": 2.3034835957330526e-05, + "loss": 1.494, + "step": 31312 + }, + { + "epoch": 2.46, + "learning_rate": 2.302825492640903e-05, + "loss": 1.4129, + "step": 31313 + }, + { + "epoch": 2.46, + "learning_rate": 2.302167475755563e-05, + "loss": 1.4222, + "step": 31314 + }, + { + "epoch": 2.46, + "learning_rate": 2.3015095450814962e-05, + "loss": 1.4539, + "step": 31315 + }, + { + "epoch": 2.46, + "learning_rate": 2.3008517006231725e-05, + "loss": 1.4941, + "step": 31316 + }, + { + "epoch": 2.46, + "learning_rate": 2.3001939423850595e-05, + "loss": 1.3757, + "step": 31317 + }, + { + "epoch": 2.46, + "learning_rate": 2.2995362703716226e-05, + "loss": 1.4533, + "step": 31318 + }, + { + "epoch": 2.46, + "learning_rate": 2.298878684587326e-05, + "loss": 1.4786, + "step": 31319 + }, + { + "epoch": 2.46, + "learning_rate": 2.298221185036631e-05, + "loss": 1.4346, + "step": 31320 + }, + { + "epoch": 2.46, + "learning_rate": 2.2975637717240065e-05, + "loss": 1.4382, + "step": 31321 + }, + { + "epoch": 2.46, + "learning_rate": 2.296906444653915e-05, + "loss": 1.4275, + "step": 31322 + }, + { + "epoch": 2.46, + "learning_rate": 2.296249203830816e-05, + "loss": 1.405, + "step": 31323 + }, + { + "epoch": 2.46, + "learning_rate": 2.2955920492591766e-05, + "loss": 1.4492, + "step": 31324 + }, + { + "epoch": 2.46, + "learning_rate": 2.2949349809434566e-05, + "loss": 1.4717, + "step": 31325 + }, + { + "epoch": 2.46, + "learning_rate": 2.2942779988881133e-05, + "loss": 1.4796, + "step": 31326 + }, + { + "epoch": 2.46, + "learning_rate": 2.2936211030976153e-05, + "loss": 1.405, + "step": 31327 + }, + { + "epoch": 2.46, + "learning_rate": 2.2929642935764175e-05, + "loss": 1.4216, + "step": 31328 + }, + { + "epoch": 2.47, + "learning_rate": 2.292307570328976e-05, + "loss": 1.4538, + "step": 31329 + }, + { + "epoch": 2.47, + "learning_rate": 2.2916509333597527e-05, + "loss": 1.467, + "step": 31330 + }, + { + "epoch": 2.47, + "learning_rate": 2.2909943826732102e-05, + "loss": 1.479, + "step": 31331 + }, + { + "epoch": 2.47, + "learning_rate": 2.2903379182738035e-05, + "loss": 1.468, + "step": 31332 + }, + { + "epoch": 2.47, + "learning_rate": 2.2896815401659857e-05, + "loss": 1.4194, + "step": 31333 + }, + { + "epoch": 2.47, + "learning_rate": 2.289025248354218e-05, + "loss": 1.4243, + "step": 31334 + }, + { + "epoch": 2.47, + "learning_rate": 2.288369042842954e-05, + "loss": 1.4433, + "step": 31335 + }, + { + "epoch": 2.47, + "learning_rate": 2.2877129236366513e-05, + "loss": 1.4481, + "step": 31336 + }, + { + "epoch": 2.47, + "learning_rate": 2.2870568907397567e-05, + "loss": 1.4706, + "step": 31337 + }, + { + "epoch": 2.47, + "learning_rate": 2.2864009441567367e-05, + "loss": 1.5242, + "step": 31338 + }, + { + "epoch": 2.47, + "learning_rate": 2.2857450838920356e-05, + "loss": 1.4518, + "step": 31339 + }, + { + "epoch": 2.47, + "learning_rate": 2.2850893099501068e-05, + "loss": 1.4609, + "step": 31340 + }, + { + "epoch": 2.47, + "learning_rate": 2.2844336223354083e-05, + "loss": 1.4839, + "step": 31341 + }, + { + "epoch": 2.47, + "learning_rate": 2.283778021052388e-05, + "loss": 1.4364, + "step": 31342 + }, + { + "epoch": 2.47, + "learning_rate": 2.283122506105495e-05, + "loss": 1.4631, + "step": 31343 + }, + { + "epoch": 2.47, + "learning_rate": 2.282467077499186e-05, + "loss": 1.4382, + "step": 31344 + }, + { + "epoch": 2.47, + "learning_rate": 2.2818117352379066e-05, + "loss": 1.4232, + "step": 31345 + }, + { + "epoch": 2.47, + "learning_rate": 2.2811564793261034e-05, + "loss": 1.4044, + "step": 31346 + }, + { + "epoch": 2.47, + "learning_rate": 2.2805013097682308e-05, + "loss": 1.4361, + "step": 31347 + }, + { + "epoch": 2.47, + "learning_rate": 2.2798462265687366e-05, + "loss": 1.4452, + "step": 31348 + }, + { + "epoch": 2.47, + "learning_rate": 2.2791912297320664e-05, + "loss": 1.4355, + "step": 31349 + }, + { + "epoch": 2.47, + "learning_rate": 2.278536319262666e-05, + "loss": 1.4076, + "step": 31350 + }, + { + "epoch": 2.47, + "learning_rate": 2.277881495164987e-05, + "loss": 1.4407, + "step": 31351 + }, + { + "epoch": 2.47, + "learning_rate": 2.277226757443471e-05, + "loss": 1.4406, + "step": 31352 + }, + { + "epoch": 2.47, + "learning_rate": 2.276572106102566e-05, + "loss": 1.5, + "step": 31353 + }, + { + "epoch": 2.47, + "learning_rate": 2.27591754114671e-05, + "loss": 1.4339, + "step": 31354 + }, + { + "epoch": 2.47, + "learning_rate": 2.2752630625803562e-05, + "loss": 1.4077, + "step": 31355 + }, + { + "epoch": 2.47, + "learning_rate": 2.274608670407943e-05, + "loss": 1.5004, + "step": 31356 + }, + { + "epoch": 2.47, + "learning_rate": 2.273954364633913e-05, + "loss": 1.4149, + "step": 31357 + }, + { + "epoch": 2.47, + "learning_rate": 2.2733001452627116e-05, + "loss": 1.442, + "step": 31358 + }, + { + "epoch": 2.47, + "learning_rate": 2.2726460122987812e-05, + "loss": 1.4731, + "step": 31359 + }, + { + "epoch": 2.47, + "learning_rate": 2.2719919657465552e-05, + "loss": 1.4349, + "step": 31360 + }, + { + "epoch": 2.47, + "learning_rate": 2.271338005610485e-05, + "loss": 1.4738, + "step": 31361 + }, + { + "epoch": 2.47, + "learning_rate": 2.270684131895001e-05, + "loss": 1.4392, + "step": 31362 + }, + { + "epoch": 2.47, + "learning_rate": 2.2700303446045502e-05, + "loss": 1.4311, + "step": 31363 + }, + { + "epoch": 2.47, + "learning_rate": 2.2693766437435668e-05, + "loss": 1.4662, + "step": 31364 + }, + { + "epoch": 2.47, + "learning_rate": 2.2687230293164914e-05, + "loss": 1.3939, + "step": 31365 + }, + { + "epoch": 2.47, + "learning_rate": 2.268069501327763e-05, + "loss": 1.4371, + "step": 31366 + }, + { + "epoch": 2.47, + "learning_rate": 2.2674160597818135e-05, + "loss": 1.4451, + "step": 31367 + }, + { + "epoch": 2.47, + "learning_rate": 2.266762704683084e-05, + "loss": 1.4436, + "step": 31368 + }, + { + "epoch": 2.47, + "learning_rate": 2.2661094360360117e-05, + "loss": 1.3876, + "step": 31369 + }, + { + "epoch": 2.47, + "learning_rate": 2.2654562538450233e-05, + "loss": 1.4708, + "step": 31370 + }, + { + "epoch": 2.47, + "learning_rate": 2.2648031581145638e-05, + "loss": 1.4298, + "step": 31371 + }, + { + "epoch": 2.47, + "learning_rate": 2.2641501488490625e-05, + "loss": 1.4487, + "step": 31372 + }, + { + "epoch": 2.47, + "learning_rate": 2.2634972260529533e-05, + "loss": 1.4722, + "step": 31373 + }, + { + "epoch": 2.47, + "learning_rate": 2.262844389730667e-05, + "loss": 1.4405, + "step": 31374 + }, + { + "epoch": 2.47, + "learning_rate": 2.2621916398866417e-05, + "loss": 1.4915, + "step": 31375 + }, + { + "epoch": 2.47, + "learning_rate": 2.2615389765253045e-05, + "loss": 1.4387, + "step": 31376 + }, + { + "epoch": 2.47, + "learning_rate": 2.2608863996510862e-05, + "loss": 1.414, + "step": 31377 + }, + { + "epoch": 2.47, + "learning_rate": 2.2602339092684184e-05, + "loss": 1.4743, + "step": 31378 + }, + { + "epoch": 2.47, + "learning_rate": 2.2595815053817362e-05, + "loss": 1.444, + "step": 31379 + }, + { + "epoch": 2.47, + "learning_rate": 2.258929187995464e-05, + "loss": 1.4618, + "step": 31380 + }, + { + "epoch": 2.47, + "learning_rate": 2.2582769571140268e-05, + "loss": 1.4642, + "step": 31381 + }, + { + "epoch": 2.47, + "learning_rate": 2.2576248127418628e-05, + "loss": 1.4413, + "step": 31382 + }, + { + "epoch": 2.47, + "learning_rate": 2.256972754883395e-05, + "loss": 1.4722, + "step": 31383 + }, + { + "epoch": 2.47, + "learning_rate": 2.2563207835430446e-05, + "loss": 1.4308, + "step": 31384 + }, + { + "epoch": 2.47, + "learning_rate": 2.2556688987252486e-05, + "loss": 1.4667, + "step": 31385 + }, + { + "epoch": 2.47, + "learning_rate": 2.255017100434428e-05, + "loss": 1.4841, + "step": 31386 + }, + { + "epoch": 2.47, + "learning_rate": 2.2543653886750028e-05, + "loss": 1.4524, + "step": 31387 + }, + { + "epoch": 2.47, + "learning_rate": 2.253713763451408e-05, + "loss": 1.4574, + "step": 31388 + }, + { + "epoch": 2.47, + "learning_rate": 2.253062224768063e-05, + "loss": 1.4366, + "step": 31389 + }, + { + "epoch": 2.47, + "learning_rate": 2.2524107726293895e-05, + "loss": 1.4678, + "step": 31390 + }, + { + "epoch": 2.47, + "learning_rate": 2.2517594070398104e-05, + "loss": 1.3962, + "step": 31391 + }, + { + "epoch": 2.47, + "learning_rate": 2.2511081280037525e-05, + "loss": 1.4688, + "step": 31392 + }, + { + "epoch": 2.47, + "learning_rate": 2.2504569355256318e-05, + "loss": 1.4752, + "step": 31393 + }, + { + "epoch": 2.47, + "learning_rate": 2.2498058296098753e-05, + "loss": 1.4612, + "step": 31394 + }, + { + "epoch": 2.47, + "learning_rate": 2.2491548102608993e-05, + "loss": 1.4184, + "step": 31395 + }, + { + "epoch": 2.47, + "learning_rate": 2.2485038774831282e-05, + "loss": 1.4868, + "step": 31396 + }, + { + "epoch": 2.47, + "learning_rate": 2.247853031280979e-05, + "loss": 1.449, + "step": 31397 + }, + { + "epoch": 2.47, + "learning_rate": 2.247202271658866e-05, + "loss": 1.4589, + "step": 31398 + }, + { + "epoch": 2.47, + "learning_rate": 2.246551598621216e-05, + "loss": 1.4393, + "step": 31399 + }, + { + "epoch": 2.47, + "learning_rate": 2.2459010121724442e-05, + "loss": 1.4809, + "step": 31400 + }, + { + "epoch": 2.47, + "learning_rate": 2.245250512316961e-05, + "loss": 1.4773, + "step": 31401 + }, + { + "epoch": 2.47, + "learning_rate": 2.244600099059192e-05, + "loss": 1.4153, + "step": 31402 + }, + { + "epoch": 2.47, + "learning_rate": 2.2439497724035506e-05, + "loss": 1.4928, + "step": 31403 + }, + { + "epoch": 2.47, + "learning_rate": 2.2432995323544454e-05, + "loss": 1.4437, + "step": 31404 + }, + { + "epoch": 2.47, + "learning_rate": 2.242649378916301e-05, + "loss": 1.4445, + "step": 31405 + }, + { + "epoch": 2.47, + "learning_rate": 2.2419993120935274e-05, + "loss": 1.3964, + "step": 31406 + }, + { + "epoch": 2.47, + "learning_rate": 2.241349331890539e-05, + "loss": 1.4831, + "step": 31407 + }, + { + "epoch": 2.47, + "learning_rate": 2.240699438311743e-05, + "loss": 1.4319, + "step": 31408 + }, + { + "epoch": 2.47, + "learning_rate": 2.2400496313615567e-05, + "loss": 1.4518, + "step": 31409 + }, + { + "epoch": 2.47, + "learning_rate": 2.2393999110443962e-05, + "loss": 1.4279, + "step": 31410 + }, + { + "epoch": 2.47, + "learning_rate": 2.2387502773646678e-05, + "loss": 1.4922, + "step": 31411 + }, + { + "epoch": 2.47, + "learning_rate": 2.2381007303267777e-05, + "loss": 1.491, + "step": 31412 + }, + { + "epoch": 2.47, + "learning_rate": 2.2374512699351466e-05, + "loss": 1.4294, + "step": 31413 + }, + { + "epoch": 2.47, + "learning_rate": 2.2368018961941785e-05, + "loss": 1.4548, + "step": 31414 + }, + { + "epoch": 2.47, + "learning_rate": 2.2361526091082788e-05, + "loss": 1.4786, + "step": 31415 + }, + { + "epoch": 2.47, + "learning_rate": 2.235503408681862e-05, + "loss": 1.4356, + "step": 31416 + }, + { + "epoch": 2.47, + "learning_rate": 2.2348542949193326e-05, + "loss": 1.4123, + "step": 31417 + }, + { + "epoch": 2.47, + "learning_rate": 2.234205267825096e-05, + "loss": 1.4882, + "step": 31418 + }, + { + "epoch": 2.47, + "learning_rate": 2.2335563274035635e-05, + "loss": 1.4364, + "step": 31419 + }, + { + "epoch": 2.47, + "learning_rate": 2.232907473659138e-05, + "loss": 1.4224, + "step": 31420 + }, + { + "epoch": 2.47, + "learning_rate": 2.2322587065962226e-05, + "loss": 1.4108, + "step": 31421 + }, + { + "epoch": 2.47, + "learning_rate": 2.2316100262192277e-05, + "loss": 1.4266, + "step": 31422 + }, + { + "epoch": 2.47, + "learning_rate": 2.2309614325325544e-05, + "loss": 1.4847, + "step": 31423 + }, + { + "epoch": 2.47, + "learning_rate": 2.230312925540607e-05, + "loss": 1.4509, + "step": 31424 + }, + { + "epoch": 2.47, + "learning_rate": 2.2296645052477813e-05, + "loss": 1.452, + "step": 31425 + }, + { + "epoch": 2.47, + "learning_rate": 2.2290161716584932e-05, + "loss": 1.4188, + "step": 31426 + }, + { + "epoch": 2.47, + "learning_rate": 2.2283679247771358e-05, + "loss": 1.4809, + "step": 31427 + }, + { + "epoch": 2.47, + "learning_rate": 2.227719764608111e-05, + "loss": 1.4795, + "step": 31428 + }, + { + "epoch": 2.47, + "learning_rate": 2.2270716911558227e-05, + "loss": 1.4628, + "step": 31429 + }, + { + "epoch": 2.47, + "learning_rate": 2.22642370442467e-05, + "loss": 1.4754, + "step": 31430 + }, + { + "epoch": 2.47, + "learning_rate": 2.225775804419051e-05, + "loss": 1.4025, + "step": 31431 + }, + { + "epoch": 2.47, + "learning_rate": 2.225127991143362e-05, + "loss": 1.4776, + "step": 31432 + }, + { + "epoch": 2.47, + "learning_rate": 2.2244802646020072e-05, + "loss": 1.4261, + "step": 31433 + }, + { + "epoch": 2.47, + "learning_rate": 2.2238326247993803e-05, + "loss": 1.4071, + "step": 31434 + }, + { + "epoch": 2.47, + "learning_rate": 2.2231850717398762e-05, + "loss": 1.4763, + "step": 31435 + }, + { + "epoch": 2.47, + "learning_rate": 2.2225376054279e-05, + "loss": 1.449, + "step": 31436 + }, + { + "epoch": 2.47, + "learning_rate": 2.2218902258678408e-05, + "loss": 1.4067, + "step": 31437 + }, + { + "epoch": 2.47, + "learning_rate": 2.2212429330640917e-05, + "loss": 1.3928, + "step": 31438 + }, + { + "epoch": 2.47, + "learning_rate": 2.220595727021055e-05, + "loss": 1.4563, + "step": 31439 + }, + { + "epoch": 2.47, + "learning_rate": 2.2199486077431166e-05, + "loss": 1.4187, + "step": 31440 + }, + { + "epoch": 2.47, + "learning_rate": 2.21930157523468e-05, + "loss": 1.4265, + "step": 31441 + }, + { + "epoch": 2.47, + "learning_rate": 2.2186546295001278e-05, + "loss": 1.422, + "step": 31442 + }, + { + "epoch": 2.47, + "learning_rate": 2.218007770543862e-05, + "loss": 1.4687, + "step": 31443 + }, + { + "epoch": 2.47, + "learning_rate": 2.2173609983702688e-05, + "loss": 1.4877, + "step": 31444 + }, + { + "epoch": 2.47, + "learning_rate": 2.2167143129837368e-05, + "loss": 1.5046, + "step": 31445 + }, + { + "epoch": 2.47, + "learning_rate": 2.2160677143886635e-05, + "loss": 1.447, + "step": 31446 + }, + { + "epoch": 2.47, + "learning_rate": 2.2154212025894358e-05, + "loss": 1.4809, + "step": 31447 + }, + { + "epoch": 2.47, + "learning_rate": 2.2147747775904433e-05, + "loss": 1.451, + "step": 31448 + }, + { + "epoch": 2.47, + "learning_rate": 2.2141284393960713e-05, + "loss": 1.4609, + "step": 31449 + }, + { + "epoch": 2.47, + "learning_rate": 2.2134821880107156e-05, + "loss": 1.4542, + "step": 31450 + }, + { + "epoch": 2.47, + "learning_rate": 2.2128360234387583e-05, + "loss": 1.4567, + "step": 31451 + }, + { + "epoch": 2.47, + "learning_rate": 2.2121899456845854e-05, + "loss": 1.4444, + "step": 31452 + }, + { + "epoch": 2.47, + "learning_rate": 2.2115439547525887e-05, + "loss": 1.4196, + "step": 31453 + }, + { + "epoch": 2.47, + "learning_rate": 2.2108980506471513e-05, + "loss": 1.4553, + "step": 31454 + }, + { + "epoch": 2.47, + "learning_rate": 2.2102522333726547e-05, + "loss": 1.4706, + "step": 31455 + }, + { + "epoch": 2.47, + "learning_rate": 2.2096065029334887e-05, + "loss": 1.4444, + "step": 31456 + }, + { + "epoch": 2.48, + "learning_rate": 2.208960859334038e-05, + "loss": 1.4729, + "step": 31457 + }, + { + "epoch": 2.48, + "learning_rate": 2.2083153025786858e-05, + "loss": 1.382, + "step": 31458 + }, + { + "epoch": 2.48, + "learning_rate": 2.2076698326718107e-05, + "loss": 1.4258, + "step": 31459 + }, + { + "epoch": 2.48, + "learning_rate": 2.2070244496178004e-05, + "loss": 1.4344, + "step": 31460 + }, + { + "epoch": 2.48, + "learning_rate": 2.2063791534210347e-05, + "loss": 1.4591, + "step": 31461 + }, + { + "epoch": 2.48, + "learning_rate": 2.20573394408589e-05, + "loss": 1.4485, + "step": 31462 + }, + { + "epoch": 2.48, + "learning_rate": 2.205088821616755e-05, + "loss": 1.4714, + "step": 31463 + }, + { + "epoch": 2.48, + "learning_rate": 2.2044437860180074e-05, + "loss": 1.4634, + "step": 31464 + }, + { + "epoch": 2.48, + "learning_rate": 2.203798837294024e-05, + "loss": 1.4433, + "step": 31465 + }, + { + "epoch": 2.48, + "learning_rate": 2.2031539754491827e-05, + "loss": 1.492, + "step": 31466 + }, + { + "epoch": 2.48, + "learning_rate": 2.202509200487867e-05, + "loss": 1.4334, + "step": 31467 + }, + { + "epoch": 2.48, + "learning_rate": 2.2018645124144512e-05, + "loss": 1.4771, + "step": 31468 + }, + { + "epoch": 2.48, + "learning_rate": 2.201219911233309e-05, + "loss": 1.5031, + "step": 31469 + }, + { + "epoch": 2.48, + "learning_rate": 2.200575396948825e-05, + "loss": 1.4141, + "step": 31470 + }, + { + "epoch": 2.48, + "learning_rate": 2.1999309695653705e-05, + "loss": 1.4323, + "step": 31471 + }, + { + "epoch": 2.48, + "learning_rate": 2.1992866290873172e-05, + "loss": 1.4854, + "step": 31472 + }, + { + "epoch": 2.48, + "learning_rate": 2.1986423755190452e-05, + "loss": 1.4592, + "step": 31473 + }, + { + "epoch": 2.48, + "learning_rate": 2.197998208864929e-05, + "loss": 1.4428, + "step": 31474 + }, + { + "epoch": 2.48, + "learning_rate": 2.1973541291293402e-05, + "loss": 1.4875, + "step": 31475 + }, + { + "epoch": 2.48, + "learning_rate": 2.1967101363166485e-05, + "loss": 1.4377, + "step": 31476 + }, + { + "epoch": 2.48, + "learning_rate": 2.196066230431234e-05, + "loss": 1.4479, + "step": 31477 + }, + { + "epoch": 2.48, + "learning_rate": 2.1954224114774628e-05, + "loss": 1.4494, + "step": 31478 + }, + { + "epoch": 2.48, + "learning_rate": 2.1947786794597032e-05, + "loss": 1.4405, + "step": 31479 + }, + { + "epoch": 2.48, + "learning_rate": 2.1941350343823355e-05, + "loss": 1.4517, + "step": 31480 + }, + { + "epoch": 2.48, + "learning_rate": 2.1934914762497223e-05, + "loss": 1.5064, + "step": 31481 + }, + { + "epoch": 2.48, + "learning_rate": 2.1928480050662322e-05, + "loss": 1.4926, + "step": 31482 + }, + { + "epoch": 2.48, + "learning_rate": 2.1922046208362397e-05, + "loss": 1.4388, + "step": 31483 + }, + { + "epoch": 2.48, + "learning_rate": 2.19156132356411e-05, + "loss": 1.4738, + "step": 31484 + }, + { + "epoch": 2.48, + "learning_rate": 2.1909181132542108e-05, + "loss": 1.4349, + "step": 31485 + }, + { + "epoch": 2.48, + "learning_rate": 2.1902749899109058e-05, + "loss": 1.4591, + "step": 31486 + }, + { + "epoch": 2.48, + "learning_rate": 2.1896319535385627e-05, + "loss": 1.4646, + "step": 31487 + }, + { + "epoch": 2.48, + "learning_rate": 2.188989004141555e-05, + "loss": 1.4353, + "step": 31488 + }, + { + "epoch": 2.48, + "learning_rate": 2.1883461417242404e-05, + "loss": 1.4358, + "step": 31489 + }, + { + "epoch": 2.48, + "learning_rate": 2.1877033662909842e-05, + "loss": 1.4465, + "step": 31490 + }, + { + "epoch": 2.48, + "learning_rate": 2.187060677846153e-05, + "loss": 1.4633, + "step": 31491 + }, + { + "epoch": 2.48, + "learning_rate": 2.1864180763941114e-05, + "loss": 1.464, + "step": 31492 + }, + { + "epoch": 2.48, + "learning_rate": 2.185775561939214e-05, + "loss": 1.422, + "step": 31493 + }, + { + "epoch": 2.48, + "learning_rate": 2.185133134485833e-05, + "loss": 1.4525, + "step": 31494 + }, + { + "epoch": 2.48, + "learning_rate": 2.1844907940383277e-05, + "loss": 1.4552, + "step": 31495 + }, + { + "epoch": 2.48, + "learning_rate": 2.1838485406010532e-05, + "loss": 1.4253, + "step": 31496 + }, + { + "epoch": 2.48, + "learning_rate": 2.183206374178379e-05, + "loss": 1.4675, + "step": 31497 + }, + { + "epoch": 2.48, + "learning_rate": 2.1825642947746586e-05, + "loss": 1.4488, + "step": 31498 + }, + { + "epoch": 2.48, + "learning_rate": 2.1819223023942517e-05, + "loss": 1.4704, + "step": 31499 + }, + { + "epoch": 2.48, + "learning_rate": 2.1812803970415216e-05, + "loss": 1.4086, + "step": 31500 + }, + { + "epoch": 2.48, + "learning_rate": 2.1806385787208248e-05, + "loss": 1.4065, + "step": 31501 + }, + { + "epoch": 2.48, + "learning_rate": 2.179996847436516e-05, + "loss": 1.4512, + "step": 31502 + }, + { + "epoch": 2.48, + "learning_rate": 2.179355203192947e-05, + "loss": 1.4348, + "step": 31503 + }, + { + "epoch": 2.48, + "learning_rate": 2.1787136459944886e-05, + "loss": 1.4405, + "step": 31504 + }, + { + "epoch": 2.48, + "learning_rate": 2.17807217584549e-05, + "loss": 1.5202, + "step": 31505 + }, + { + "epoch": 2.48, + "learning_rate": 2.1774307927503054e-05, + "loss": 1.4465, + "step": 31506 + }, + { + "epoch": 2.48, + "learning_rate": 2.176789496713285e-05, + "loss": 1.4485, + "step": 31507 + }, + { + "epoch": 2.48, + "learning_rate": 2.1761482877387914e-05, + "loss": 1.4557, + "step": 31508 + }, + { + "epoch": 2.48, + "learning_rate": 2.1755071658311752e-05, + "loss": 1.4538, + "step": 31509 + }, + { + "epoch": 2.48, + "learning_rate": 2.1748661309947842e-05, + "loss": 1.3933, + "step": 31510 + }, + { + "epoch": 2.48, + "learning_rate": 2.174225183233978e-05, + "loss": 1.4251, + "step": 31511 + }, + { + "epoch": 2.48, + "learning_rate": 2.173584322553105e-05, + "loss": 1.4628, + "step": 31512 + }, + { + "epoch": 2.48, + "learning_rate": 2.1729435489565123e-05, + "loss": 1.4222, + "step": 31513 + }, + { + "epoch": 2.48, + "learning_rate": 2.1723028624485573e-05, + "loss": 1.4324, + "step": 31514 + }, + { + "epoch": 2.48, + "learning_rate": 2.1716622630335883e-05, + "loss": 1.4284, + "step": 31515 + }, + { + "epoch": 2.48, + "learning_rate": 2.1710217507159487e-05, + "loss": 1.4641, + "step": 31516 + }, + { + "epoch": 2.48, + "learning_rate": 2.170381325499997e-05, + "loss": 1.4711, + "step": 31517 + }, + { + "epoch": 2.48, + "learning_rate": 2.169740987390074e-05, + "loss": 1.4366, + "step": 31518 + }, + { + "epoch": 2.48, + "learning_rate": 2.1691007363905282e-05, + "loss": 1.4688, + "step": 31519 + }, + { + "epoch": 2.48, + "learning_rate": 2.1684605725057065e-05, + "loss": 1.4703, + "step": 31520 + }, + { + "epoch": 2.48, + "learning_rate": 2.1678204957399598e-05, + "loss": 1.4835, + "step": 31521 + }, + { + "epoch": 2.48, + "learning_rate": 2.16718050609763e-05, + "loss": 1.4336, + "step": 31522 + }, + { + "epoch": 2.48, + "learning_rate": 2.1665406035830636e-05, + "loss": 1.4134, + "step": 31523 + }, + { + "epoch": 2.48, + "learning_rate": 2.1659007882006002e-05, + "loss": 1.435, + "step": 31524 + }, + { + "epoch": 2.48, + "learning_rate": 2.1652610599545933e-05, + "loss": 1.4817, + "step": 31525 + }, + { + "epoch": 2.48, + "learning_rate": 2.1646214188493794e-05, + "loss": 1.4231, + "step": 31526 + }, + { + "epoch": 2.48, + "learning_rate": 2.1639818648893e-05, + "loss": 1.4525, + "step": 31527 + }, + { + "epoch": 2.48, + "learning_rate": 2.163342398078703e-05, + "loss": 1.3962, + "step": 31528 + }, + { + "epoch": 2.48, + "learning_rate": 2.1627030184219285e-05, + "loss": 1.4787, + "step": 31529 + }, + { + "epoch": 2.48, + "learning_rate": 2.1620637259233114e-05, + "loss": 1.3759, + "step": 31530 + }, + { + "epoch": 2.48, + "learning_rate": 2.1614245205872015e-05, + "loss": 1.4302, + "step": 31531 + }, + { + "epoch": 2.48, + "learning_rate": 2.160785402417934e-05, + "loss": 1.4427, + "step": 31532 + }, + { + "epoch": 2.48, + "learning_rate": 2.1601463714198447e-05, + "loss": 1.4243, + "step": 31533 + }, + { + "epoch": 2.48, + "learning_rate": 2.159507427597279e-05, + "loss": 1.4358, + "step": 31534 + }, + { + "epoch": 2.48, + "learning_rate": 2.15886857095457e-05, + "loss": 1.4531, + "step": 31535 + }, + { + "epoch": 2.48, + "learning_rate": 2.158229801496059e-05, + "loss": 1.4696, + "step": 31536 + }, + { + "epoch": 2.48, + "learning_rate": 2.157591119226078e-05, + "loss": 1.4197, + "step": 31537 + }, + { + "epoch": 2.48, + "learning_rate": 2.15695252414897e-05, + "loss": 1.4627, + "step": 31538 + }, + { + "epoch": 2.48, + "learning_rate": 2.156314016269066e-05, + "loss": 1.4382, + "step": 31539 + }, + { + "epoch": 2.48, + "learning_rate": 2.1556755955907e-05, + "loss": 1.41, + "step": 31540 + }, + { + "epoch": 2.48, + "learning_rate": 2.1550372621182115e-05, + "loss": 1.441, + "step": 31541 + }, + { + "epoch": 2.48, + "learning_rate": 2.154399015855932e-05, + "loss": 1.4881, + "step": 31542 + }, + { + "epoch": 2.48, + "learning_rate": 2.1537608568081932e-05, + "loss": 1.4699, + "step": 31543 + }, + { + "epoch": 2.48, + "learning_rate": 2.1531227849793264e-05, + "loss": 1.4397, + "step": 31544 + }, + { + "epoch": 2.48, + "learning_rate": 2.15248480037367e-05, + "loss": 1.4717, + "step": 31545 + }, + { + "epoch": 2.48, + "learning_rate": 2.151846902995552e-05, + "loss": 1.4866, + "step": 31546 + }, + { + "epoch": 2.48, + "learning_rate": 2.1512090928492993e-05, + "loss": 1.4554, + "step": 31547 + }, + { + "epoch": 2.48, + "learning_rate": 2.1505713699392498e-05, + "loss": 1.456, + "step": 31548 + }, + { + "epoch": 2.48, + "learning_rate": 2.1499337342697296e-05, + "loss": 1.3978, + "step": 31549 + }, + { + "epoch": 2.48, + "learning_rate": 2.1492961858450662e-05, + "loss": 1.4323, + "step": 31550 + }, + { + "epoch": 2.48, + "learning_rate": 2.1486587246695893e-05, + "loss": 1.4407, + "step": 31551 + }, + { + "epoch": 2.48, + "learning_rate": 2.1480213507476297e-05, + "loss": 1.4882, + "step": 31552 + }, + { + "epoch": 2.48, + "learning_rate": 2.1473840640835143e-05, + "loss": 1.4904, + "step": 31553 + }, + { + "epoch": 2.48, + "learning_rate": 2.146746864681565e-05, + "loss": 1.4944, + "step": 31554 + }, + { + "epoch": 2.48, + "learning_rate": 2.1461097525461146e-05, + "loss": 1.4592, + "step": 31555 + }, + { + "epoch": 2.48, + "learning_rate": 2.1454727276814847e-05, + "loss": 1.4496, + "step": 31556 + }, + { + "epoch": 2.48, + "learning_rate": 2.144835790091999e-05, + "loss": 1.4331, + "step": 31557 + }, + { + "epoch": 2.48, + "learning_rate": 2.144198939781988e-05, + "loss": 1.463, + "step": 31558 + }, + { + "epoch": 2.48, + "learning_rate": 2.143562176755771e-05, + "loss": 1.385, + "step": 31559 + }, + { + "epoch": 2.48, + "learning_rate": 2.142925501017672e-05, + "loss": 1.4214, + "step": 31560 + }, + { + "epoch": 2.48, + "learning_rate": 2.14228891257201e-05, + "loss": 1.424, + "step": 31561 + }, + { + "epoch": 2.48, + "learning_rate": 2.1416524114231144e-05, + "loss": 1.4198, + "step": 31562 + }, + { + "epoch": 2.48, + "learning_rate": 2.1410159975753032e-05, + "loss": 1.4325, + "step": 31563 + }, + { + "epoch": 2.48, + "learning_rate": 2.140379671032895e-05, + "loss": 1.4443, + "step": 31564 + }, + { + "epoch": 2.48, + "learning_rate": 2.1397434318002148e-05, + "loss": 1.5086, + "step": 31565 + }, + { + "epoch": 2.48, + "learning_rate": 2.1391072798815755e-05, + "loss": 1.4325, + "step": 31566 + }, + { + "epoch": 2.48, + "learning_rate": 2.1384712152813056e-05, + "loss": 1.4542, + "step": 31567 + }, + { + "epoch": 2.48, + "learning_rate": 2.1378352380037145e-05, + "loss": 1.473, + "step": 31568 + }, + { + "epoch": 2.48, + "learning_rate": 2.1371993480531273e-05, + "loss": 1.4411, + "step": 31569 + }, + { + "epoch": 2.48, + "learning_rate": 2.1365635454338576e-05, + "loss": 1.4254, + "step": 31570 + }, + { + "epoch": 2.48, + "learning_rate": 2.1359278301502215e-05, + "loss": 1.4197, + "step": 31571 + }, + { + "epoch": 2.48, + "learning_rate": 2.135292202206537e-05, + "loss": 1.4121, + "step": 31572 + }, + { + "epoch": 2.48, + "learning_rate": 2.1346566616071213e-05, + "loss": 1.4405, + "step": 31573 + }, + { + "epoch": 2.48, + "learning_rate": 2.134021208356284e-05, + "loss": 1.4223, + "step": 31574 + }, + { + "epoch": 2.48, + "learning_rate": 2.133385842458345e-05, + "loss": 1.4378, + "step": 31575 + }, + { + "epoch": 2.48, + "learning_rate": 2.1327505639176157e-05, + "loss": 1.4125, + "step": 31576 + }, + { + "epoch": 2.48, + "learning_rate": 2.1321153727384095e-05, + "loss": 1.5069, + "step": 31577 + }, + { + "epoch": 2.48, + "learning_rate": 2.131480268925036e-05, + "loss": 1.4593, + "step": 31578 + }, + { + "epoch": 2.48, + "learning_rate": 2.130845252481812e-05, + "loss": 1.4694, + "step": 31579 + }, + { + "epoch": 2.48, + "learning_rate": 2.130210323413049e-05, + "loss": 1.4719, + "step": 31580 + }, + { + "epoch": 2.48, + "learning_rate": 2.1295754817230504e-05, + "loss": 1.3869, + "step": 31581 + }, + { + "epoch": 2.48, + "learning_rate": 2.1289407274161325e-05, + "loss": 1.4418, + "step": 31582 + }, + { + "epoch": 2.48, + "learning_rate": 2.1283060604966086e-05, + "loss": 1.4911, + "step": 31583 + }, + { + "epoch": 2.49, + "learning_rate": 2.1276714809687818e-05, + "loss": 1.4466, + "step": 31584 + }, + { + "epoch": 2.49, + "learning_rate": 2.1270369888369603e-05, + "loss": 1.4468, + "step": 31585 + }, + { + "epoch": 2.49, + "learning_rate": 2.1264025841054562e-05, + "loss": 1.4379, + "step": 31586 + }, + { + "epoch": 2.49, + "learning_rate": 2.1257682667785735e-05, + "loss": 1.463, + "step": 31587 + }, + { + "epoch": 2.49, + "learning_rate": 2.1251340368606177e-05, + "loss": 1.4291, + "step": 31588 + }, + { + "epoch": 2.49, + "learning_rate": 2.1244998943559004e-05, + "loss": 1.4955, + "step": 31589 + }, + { + "epoch": 2.49, + "learning_rate": 2.123865839268723e-05, + "loss": 1.4593, + "step": 31590 + }, + { + "epoch": 2.49, + "learning_rate": 2.123231871603387e-05, + "loss": 1.4167, + "step": 31591 + }, + { + "epoch": 2.49, + "learning_rate": 2.1225979913642038e-05, + "loss": 1.4269, + "step": 31592 + }, + { + "epoch": 2.49, + "learning_rate": 2.1219641985554752e-05, + "loss": 1.4196, + "step": 31593 + }, + { + "epoch": 2.49, + "learning_rate": 2.1213304931814996e-05, + "loss": 1.4086, + "step": 31594 + }, + { + "epoch": 2.49, + "learning_rate": 2.1206968752465847e-05, + "loss": 1.4118, + "step": 31595 + }, + { + "epoch": 2.49, + "learning_rate": 2.1200633447550324e-05, + "loss": 1.4955, + "step": 31596 + }, + { + "epoch": 2.49, + "learning_rate": 2.119429901711141e-05, + "loss": 1.5025, + "step": 31597 + }, + { + "epoch": 2.49, + "learning_rate": 2.1187965461192054e-05, + "loss": 1.4213, + "step": 31598 + }, + { + "epoch": 2.49, + "learning_rate": 2.11816327798354e-05, + "loss": 1.4362, + "step": 31599 + }, + { + "epoch": 2.49, + "learning_rate": 2.1175300973084386e-05, + "loss": 1.4372, + "step": 31600 + }, + { + "epoch": 2.49, + "learning_rate": 2.1168970040981976e-05, + "loss": 1.4377, + "step": 31601 + }, + { + "epoch": 2.49, + "learning_rate": 2.1162639983571134e-05, + "loss": 1.4263, + "step": 31602 + }, + { + "epoch": 2.49, + "learning_rate": 2.1156310800894893e-05, + "loss": 1.4176, + "step": 31603 + }, + { + "epoch": 2.49, + "learning_rate": 2.1149982492996204e-05, + "loss": 1.3977, + "step": 31604 + }, + { + "epoch": 2.49, + "learning_rate": 2.1143655059917995e-05, + "loss": 1.4012, + "step": 31605 + }, + { + "epoch": 2.49, + "learning_rate": 2.1137328501703288e-05, + "loss": 1.4293, + "step": 31606 + }, + { + "epoch": 2.49, + "learning_rate": 2.1131002818395028e-05, + "loss": 1.466, + "step": 31607 + }, + { + "epoch": 2.49, + "learning_rate": 2.1124678010036095e-05, + "loss": 1.4627, + "step": 31608 + }, + { + "epoch": 2.49, + "learning_rate": 2.1118354076669508e-05, + "loss": 1.4242, + "step": 31609 + }, + { + "epoch": 2.49, + "learning_rate": 2.1112031018338184e-05, + "loss": 1.4692, + "step": 31610 + }, + { + "epoch": 2.49, + "learning_rate": 2.1105708835085e-05, + "loss": 1.5245, + "step": 31611 + }, + { + "epoch": 2.49, + "learning_rate": 2.109938752695296e-05, + "loss": 1.4377, + "step": 31612 + }, + { + "epoch": 2.49, + "learning_rate": 2.1093067093984912e-05, + "loss": 1.5022, + "step": 31613 + }, + { + "epoch": 2.49, + "learning_rate": 2.1086747536223837e-05, + "loss": 1.4226, + "step": 31614 + }, + { + "epoch": 2.49, + "learning_rate": 2.1080428853712584e-05, + "loss": 1.4771, + "step": 31615 + }, + { + "epoch": 2.49, + "learning_rate": 2.1074111046494084e-05, + "loss": 1.4189, + "step": 31616 + }, + { + "epoch": 2.49, + "learning_rate": 2.106779411461124e-05, + "loss": 1.428, + "step": 31617 + }, + { + "epoch": 2.49, + "learning_rate": 2.106147805810692e-05, + "loss": 1.455, + "step": 31618 + }, + { + "epoch": 2.49, + "learning_rate": 2.105516287702398e-05, + "loss": 1.3835, + "step": 31619 + }, + { + "epoch": 2.49, + "learning_rate": 2.104884857140536e-05, + "loss": 1.4902, + "step": 31620 + }, + { + "epoch": 2.49, + "learning_rate": 2.1042535141293887e-05, + "loss": 1.3797, + "step": 31621 + }, + { + "epoch": 2.49, + "learning_rate": 2.1036222586732398e-05, + "loss": 1.4447, + "step": 31622 + }, + { + "epoch": 2.49, + "learning_rate": 2.102991090776384e-05, + "loss": 1.4696, + "step": 31623 + }, + { + "epoch": 2.49, + "learning_rate": 2.1023600104431014e-05, + "loss": 1.4889, + "step": 31624 + }, + { + "epoch": 2.49, + "learning_rate": 2.101729017677672e-05, + "loss": 1.4829, + "step": 31625 + }, + { + "epoch": 2.49, + "learning_rate": 2.1010981124843902e-05, + "loss": 1.4335, + "step": 31626 + }, + { + "epoch": 2.49, + "learning_rate": 2.1004672948675328e-05, + "loss": 1.4058, + "step": 31627 + }, + { + "epoch": 2.49, + "learning_rate": 2.0998365648313796e-05, + "loss": 1.4389, + "step": 31628 + }, + { + "epoch": 2.49, + "learning_rate": 2.0992059223802178e-05, + "loss": 1.3863, + "step": 31629 + }, + { + "epoch": 2.49, + "learning_rate": 2.098575367518333e-05, + "loss": 1.4453, + "step": 31630 + }, + { + "epoch": 2.49, + "learning_rate": 2.097944900250001e-05, + "loss": 1.4523, + "step": 31631 + }, + { + "epoch": 2.49, + "learning_rate": 2.0973145205794993e-05, + "loss": 1.432, + "step": 31632 + }, + { + "epoch": 2.49, + "learning_rate": 2.0966842285111167e-05, + "loss": 1.4599, + "step": 31633 + }, + { + "epoch": 2.49, + "learning_rate": 2.0960540240491264e-05, + "loss": 1.4636, + "step": 31634 + }, + { + "epoch": 2.49, + "learning_rate": 2.0954239071978078e-05, + "loss": 1.3874, + "step": 31635 + }, + { + "epoch": 2.49, + "learning_rate": 2.094793877961438e-05, + "loss": 1.4772, + "step": 31636 + }, + { + "epoch": 2.49, + "learning_rate": 2.0941639363442986e-05, + "loss": 1.4481, + "step": 31637 + }, + { + "epoch": 2.49, + "learning_rate": 2.0935340823506623e-05, + "loss": 1.4315, + "step": 31638 + }, + { + "epoch": 2.49, + "learning_rate": 2.0929043159848063e-05, + "loss": 1.437, + "step": 31639 + }, + { + "epoch": 2.49, + "learning_rate": 2.0922746372510085e-05, + "loss": 1.4542, + "step": 31640 + }, + { + "epoch": 2.49, + "learning_rate": 2.0916450461535455e-05, + "loss": 1.4978, + "step": 31641 + }, + { + "epoch": 2.49, + "learning_rate": 2.091015542696684e-05, + "loss": 1.4368, + "step": 31642 + }, + { + "epoch": 2.49, + "learning_rate": 2.0903861268847073e-05, + "loss": 1.5311, + "step": 31643 + }, + { + "epoch": 2.49, + "learning_rate": 2.0897567987218832e-05, + "loss": 1.4616, + "step": 31644 + }, + { + "epoch": 2.49, + "learning_rate": 2.089127558212484e-05, + "loss": 1.433, + "step": 31645 + }, + { + "epoch": 2.49, + "learning_rate": 2.0884984053607838e-05, + "loss": 1.4361, + "step": 31646 + }, + { + "epoch": 2.49, + "learning_rate": 2.0878693401710567e-05, + "loss": 1.4567, + "step": 31647 + }, + { + "epoch": 2.49, + "learning_rate": 2.087240362647572e-05, + "loss": 1.4101, + "step": 31648 + }, + { + "epoch": 2.49, + "learning_rate": 2.0866114727945964e-05, + "loss": 1.4614, + "step": 31649 + }, + { + "epoch": 2.49, + "learning_rate": 2.085982670616405e-05, + "loss": 1.413, + "step": 31650 + }, + { + "epoch": 2.49, + "learning_rate": 2.085353956117266e-05, + "loss": 1.4072, + "step": 31651 + }, + { + "epoch": 2.49, + "learning_rate": 2.0847253293014427e-05, + "loss": 1.4825, + "step": 31652 + }, + { + "epoch": 2.49, + "learning_rate": 2.0840967901732115e-05, + "loss": 1.4027, + "step": 31653 + }, + { + "epoch": 2.49, + "learning_rate": 2.083468338736834e-05, + "loss": 1.4256, + "step": 31654 + }, + { + "epoch": 2.49, + "learning_rate": 2.0828399749965786e-05, + "loss": 1.4545, + "step": 31655 + }, + { + "epoch": 2.49, + "learning_rate": 2.0822116989567083e-05, + "loss": 1.4525, + "step": 31656 + }, + { + "epoch": 2.49, + "learning_rate": 2.0815835106214968e-05, + "loss": 1.4799, + "step": 31657 + }, + { + "epoch": 2.49, + "learning_rate": 2.0809554099952018e-05, + "loss": 1.4399, + "step": 31658 + }, + { + "epoch": 2.49, + "learning_rate": 2.0803273970820887e-05, + "loss": 1.4286, + "step": 31659 + }, + { + "epoch": 2.49, + "learning_rate": 2.0796994718864222e-05, + "loss": 1.4937, + "step": 31660 + }, + { + "epoch": 2.49, + "learning_rate": 2.0790716344124707e-05, + "loss": 1.4285, + "step": 31661 + }, + { + "epoch": 2.49, + "learning_rate": 2.0784438846644923e-05, + "loss": 1.456, + "step": 31662 + }, + { + "epoch": 2.49, + "learning_rate": 2.0778162226467438e-05, + "loss": 1.4366, + "step": 31663 + }, + { + "epoch": 2.49, + "learning_rate": 2.077188648363498e-05, + "loss": 1.4521, + "step": 31664 + }, + { + "epoch": 2.49, + "learning_rate": 2.0765611618190086e-05, + "loss": 1.4738, + "step": 31665 + }, + { + "epoch": 2.49, + "learning_rate": 2.075933763017534e-05, + "loss": 1.4147, + "step": 31666 + }, + { + "epoch": 2.49, + "learning_rate": 2.07530645196334e-05, + "loss": 1.4358, + "step": 31667 + }, + { + "epoch": 2.49, + "learning_rate": 2.074679228660684e-05, + "loss": 1.4209, + "step": 31668 + }, + { + "epoch": 2.49, + "learning_rate": 2.074052093113819e-05, + "loss": 1.5103, + "step": 31669 + }, + { + "epoch": 2.49, + "learning_rate": 2.0734250453270097e-05, + "loss": 1.4456, + "step": 31670 + }, + { + "epoch": 2.49, + "learning_rate": 2.0727980853045113e-05, + "loss": 1.4502, + "step": 31671 + }, + { + "epoch": 2.49, + "learning_rate": 2.0721712130505803e-05, + "loss": 1.4436, + "step": 31672 + }, + { + "epoch": 2.49, + "learning_rate": 2.0715444285694698e-05, + "loss": 1.4914, + "step": 31673 + }, + { + "epoch": 2.49, + "learning_rate": 2.070917731865442e-05, + "loss": 1.4083, + "step": 31674 + }, + { + "epoch": 2.49, + "learning_rate": 2.070291122942746e-05, + "loss": 1.4438, + "step": 31675 + }, + { + "epoch": 2.49, + "learning_rate": 2.0696646018056357e-05, + "loss": 1.3995, + "step": 31676 + }, + { + "epoch": 2.49, + "learning_rate": 2.0690381684583672e-05, + "loss": 1.4221, + "step": 31677 + }, + { + "epoch": 2.49, + "learning_rate": 2.0684118229051976e-05, + "loss": 1.4761, + "step": 31678 + }, + { + "epoch": 2.49, + "learning_rate": 2.067785565150375e-05, + "loss": 1.4891, + "step": 31679 + }, + { + "epoch": 2.49, + "learning_rate": 2.067159395198149e-05, + "loss": 1.4918, + "step": 31680 + }, + { + "epoch": 2.49, + "learning_rate": 2.0665333130527767e-05, + "loss": 1.4681, + "step": 31681 + }, + { + "epoch": 2.49, + "learning_rate": 2.0659073187185045e-05, + "loss": 1.4427, + "step": 31682 + }, + { + "epoch": 2.49, + "learning_rate": 2.065281412199582e-05, + "loss": 1.4238, + "step": 31683 + }, + { + "epoch": 2.49, + "learning_rate": 2.0646555935002645e-05, + "loss": 1.4811, + "step": 31684 + }, + { + "epoch": 2.49, + "learning_rate": 2.064029862624797e-05, + "loss": 1.4076, + "step": 31685 + }, + { + "epoch": 2.49, + "learning_rate": 2.063404219577424e-05, + "loss": 1.4673, + "step": 31686 + }, + { + "epoch": 2.49, + "learning_rate": 2.062778664362401e-05, + "loss": 1.4535, + "step": 31687 + }, + { + "epoch": 2.49, + "learning_rate": 2.0621531969839728e-05, + "loss": 1.4649, + "step": 31688 + }, + { + "epoch": 2.49, + "learning_rate": 2.0615278174463822e-05, + "loss": 1.4376, + "step": 31689 + }, + { + "epoch": 2.49, + "learning_rate": 2.0609025257538765e-05, + "loss": 1.4363, + "step": 31690 + }, + { + "epoch": 2.49, + "learning_rate": 2.060277321910705e-05, + "loss": 1.48, + "step": 31691 + }, + { + "epoch": 2.49, + "learning_rate": 2.059652205921106e-05, + "loss": 1.4845, + "step": 31692 + }, + { + "epoch": 2.49, + "learning_rate": 2.059027177789327e-05, + "loss": 1.5536, + "step": 31693 + }, + { + "epoch": 2.49, + "learning_rate": 2.058402237519617e-05, + "loss": 1.4346, + "step": 31694 + }, + { + "epoch": 2.49, + "learning_rate": 2.057777385116213e-05, + "loss": 1.4454, + "step": 31695 + }, + { + "epoch": 2.49, + "learning_rate": 2.0571526205833576e-05, + "loss": 1.3869, + "step": 31696 + }, + { + "epoch": 2.49, + "learning_rate": 2.056527943925292e-05, + "loss": 1.4444, + "step": 31697 + }, + { + "epoch": 2.49, + "learning_rate": 2.05590335514626e-05, + "loss": 1.4702, + "step": 31698 + }, + { + "epoch": 2.49, + "learning_rate": 2.0552788542505038e-05, + "loss": 1.4548, + "step": 31699 + }, + { + "epoch": 2.49, + "learning_rate": 2.054654441242255e-05, + "loss": 1.4448, + "step": 31700 + }, + { + "epoch": 2.49, + "learning_rate": 2.0540301161257634e-05, + "loss": 1.5172, + "step": 31701 + }, + { + "epoch": 2.49, + "learning_rate": 2.053405878905262e-05, + "loss": 1.4576, + "step": 31702 + }, + { + "epoch": 2.49, + "learning_rate": 2.052781729584988e-05, + "loss": 1.4572, + "step": 31703 + }, + { + "epoch": 2.49, + "learning_rate": 2.0521576681691843e-05, + "loss": 1.4713, + "step": 31704 + }, + { + "epoch": 2.49, + "learning_rate": 2.0515336946620842e-05, + "loss": 1.4418, + "step": 31705 + }, + { + "epoch": 2.49, + "learning_rate": 2.050909809067921e-05, + "loss": 1.4128, + "step": 31706 + }, + { + "epoch": 2.49, + "learning_rate": 2.0502860113909398e-05, + "loss": 1.4651, + "step": 31707 + }, + { + "epoch": 2.49, + "learning_rate": 2.0496623016353654e-05, + "loss": 1.412, + "step": 31708 + }, + { + "epoch": 2.49, + "learning_rate": 2.049038679805441e-05, + "loss": 1.4308, + "step": 31709 + }, + { + "epoch": 2.49, + "learning_rate": 2.0484151459053933e-05, + "loss": 1.4323, + "step": 31710 + }, + { + "epoch": 2.5, + "learning_rate": 2.047791699939462e-05, + "loss": 1.4594, + "step": 31711 + }, + { + "epoch": 2.5, + "learning_rate": 2.0471683419118796e-05, + "loss": 1.4133, + "step": 31712 + }, + { + "epoch": 2.5, + "learning_rate": 2.046545071826875e-05, + "loss": 1.4688, + "step": 31713 + }, + { + "epoch": 2.5, + "learning_rate": 2.045921889688677e-05, + "loss": 1.4195, + "step": 31714 + }, + { + "epoch": 2.5, + "learning_rate": 2.0452987955015255e-05, + "loss": 1.4448, + "step": 31715 + }, + { + "epoch": 2.5, + "learning_rate": 2.0446757892696454e-05, + "loss": 1.4839, + "step": 31716 + }, + { + "epoch": 2.5, + "learning_rate": 2.0440528709972647e-05, + "loss": 1.4222, + "step": 31717 + }, + { + "epoch": 2.5, + "learning_rate": 2.043430040688619e-05, + "loss": 1.4471, + "step": 31718 + }, + { + "epoch": 2.5, + "learning_rate": 2.042807298347931e-05, + "loss": 1.3916, + "step": 31719 + }, + { + "epoch": 2.5, + "learning_rate": 2.0421846439794293e-05, + "loss": 1.4299, + "step": 31720 + }, + { + "epoch": 2.5, + "learning_rate": 2.0415620775873472e-05, + "loss": 1.4305, + "step": 31721 + }, + { + "epoch": 2.5, + "learning_rate": 2.0409395991759058e-05, + "loss": 1.4238, + "step": 31722 + }, + { + "epoch": 2.5, + "learning_rate": 2.0403172087493308e-05, + "loss": 1.4599, + "step": 31723 + }, + { + "epoch": 2.5, + "learning_rate": 2.0396949063118502e-05, + "loss": 1.4482, + "step": 31724 + }, + { + "epoch": 2.5, + "learning_rate": 2.0390726918676938e-05, + "loss": 1.4571, + "step": 31725 + }, + { + "epoch": 2.5, + "learning_rate": 2.0384505654210797e-05, + "loss": 1.4363, + "step": 31726 + }, + { + "epoch": 2.5, + "learning_rate": 2.03782852697623e-05, + "loss": 1.4823, + "step": 31727 + }, + { + "epoch": 2.5, + "learning_rate": 2.0372065765373745e-05, + "loss": 1.4246, + "step": 31728 + }, + { + "epoch": 2.5, + "learning_rate": 2.036584714108735e-05, + "loss": 1.4225, + "step": 31729 + }, + { + "epoch": 2.5, + "learning_rate": 2.0359629396945294e-05, + "loss": 1.4583, + "step": 31730 + }, + { + "epoch": 2.5, + "learning_rate": 2.0353412532989794e-05, + "loss": 1.4297, + "step": 31731 + }, + { + "epoch": 2.5, + "learning_rate": 2.0347196549263102e-05, + "loss": 1.4291, + "step": 31732 + }, + { + "epoch": 2.5, + "learning_rate": 2.0340981445807398e-05, + "loss": 1.4382, + "step": 31733 + }, + { + "epoch": 2.5, + "learning_rate": 2.033476722266485e-05, + "loss": 1.3808, + "step": 31734 + }, + { + "epoch": 2.5, + "learning_rate": 2.0328553879877692e-05, + "loss": 1.4116, + "step": 31735 + }, + { + "epoch": 2.5, + "learning_rate": 2.032234141748812e-05, + "loss": 1.5003, + "step": 31736 + }, + { + "epoch": 2.5, + "learning_rate": 2.0316129835538235e-05, + "loss": 1.4597, + "step": 31737 + }, + { + "epoch": 2.5, + "learning_rate": 2.0309919134070308e-05, + "loss": 1.4052, + "step": 31738 + }, + { + "epoch": 2.5, + "learning_rate": 2.0303709313126432e-05, + "loss": 1.4671, + "step": 31739 + }, + { + "epoch": 2.5, + "learning_rate": 2.029750037274881e-05, + "loss": 1.3732, + "step": 31740 + }, + { + "epoch": 2.5, + "learning_rate": 2.0291292312979573e-05, + "loss": 1.4383, + "step": 31741 + }, + { + "epoch": 2.5, + "learning_rate": 2.0285085133860905e-05, + "loss": 1.4121, + "step": 31742 + }, + { + "epoch": 2.5, + "learning_rate": 2.0278878835434925e-05, + "loss": 1.4597, + "step": 31743 + }, + { + "epoch": 2.5, + "learning_rate": 2.0272673417743747e-05, + "loss": 1.4651, + "step": 31744 + }, + { + "epoch": 2.5, + "learning_rate": 2.026646888082955e-05, + "loss": 1.4776, + "step": 31745 + }, + { + "epoch": 2.5, + "learning_rate": 2.026026522473444e-05, + "loss": 1.4575, + "step": 31746 + }, + { + "epoch": 2.5, + "learning_rate": 2.0254062449500513e-05, + "loss": 1.4172, + "step": 31747 + }, + { + "epoch": 2.5, + "learning_rate": 2.024786055516992e-05, + "loss": 1.427, + "step": 31748 + }, + { + "epoch": 2.5, + "learning_rate": 2.024165954178476e-05, + "loss": 1.4698, + "step": 31749 + }, + { + "epoch": 2.5, + "learning_rate": 2.0235459409387118e-05, + "loss": 1.4417, + "step": 31750 + }, + { + "epoch": 2.5, + "learning_rate": 2.0229260158019055e-05, + "loss": 1.4566, + "step": 31751 + }, + { + "epoch": 2.5, + "learning_rate": 2.0223061787722744e-05, + "loss": 1.4617, + "step": 31752 + }, + { + "epoch": 2.5, + "learning_rate": 2.021686429854023e-05, + "loss": 1.4425, + "step": 31753 + }, + { + "epoch": 2.5, + "learning_rate": 2.021066769051355e-05, + "loss": 1.4418, + "step": 31754 + }, + { + "epoch": 2.5, + "learning_rate": 2.0204471963684814e-05, + "loss": 1.4192, + "step": 31755 + }, + { + "epoch": 2.5, + "learning_rate": 2.019827711809613e-05, + "loss": 1.4158, + "step": 31756 + }, + { + "epoch": 2.5, + "learning_rate": 2.0192083153789507e-05, + "loss": 1.4639, + "step": 31757 + }, + { + "epoch": 2.5, + "learning_rate": 2.0185890070806966e-05, + "loss": 1.4237, + "step": 31758 + }, + { + "epoch": 2.5, + "learning_rate": 2.017969786919062e-05, + "loss": 1.4499, + "step": 31759 + }, + { + "epoch": 2.5, + "learning_rate": 2.0173506548982503e-05, + "loss": 1.4328, + "step": 31760 + }, + { + "epoch": 2.5, + "learning_rate": 2.0167316110224583e-05, + "loss": 1.5092, + "step": 31761 + }, + { + "epoch": 2.5, + "learning_rate": 2.0161126552958995e-05, + "loss": 1.4577, + "step": 31762 + }, + { + "epoch": 2.5, + "learning_rate": 2.0154937877227683e-05, + "loss": 1.4297, + "step": 31763 + }, + { + "epoch": 2.5, + "learning_rate": 2.0148750083072667e-05, + "loss": 1.496, + "step": 31764 + }, + { + "epoch": 2.5, + "learning_rate": 2.0142563170536014e-05, + "loss": 1.436, + "step": 31765 + }, + { + "epoch": 2.5, + "learning_rate": 2.0136377139659686e-05, + "loss": 1.423, + "step": 31766 + }, + { + "epoch": 2.5, + "learning_rate": 2.0130191990485706e-05, + "loss": 1.4716, + "step": 31767 + }, + { + "epoch": 2.5, + "learning_rate": 2.0124007723056003e-05, + "loss": 1.4736, + "step": 31768 + }, + { + "epoch": 2.5, + "learning_rate": 2.0117824337412676e-05, + "loss": 1.4378, + "step": 31769 + }, + { + "epoch": 2.5, + "learning_rate": 2.0111641833597593e-05, + "loss": 1.4643, + "step": 31770 + }, + { + "epoch": 2.5, + "learning_rate": 2.0105460211652818e-05, + "loss": 1.4541, + "step": 31771 + }, + { + "epoch": 2.5, + "learning_rate": 2.0099279471620256e-05, + "loss": 1.4456, + "step": 31772 + }, + { + "epoch": 2.5, + "learning_rate": 2.0093099613541935e-05, + "loss": 1.476, + "step": 31773 + }, + { + "epoch": 2.5, + "learning_rate": 2.0086920637459775e-05, + "loss": 1.4346, + "step": 31774 + }, + { + "epoch": 2.5, + "learning_rate": 2.0080742543415706e-05, + "loss": 1.4019, + "step": 31775 + }, + { + "epoch": 2.5, + "learning_rate": 2.007456533145173e-05, + "loss": 1.4705, + "step": 31776 + }, + { + "epoch": 2.5, + "learning_rate": 2.0068389001609765e-05, + "loss": 1.4702, + "step": 31777 + }, + { + "epoch": 2.5, + "learning_rate": 2.0062213553931688e-05, + "loss": 1.4633, + "step": 31778 + }, + { + "epoch": 2.5, + "learning_rate": 2.005603898845952e-05, + "loss": 1.4492, + "step": 31779 + }, + { + "epoch": 2.5, + "learning_rate": 2.004986530523513e-05, + "loss": 1.4292, + "step": 31780 + }, + { + "epoch": 2.5, + "learning_rate": 2.0043692504300412e-05, + "loss": 1.4822, + "step": 31781 + }, + { + "epoch": 2.5, + "learning_rate": 2.0037520585697337e-05, + "loss": 1.4506, + "step": 31782 + }, + { + "epoch": 2.5, + "learning_rate": 2.0031349549467786e-05, + "loss": 1.4402, + "step": 31783 + }, + { + "epoch": 2.5, + "learning_rate": 2.002517939565364e-05, + "loss": 1.4509, + "step": 31784 + }, + { + "epoch": 2.5, + "learning_rate": 2.001901012429677e-05, + "loss": 1.4491, + "step": 31785 + }, + { + "epoch": 2.5, + "learning_rate": 2.0012841735439106e-05, + "loss": 1.4227, + "step": 31786 + }, + { + "epoch": 2.5, + "learning_rate": 2.0006674229122532e-05, + "loss": 1.5069, + "step": 31787 + }, + { + "epoch": 2.5, + "learning_rate": 2.00005076053889e-05, + "loss": 1.4738, + "step": 31788 + }, + { + "epoch": 2.5, + "learning_rate": 1.9994341864280054e-05, + "loss": 1.4315, + "step": 31789 + }, + { + "epoch": 2.5, + "learning_rate": 1.998817700583792e-05, + "loss": 1.4228, + "step": 31790 + }, + { + "epoch": 2.5, + "learning_rate": 1.9982013030104305e-05, + "loss": 1.4225, + "step": 31791 + }, + { + "epoch": 2.5, + "learning_rate": 1.9975849937121047e-05, + "loss": 1.437, + "step": 31792 + }, + { + "epoch": 2.5, + "learning_rate": 1.9969687726930063e-05, + "loss": 1.4363, + "step": 31793 + }, + { + "epoch": 2.5, + "learning_rate": 1.9963526399573116e-05, + "loss": 1.4539, + "step": 31794 + }, + { + "epoch": 2.5, + "learning_rate": 1.995736595509204e-05, + "loss": 1.3937, + "step": 31795 + }, + { + "epoch": 2.5, + "learning_rate": 1.9951206393528725e-05, + "loss": 1.4271, + "step": 31796 + }, + { + "epoch": 2.5, + "learning_rate": 1.994504771492496e-05, + "loss": 1.4918, + "step": 31797 + }, + { + "epoch": 2.5, + "learning_rate": 1.9938889919322503e-05, + "loss": 1.4293, + "step": 31798 + }, + { + "epoch": 2.5, + "learning_rate": 1.9932733006763253e-05, + "loss": 1.5098, + "step": 31799 + }, + { + "epoch": 2.5, + "learning_rate": 1.9926576977288957e-05, + "loss": 1.4085, + "step": 31800 + }, + { + "epoch": 2.5, + "learning_rate": 1.992042183094143e-05, + "loss": 1.4553, + "step": 31801 + }, + { + "epoch": 2.5, + "learning_rate": 1.9914267567762393e-05, + "loss": 1.4769, + "step": 31802 + }, + { + "epoch": 2.5, + "learning_rate": 1.9908114187793745e-05, + "loss": 1.4298, + "step": 31803 + }, + { + "epoch": 2.5, + "learning_rate": 1.9901961691077217e-05, + "loss": 1.4051, + "step": 31804 + }, + { + "epoch": 2.5, + "learning_rate": 1.9895810077654545e-05, + "loss": 1.481, + "step": 31805 + }, + { + "epoch": 2.5, + "learning_rate": 1.988965934756756e-05, + "loss": 1.4158, + "step": 31806 + }, + { + "epoch": 2.5, + "learning_rate": 1.988350950085798e-05, + "loss": 1.443, + "step": 31807 + }, + { + "epoch": 2.5, + "learning_rate": 1.987736053756757e-05, + "loss": 1.5291, + "step": 31808 + }, + { + "epoch": 2.5, + "learning_rate": 1.987121245773805e-05, + "loss": 1.4104, + "step": 31809 + }, + { + "epoch": 2.5, + "learning_rate": 1.98650652614112e-05, + "loss": 1.407, + "step": 31810 + }, + { + "epoch": 2.5, + "learning_rate": 1.9858918948628755e-05, + "loss": 1.4284, + "step": 31811 + }, + { + "epoch": 2.5, + "learning_rate": 1.9852773519432398e-05, + "loss": 1.4846, + "step": 31812 + }, + { + "epoch": 2.5, + "learning_rate": 1.9846628973863928e-05, + "loss": 1.4622, + "step": 31813 + }, + { + "epoch": 2.5, + "learning_rate": 1.984048531196501e-05, + "loss": 1.4456, + "step": 31814 + }, + { + "epoch": 2.5, + "learning_rate": 1.9834342533777347e-05, + "loss": 1.4303, + "step": 31815 + }, + { + "epoch": 2.5, + "learning_rate": 1.982820063934269e-05, + "loss": 1.4673, + "step": 31816 + }, + { + "epoch": 2.5, + "learning_rate": 1.982205962870272e-05, + "loss": 1.4382, + "step": 31817 + }, + { + "epoch": 2.5, + "learning_rate": 1.9815919501899086e-05, + "loss": 1.4923, + "step": 31818 + }, + { + "epoch": 2.5, + "learning_rate": 1.980978025897354e-05, + "loss": 1.4049, + "step": 31819 + }, + { + "epoch": 2.5, + "learning_rate": 1.980364189996775e-05, + "loss": 1.462, + "step": 31820 + }, + { + "epoch": 2.5, + "learning_rate": 1.9797504424923394e-05, + "loss": 1.4384, + "step": 31821 + }, + { + "epoch": 2.5, + "learning_rate": 1.9791367833882095e-05, + "loss": 1.4756, + "step": 31822 + }, + { + "epoch": 2.5, + "learning_rate": 1.97852321268856e-05, + "loss": 1.4175, + "step": 31823 + }, + { + "epoch": 2.5, + "learning_rate": 1.9779097303975507e-05, + "loss": 1.4425, + "step": 31824 + }, + { + "epoch": 2.5, + "learning_rate": 1.977296336519347e-05, + "loss": 1.4662, + "step": 31825 + }, + { + "epoch": 2.5, + "learning_rate": 1.9766830310581134e-05, + "loss": 1.4682, + "step": 31826 + }, + { + "epoch": 2.5, + "learning_rate": 1.976069814018017e-05, + "loss": 1.4459, + "step": 31827 + }, + { + "epoch": 2.5, + "learning_rate": 1.975456685403221e-05, + "loss": 1.4603, + "step": 31828 + }, + { + "epoch": 2.5, + "learning_rate": 1.9748436452178822e-05, + "loss": 1.4314, + "step": 31829 + }, + { + "epoch": 2.5, + "learning_rate": 1.9742306934661706e-05, + "loss": 1.4829, + "step": 31830 + }, + { + "epoch": 2.5, + "learning_rate": 1.9736178301522444e-05, + "loss": 1.4394, + "step": 31831 + }, + { + "epoch": 2.5, + "learning_rate": 1.97300505528026e-05, + "loss": 1.4333, + "step": 31832 + }, + { + "epoch": 2.5, + "learning_rate": 1.9723923688543846e-05, + "loss": 1.4801, + "step": 31833 + }, + { + "epoch": 2.5, + "learning_rate": 1.971779770878778e-05, + "loss": 1.4441, + "step": 31834 + }, + { + "epoch": 2.5, + "learning_rate": 1.971167261357597e-05, + "loss": 1.4705, + "step": 31835 + }, + { + "epoch": 2.5, + "learning_rate": 1.970554840294998e-05, + "loss": 1.4841, + "step": 31836 + }, + { + "epoch": 2.5, + "learning_rate": 1.969942507695144e-05, + "loss": 1.4166, + "step": 31837 + }, + { + "epoch": 2.51, + "learning_rate": 1.9693302635621894e-05, + "loss": 1.4398, + "step": 31838 + }, + { + "epoch": 2.51, + "learning_rate": 1.9687181079002883e-05, + "loss": 1.4521, + "step": 31839 + }, + { + "epoch": 2.51, + "learning_rate": 1.9681060407136047e-05, + "loss": 1.4716, + "step": 31840 + }, + { + "epoch": 2.51, + "learning_rate": 1.967494062006288e-05, + "loss": 1.4823, + "step": 31841 + }, + { + "epoch": 2.51, + "learning_rate": 1.966882171782495e-05, + "loss": 1.4931, + "step": 31842 + }, + { + "epoch": 2.51, + "learning_rate": 1.966270370046376e-05, + "loss": 1.4496, + "step": 31843 + }, + { + "epoch": 2.51, + "learning_rate": 1.9656586568020927e-05, + "loss": 1.4318, + "step": 31844 + }, + { + "epoch": 2.51, + "learning_rate": 1.9650470320537947e-05, + "loss": 1.4833, + "step": 31845 + }, + { + "epoch": 2.51, + "learning_rate": 1.9644354958056292e-05, + "loss": 1.461, + "step": 31846 + }, + { + "epoch": 2.51, + "learning_rate": 1.9638240480617574e-05, + "loss": 1.4184, + "step": 31847 + }, + { + "epoch": 2.51, + "learning_rate": 1.963212688826326e-05, + "loss": 1.4505, + "step": 31848 + }, + { + "epoch": 2.51, + "learning_rate": 1.962601418103482e-05, + "loss": 1.4946, + "step": 31849 + }, + { + "epoch": 2.51, + "learning_rate": 1.961990235897382e-05, + "loss": 1.4509, + "step": 31850 + }, + { + "epoch": 2.51, + "learning_rate": 1.9613791422121743e-05, + "loss": 1.439, + "step": 31851 + }, + { + "epoch": 2.51, + "learning_rate": 1.960768137052009e-05, + "loss": 1.4405, + "step": 31852 + }, + { + "epoch": 2.51, + "learning_rate": 1.9601572204210274e-05, + "loss": 1.3877, + "step": 31853 + }, + { + "epoch": 2.51, + "learning_rate": 1.959546392323387e-05, + "loss": 1.4546, + "step": 31854 + }, + { + "epoch": 2.51, + "learning_rate": 1.958935652763228e-05, + "loss": 1.4812, + "step": 31855 + }, + { + "epoch": 2.51, + "learning_rate": 1.9583250017446987e-05, + "loss": 1.4044, + "step": 31856 + }, + { + "epoch": 2.51, + "learning_rate": 1.9577144392719467e-05, + "loss": 1.4594, + "step": 31857 + }, + { + "epoch": 2.51, + "learning_rate": 1.9571039653491187e-05, + "loss": 1.464, + "step": 31858 + }, + { + "epoch": 2.51, + "learning_rate": 1.9564935799803517e-05, + "loss": 1.4971, + "step": 31859 + }, + { + "epoch": 2.51, + "learning_rate": 1.9558832831698003e-05, + "loss": 1.4729, + "step": 31860 + }, + { + "epoch": 2.51, + "learning_rate": 1.9552730749216013e-05, + "loss": 1.3664, + "step": 31861 + }, + { + "epoch": 2.51, + "learning_rate": 1.9546629552398997e-05, + "loss": 1.4431, + "step": 31862 + }, + { + "epoch": 2.51, + "learning_rate": 1.9540529241288356e-05, + "loss": 1.4458, + "step": 31863 + }, + { + "epoch": 2.51, + "learning_rate": 1.9534429815925557e-05, + "loss": 1.4882, + "step": 31864 + }, + { + "epoch": 2.51, + "learning_rate": 1.952833127635195e-05, + "loss": 1.448, + "step": 31865 + }, + { + "epoch": 2.51, + "learning_rate": 1.9522233622609e-05, + "loss": 1.4676, + "step": 31866 + }, + { + "epoch": 2.51, + "learning_rate": 1.9516136854738046e-05, + "loss": 1.4876, + "step": 31867 + }, + { + "epoch": 2.51, + "learning_rate": 1.951004097278055e-05, + "loss": 1.4282, + "step": 31868 + }, + { + "epoch": 2.51, + "learning_rate": 1.9503945976777864e-05, + "loss": 1.4602, + "step": 31869 + }, + { + "epoch": 2.51, + "learning_rate": 1.9497851866771354e-05, + "loss": 1.4812, + "step": 31870 + }, + { + "epoch": 2.51, + "learning_rate": 1.9491758642802435e-05, + "loss": 1.4279, + "step": 31871 + }, + { + "epoch": 2.51, + "learning_rate": 1.9485666304912446e-05, + "loss": 1.485, + "step": 31872 + }, + { + "epoch": 2.51, + "learning_rate": 1.9479574853142733e-05, + "loss": 1.4659, + "step": 31873 + }, + { + "epoch": 2.51, + "learning_rate": 1.9473484287534714e-05, + "loss": 1.4138, + "step": 31874 + }, + { + "epoch": 2.51, + "learning_rate": 1.9467394608129706e-05, + "loss": 1.4148, + "step": 31875 + }, + { + "epoch": 2.51, + "learning_rate": 1.9461305814969026e-05, + "loss": 1.4285, + "step": 31876 + }, + { + "epoch": 2.51, + "learning_rate": 1.945521790809407e-05, + "loss": 1.4995, + "step": 31877 + }, + { + "epoch": 2.51, + "learning_rate": 1.9449130887546132e-05, + "loss": 1.4865, + "step": 31878 + }, + { + "epoch": 2.51, + "learning_rate": 1.944304475336657e-05, + "loss": 1.4749, + "step": 31879 + }, + { + "epoch": 2.51, + "learning_rate": 1.943695950559662e-05, + "loss": 1.4486, + "step": 31880 + }, + { + "epoch": 2.51, + "learning_rate": 1.943087514427772e-05, + "loss": 1.389, + "step": 31881 + }, + { + "epoch": 2.51, + "learning_rate": 1.9424791669451127e-05, + "loss": 1.4641, + "step": 31882 + }, + { + "epoch": 2.51, + "learning_rate": 1.9418709081158152e-05, + "loss": 1.4648, + "step": 31883 + }, + { + "epoch": 2.51, + "learning_rate": 1.941262737944004e-05, + "loss": 1.4275, + "step": 31884 + }, + { + "epoch": 2.51, + "learning_rate": 1.9406546564338155e-05, + "loss": 1.3989, + "step": 31885 + }, + { + "epoch": 2.51, + "learning_rate": 1.940046663589375e-05, + "loss": 1.4641, + "step": 31886 + }, + { + "epoch": 2.51, + "learning_rate": 1.9394387594148082e-05, + "loss": 1.4875, + "step": 31887 + }, + { + "epoch": 2.51, + "learning_rate": 1.9388309439142473e-05, + "loss": 1.4505, + "step": 31888 + }, + { + "epoch": 2.51, + "learning_rate": 1.9382232170918167e-05, + "loss": 1.4032, + "step": 31889 + }, + { + "epoch": 2.51, + "learning_rate": 1.937615578951639e-05, + "loss": 1.501, + "step": 31890 + }, + { + "epoch": 2.51, + "learning_rate": 1.9370080294978463e-05, + "loss": 1.4877, + "step": 31891 + }, + { + "epoch": 2.51, + "learning_rate": 1.9364005687345603e-05, + "loss": 1.4367, + "step": 31892 + }, + { + "epoch": 2.51, + "learning_rate": 1.9357931966659025e-05, + "loss": 1.3743, + "step": 31893 + }, + { + "epoch": 2.51, + "learning_rate": 1.935185913296003e-05, + "loss": 1.4148, + "step": 31894 + }, + { + "epoch": 2.51, + "learning_rate": 1.93457871862898e-05, + "loss": 1.4492, + "step": 31895 + }, + { + "epoch": 2.51, + "learning_rate": 1.9339716126689557e-05, + "loss": 1.4277, + "step": 31896 + }, + { + "epoch": 2.51, + "learning_rate": 1.9333645954200515e-05, + "loss": 1.4524, + "step": 31897 + }, + { + "epoch": 2.51, + "learning_rate": 1.932757666886396e-05, + "loss": 1.4407, + "step": 31898 + }, + { + "epoch": 2.51, + "learning_rate": 1.9321508270721054e-05, + "loss": 1.469, + "step": 31899 + }, + { + "epoch": 2.51, + "learning_rate": 1.9315440759812983e-05, + "loss": 1.4045, + "step": 31900 + }, + { + "epoch": 2.51, + "learning_rate": 1.9309374136180916e-05, + "loss": 1.4803, + "step": 31901 + }, + { + "epoch": 2.51, + "learning_rate": 1.9303308399866118e-05, + "loss": 1.4823, + "step": 31902 + }, + { + "epoch": 2.51, + "learning_rate": 1.9297243550909724e-05, + "loss": 1.4427, + "step": 31903 + }, + { + "epoch": 2.51, + "learning_rate": 1.9291179589352902e-05, + "loss": 1.4534, + "step": 31904 + }, + { + "epoch": 2.51, + "learning_rate": 1.9285116515236847e-05, + "loss": 1.4325, + "step": 31905 + }, + { + "epoch": 2.51, + "learning_rate": 1.9279054328602733e-05, + "loss": 1.4217, + "step": 31906 + }, + { + "epoch": 2.51, + "learning_rate": 1.9272993029491672e-05, + "loss": 1.4462, + "step": 31907 + }, + { + "epoch": 2.51, + "learning_rate": 1.9266932617944868e-05, + "loss": 1.4233, + "step": 31908 + }, + { + "epoch": 2.51, + "learning_rate": 1.9260873094003456e-05, + "loss": 1.4613, + "step": 31909 + }, + { + "epoch": 2.51, + "learning_rate": 1.925481445770853e-05, + "loss": 1.4139, + "step": 31910 + }, + { + "epoch": 2.51, + "learning_rate": 1.924875670910131e-05, + "loss": 1.4384, + "step": 31911 + }, + { + "epoch": 2.51, + "learning_rate": 1.924269984822283e-05, + "loss": 1.5122, + "step": 31912 + }, + { + "epoch": 2.51, + "learning_rate": 1.9236643875114294e-05, + "loss": 1.4297, + "step": 31913 + }, + { + "epoch": 2.51, + "learning_rate": 1.9230588789816748e-05, + "loss": 1.4462, + "step": 31914 + }, + { + "epoch": 2.51, + "learning_rate": 1.9224534592371375e-05, + "loss": 1.4441, + "step": 31915 + }, + { + "epoch": 2.51, + "learning_rate": 1.9218481282819246e-05, + "loss": 1.447, + "step": 31916 + }, + { + "epoch": 2.51, + "learning_rate": 1.921242886120143e-05, + "loss": 1.4316, + "step": 31917 + }, + { + "epoch": 2.51, + "learning_rate": 1.9206377327559086e-05, + "loss": 1.4337, + "step": 31918 + }, + { + "epoch": 2.51, + "learning_rate": 1.9200326681933254e-05, + "loss": 1.4408, + "step": 31919 + }, + { + "epoch": 2.51, + "learning_rate": 1.9194276924365014e-05, + "loss": 1.4664, + "step": 31920 + }, + { + "epoch": 2.51, + "learning_rate": 1.9188228054895423e-05, + "loss": 1.4237, + "step": 31921 + }, + { + "epoch": 2.51, + "learning_rate": 1.9182180073565607e-05, + "loss": 1.4858, + "step": 31922 + }, + { + "epoch": 2.51, + "learning_rate": 1.9176132980416603e-05, + "loss": 1.4607, + "step": 31923 + }, + { + "epoch": 2.51, + "learning_rate": 1.917008677548943e-05, + "loss": 1.4484, + "step": 31924 + }, + { + "epoch": 2.51, + "learning_rate": 1.9164041458825185e-05, + "loss": 1.4608, + "step": 31925 + }, + { + "epoch": 2.51, + "learning_rate": 1.9157997030464906e-05, + "loss": 1.4546, + "step": 31926 + }, + { + "epoch": 2.51, + "learning_rate": 1.9151953490449607e-05, + "loss": 1.5011, + "step": 31927 + }, + { + "epoch": 2.51, + "learning_rate": 1.9145910838820322e-05, + "loss": 1.5167, + "step": 31928 + }, + { + "epoch": 2.51, + "learning_rate": 1.913986907561812e-05, + "loss": 1.4135, + "step": 31929 + }, + { + "epoch": 2.51, + "learning_rate": 1.9133828200884e-05, + "loss": 1.4969, + "step": 31930 + }, + { + "epoch": 2.51, + "learning_rate": 1.912778821465893e-05, + "loss": 1.5326, + "step": 31931 + }, + { + "epoch": 2.51, + "learning_rate": 1.9121749116983992e-05, + "loss": 1.4341, + "step": 31932 + }, + { + "epoch": 2.51, + "learning_rate": 1.9115710907900157e-05, + "loss": 1.4757, + "step": 31933 + }, + { + "epoch": 2.51, + "learning_rate": 1.910967358744837e-05, + "loss": 1.4345, + "step": 31934 + }, + { + "epoch": 2.51, + "learning_rate": 1.910363715566972e-05, + "loss": 1.4098, + "step": 31935 + }, + { + "epoch": 2.51, + "learning_rate": 1.9097601612605125e-05, + "loss": 1.452, + "step": 31936 + }, + { + "epoch": 2.51, + "learning_rate": 1.909156695829558e-05, + "loss": 1.4598, + "step": 31937 + }, + { + "epoch": 2.51, + "learning_rate": 1.908553319278202e-05, + "loss": 1.4366, + "step": 31938 + }, + { + "epoch": 2.51, + "learning_rate": 1.9079500316105485e-05, + "loss": 1.5198, + "step": 31939 + }, + { + "epoch": 2.51, + "learning_rate": 1.9073468328306903e-05, + "loss": 1.4775, + "step": 31940 + }, + { + "epoch": 2.51, + "learning_rate": 1.9067437229427172e-05, + "loss": 1.4269, + "step": 31941 + }, + { + "epoch": 2.51, + "learning_rate": 1.9061407019507317e-05, + "loss": 1.471, + "step": 31942 + }, + { + "epoch": 2.51, + "learning_rate": 1.905537769858822e-05, + "loss": 1.5256, + "step": 31943 + }, + { + "epoch": 2.51, + "learning_rate": 1.9049349266710893e-05, + "loss": 1.4601, + "step": 31944 + }, + { + "epoch": 2.51, + "learning_rate": 1.904332172391618e-05, + "loss": 1.4405, + "step": 31945 + }, + { + "epoch": 2.51, + "learning_rate": 1.9037295070245067e-05, + "loss": 1.4613, + "step": 31946 + }, + { + "epoch": 2.51, + "learning_rate": 1.9031269305738467e-05, + "loss": 1.3943, + "step": 31947 + }, + { + "epoch": 2.51, + "learning_rate": 1.9025244430437227e-05, + "loss": 1.4585, + "step": 31948 + }, + { + "epoch": 2.51, + "learning_rate": 1.9019220444382345e-05, + "loss": 1.4406, + "step": 31949 + }, + { + "epoch": 2.51, + "learning_rate": 1.9013197347614656e-05, + "loss": 1.4752, + "step": 31950 + }, + { + "epoch": 2.51, + "learning_rate": 1.9007175140175064e-05, + "loss": 1.444, + "step": 31951 + }, + { + "epoch": 2.51, + "learning_rate": 1.900115382210448e-05, + "loss": 1.4441, + "step": 31952 + }, + { + "epoch": 2.51, + "learning_rate": 1.899513339344378e-05, + "loss": 1.4548, + "step": 31953 + }, + { + "epoch": 2.51, + "learning_rate": 1.898911385423382e-05, + "loss": 1.4933, + "step": 31954 + }, + { + "epoch": 2.51, + "learning_rate": 1.898309520451545e-05, + "loss": 1.443, + "step": 31955 + }, + { + "epoch": 2.51, + "learning_rate": 1.8977077444329603e-05, + "loss": 1.4428, + "step": 31956 + }, + { + "epoch": 2.51, + "learning_rate": 1.897106057371709e-05, + "loss": 1.4355, + "step": 31957 + }, + { + "epoch": 2.51, + "learning_rate": 1.8965044592718724e-05, + "loss": 1.4902, + "step": 31958 + }, + { + "epoch": 2.51, + "learning_rate": 1.8959029501375412e-05, + "loss": 1.4368, + "step": 31959 + }, + { + "epoch": 2.51, + "learning_rate": 1.8953015299727996e-05, + "loss": 1.432, + "step": 31960 + }, + { + "epoch": 2.51, + "learning_rate": 1.89470019878173e-05, + "loss": 1.42, + "step": 31961 + }, + { + "epoch": 2.51, + "learning_rate": 1.894098956568409e-05, + "loss": 1.479, + "step": 31962 + }, + { + "epoch": 2.51, + "learning_rate": 1.893497803336928e-05, + "loss": 1.4209, + "step": 31963 + }, + { + "epoch": 2.51, + "learning_rate": 1.892896739091364e-05, + "loss": 1.4885, + "step": 31964 + }, + { + "epoch": 2.52, + "learning_rate": 1.8922957638357955e-05, + "loss": 1.4974, + "step": 31965 + }, + { + "epoch": 2.52, + "learning_rate": 1.8916948775743073e-05, + "loss": 1.4365, + "step": 31966 + }, + { + "epoch": 2.52, + "learning_rate": 1.891094080310978e-05, + "loss": 1.4809, + "step": 31967 + }, + { + "epoch": 2.52, + "learning_rate": 1.8904933720498828e-05, + "loss": 1.4595, + "step": 31968 + }, + { + "epoch": 2.52, + "learning_rate": 1.8898927527951062e-05, + "loss": 1.4201, + "step": 31969 + }, + { + "epoch": 2.52, + "learning_rate": 1.889292222550722e-05, + "loss": 1.5028, + "step": 31970 + }, + { + "epoch": 2.52, + "learning_rate": 1.8886917813208076e-05, + "loss": 1.4689, + "step": 31971 + }, + { + "epoch": 2.52, + "learning_rate": 1.8880914291094418e-05, + "loss": 1.447, + "step": 31972 + }, + { + "epoch": 2.52, + "learning_rate": 1.8874911659207004e-05, + "loss": 1.4453, + "step": 31973 + }, + { + "epoch": 2.52, + "learning_rate": 1.8868909917586566e-05, + "loss": 1.4356, + "step": 31974 + }, + { + "epoch": 2.52, + "learning_rate": 1.8862909066273806e-05, + "loss": 1.4787, + "step": 31975 + }, + { + "epoch": 2.52, + "learning_rate": 1.885690910530959e-05, + "loss": 1.4517, + "step": 31976 + }, + { + "epoch": 2.52, + "learning_rate": 1.8850910034734605e-05, + "loss": 1.4896, + "step": 31977 + }, + { + "epoch": 2.52, + "learning_rate": 1.884491185458955e-05, + "loss": 1.447, + "step": 31978 + }, + { + "epoch": 2.52, + "learning_rate": 1.883891456491514e-05, + "loss": 1.4559, + "step": 31979 + }, + { + "epoch": 2.52, + "learning_rate": 1.8832918165752164e-05, + "loss": 1.4453, + "step": 31980 + }, + { + "epoch": 2.52, + "learning_rate": 1.882692265714127e-05, + "loss": 1.3889, + "step": 31981 + }, + { + "epoch": 2.52, + "learning_rate": 1.8820928039123155e-05, + "loss": 1.4508, + "step": 31982 + }, + { + "epoch": 2.52, + "learning_rate": 1.8814934311738595e-05, + "loss": 1.4263, + "step": 31983 + }, + { + "epoch": 2.52, + "learning_rate": 1.8808941475028217e-05, + "loss": 1.4944, + "step": 31984 + }, + { + "epoch": 2.52, + "learning_rate": 1.8802949529032706e-05, + "loss": 1.5354, + "step": 31985 + }, + { + "epoch": 2.52, + "learning_rate": 1.87969584737928e-05, + "loss": 1.4878, + "step": 31986 + }, + { + "epoch": 2.52, + "learning_rate": 1.8790968309349147e-05, + "loss": 1.4882, + "step": 31987 + }, + { + "epoch": 2.52, + "learning_rate": 1.878497903574238e-05, + "loss": 1.4301, + "step": 31988 + }, + { + "epoch": 2.52, + "learning_rate": 1.877899065301322e-05, + "loss": 1.4213, + "step": 31989 + }, + { + "epoch": 2.52, + "learning_rate": 1.8773003161202265e-05, + "loss": 1.4187, + "step": 31990 + }, + { + "epoch": 2.52, + "learning_rate": 1.8767016560350234e-05, + "loss": 1.4727, + "step": 31991 + }, + { + "epoch": 2.52, + "learning_rate": 1.8761030850497726e-05, + "loss": 1.4716, + "step": 31992 + }, + { + "epoch": 2.52, + "learning_rate": 1.875504603168541e-05, + "loss": 1.4096, + "step": 31993 + }, + { + "epoch": 2.52, + "learning_rate": 1.8749062103953903e-05, + "loss": 1.4491, + "step": 31994 + }, + { + "epoch": 2.52, + "learning_rate": 1.8743079067343842e-05, + "loss": 1.4827, + "step": 31995 + }, + { + "epoch": 2.52, + "learning_rate": 1.8737096921895806e-05, + "loss": 1.4609, + "step": 31996 + }, + { + "epoch": 2.52, + "learning_rate": 1.873111566765048e-05, + "loss": 1.4707, + "step": 31997 + }, + { + "epoch": 2.52, + "learning_rate": 1.8725135304648437e-05, + "loss": 1.4421, + "step": 31998 + }, + { + "epoch": 2.52, + "learning_rate": 1.8719155832930237e-05, + "loss": 1.4626, + "step": 31999 + }, + { + "epoch": 2.52, + "learning_rate": 1.871317725253657e-05, + "loss": 1.4421, + "step": 32000 + }, + { + "epoch": 2.52, + "learning_rate": 1.8707199563507967e-05, + "loss": 1.4212, + "step": 32001 + }, + { + "epoch": 2.52, + "learning_rate": 1.8701222765885e-05, + "loss": 1.4518, + "step": 32002 + }, + { + "epoch": 2.52, + "learning_rate": 1.8695246859708314e-05, + "loss": 1.4519, + "step": 32003 + }, + { + "epoch": 2.52, + "learning_rate": 1.8689271845018427e-05, + "loss": 1.4856, + "step": 32004 + }, + { + "epoch": 2.52, + "learning_rate": 1.868329772185591e-05, + "loss": 1.4433, + "step": 32005 + }, + { + "epoch": 2.52, + "learning_rate": 1.8677324490261315e-05, + "loss": 1.4778, + "step": 32006 + }, + { + "epoch": 2.52, + "learning_rate": 1.8671352150275253e-05, + "loss": 1.4003, + "step": 32007 + }, + { + "epoch": 2.52, + "learning_rate": 1.8665380701938248e-05, + "loss": 1.4653, + "step": 32008 + }, + { + "epoch": 2.52, + "learning_rate": 1.8659410145290782e-05, + "loss": 1.461, + "step": 32009 + }, + { + "epoch": 2.52, + "learning_rate": 1.865344048037349e-05, + "loss": 1.448, + "step": 32010 + }, + { + "epoch": 2.52, + "learning_rate": 1.8647471707226837e-05, + "loss": 1.4669, + "step": 32011 + }, + { + "epoch": 2.52, + "learning_rate": 1.8641503825891373e-05, + "loss": 1.4688, + "step": 32012 + }, + { + "epoch": 2.52, + "learning_rate": 1.863553683640759e-05, + "loss": 1.471, + "step": 32013 + }, + { + "epoch": 2.52, + "learning_rate": 1.862957073881603e-05, + "loss": 1.4664, + "step": 32014 + }, + { + "epoch": 2.52, + "learning_rate": 1.86236055331572e-05, + "loss": 1.4565, + "step": 32015 + }, + { + "epoch": 2.52, + "learning_rate": 1.8617641219471547e-05, + "loss": 1.4754, + "step": 32016 + }, + { + "epoch": 2.52, + "learning_rate": 1.8611677797799656e-05, + "loss": 1.4995, + "step": 32017 + }, + { + "epoch": 2.52, + "learning_rate": 1.860571526818195e-05, + "loss": 1.4531, + "step": 32018 + }, + { + "epoch": 2.52, + "learning_rate": 1.8599753630658902e-05, + "loss": 1.4192, + "step": 32019 + }, + { + "epoch": 2.52, + "learning_rate": 1.8593792885271043e-05, + "loss": 1.4719, + "step": 32020 + }, + { + "epoch": 2.52, + "learning_rate": 1.858783303205883e-05, + "loss": 1.4275, + "step": 32021 + }, + { + "epoch": 2.52, + "learning_rate": 1.858187407106267e-05, + "loss": 1.4196, + "step": 32022 + }, + { + "epoch": 2.52, + "learning_rate": 1.857591600232306e-05, + "loss": 1.4617, + "step": 32023 + }, + { + "epoch": 2.52, + "learning_rate": 1.856995882588047e-05, + "loss": 1.4539, + "step": 32024 + }, + { + "epoch": 2.52, + "learning_rate": 1.8564002541775354e-05, + "loss": 1.4463, + "step": 32025 + }, + { + "epoch": 2.52, + "learning_rate": 1.8558047150048088e-05, + "loss": 1.4001, + "step": 32026 + }, + { + "epoch": 2.52, + "learning_rate": 1.855209265073918e-05, + "loss": 1.4503, + "step": 32027 + }, + { + "epoch": 2.52, + "learning_rate": 1.854613904388903e-05, + "loss": 1.4499, + "step": 32028 + }, + { + "epoch": 2.52, + "learning_rate": 1.854018632953802e-05, + "loss": 1.3729, + "step": 32029 + }, + { + "epoch": 2.52, + "learning_rate": 1.8534234507726618e-05, + "loss": 1.4096, + "step": 32030 + }, + { + "epoch": 2.52, + "learning_rate": 1.852828357849523e-05, + "loss": 1.436, + "step": 32031 + }, + { + "epoch": 2.52, + "learning_rate": 1.8522333541884233e-05, + "loss": 1.3967, + "step": 32032 + }, + { + "epoch": 2.52, + "learning_rate": 1.8516384397934016e-05, + "loss": 1.443, + "step": 32033 + }, + { + "epoch": 2.52, + "learning_rate": 1.851043614668501e-05, + "loss": 1.4903, + "step": 32034 + }, + { + "epoch": 2.52, + "learning_rate": 1.8504488788177584e-05, + "loss": 1.4491, + "step": 32035 + }, + { + "epoch": 2.52, + "learning_rate": 1.849854232245209e-05, + "loss": 1.4741, + "step": 32036 + }, + { + "epoch": 2.52, + "learning_rate": 1.849259674954895e-05, + "loss": 1.4279, + "step": 32037 + }, + { + "epoch": 2.52, + "learning_rate": 1.848665206950847e-05, + "loss": 1.3821, + "step": 32038 + }, + { + "epoch": 2.52, + "learning_rate": 1.848070828237108e-05, + "loss": 1.4772, + "step": 32039 + }, + { + "epoch": 2.52, + "learning_rate": 1.8474765388177076e-05, + "loss": 1.4412, + "step": 32040 + }, + { + "epoch": 2.52, + "learning_rate": 1.8468823386966875e-05, + "loss": 1.3938, + "step": 32041 + }, + { + "epoch": 2.52, + "learning_rate": 1.8462882278780762e-05, + "loss": 1.4291, + "step": 32042 + }, + { + "epoch": 2.52, + "learning_rate": 1.845694206365907e-05, + "loss": 1.4098, + "step": 32043 + }, + { + "epoch": 2.52, + "learning_rate": 1.845100274164217e-05, + "loss": 1.4706, + "step": 32044 + }, + { + "epoch": 2.52, + "learning_rate": 1.8445064312770374e-05, + "loss": 1.4162, + "step": 32045 + }, + { + "epoch": 2.52, + "learning_rate": 1.8439126777083956e-05, + "loss": 1.5098, + "step": 32046 + }, + { + "epoch": 2.52, + "learning_rate": 1.8433190134623298e-05, + "loss": 1.416, + "step": 32047 + }, + { + "epoch": 2.52, + "learning_rate": 1.8427254385428685e-05, + "loss": 1.4068, + "step": 32048 + }, + { + "epoch": 2.52, + "learning_rate": 1.8421319529540402e-05, + "loss": 1.4494, + "step": 32049 + }, + { + "epoch": 2.52, + "learning_rate": 1.8415385566998714e-05, + "loss": 1.494, + "step": 32050 + }, + { + "epoch": 2.52, + "learning_rate": 1.8409452497843973e-05, + "loss": 1.4699, + "step": 32051 + }, + { + "epoch": 2.52, + "learning_rate": 1.8403520322116434e-05, + "loss": 1.4701, + "step": 32052 + }, + { + "epoch": 2.52, + "learning_rate": 1.839758903985634e-05, + "loss": 1.4668, + "step": 32053 + }, + { + "epoch": 2.52, + "learning_rate": 1.8391658651103985e-05, + "loss": 1.4563, + "step": 32054 + }, + { + "epoch": 2.52, + "learning_rate": 1.8385729155899682e-05, + "loss": 1.4928, + "step": 32055 + }, + { + "epoch": 2.52, + "learning_rate": 1.8379800554283646e-05, + "loss": 1.4748, + "step": 32056 + }, + { + "epoch": 2.52, + "learning_rate": 1.83738728462961e-05, + "loss": 1.4912, + "step": 32057 + }, + { + "epoch": 2.52, + "learning_rate": 1.8367946031977344e-05, + "loss": 1.4761, + "step": 32058 + }, + { + "epoch": 2.52, + "learning_rate": 1.836202011136761e-05, + "loss": 1.4171, + "step": 32059 + }, + { + "epoch": 2.52, + "learning_rate": 1.8356095084507066e-05, + "loss": 1.4506, + "step": 32060 + }, + { + "epoch": 2.52, + "learning_rate": 1.8350170951436033e-05, + "loss": 1.4574, + "step": 32061 + }, + { + "epoch": 2.52, + "learning_rate": 1.8344247712194675e-05, + "loss": 1.4716, + "step": 32062 + }, + { + "epoch": 2.52, + "learning_rate": 1.83383253668232e-05, + "loss": 1.4444, + "step": 32063 + }, + { + "epoch": 2.52, + "learning_rate": 1.8332403915361864e-05, + "loss": 1.4657, + "step": 32064 + }, + { + "epoch": 2.52, + "learning_rate": 1.8326483357850846e-05, + "loss": 1.4948, + "step": 32065 + }, + { + "epoch": 2.52, + "learning_rate": 1.832056369433036e-05, + "loss": 1.4301, + "step": 32066 + }, + { + "epoch": 2.52, + "learning_rate": 1.8314644924840523e-05, + "loss": 1.4215, + "step": 32067 + }, + { + "epoch": 2.52, + "learning_rate": 1.8308727049421618e-05, + "loss": 1.4523, + "step": 32068 + }, + { + "epoch": 2.52, + "learning_rate": 1.8302810068113766e-05, + "loss": 1.3938, + "step": 32069 + }, + { + "epoch": 2.52, + "learning_rate": 1.8296893980957135e-05, + "loss": 1.4089, + "step": 32070 + }, + { + "epoch": 2.52, + "learning_rate": 1.8290978787991957e-05, + "loss": 1.4282, + "step": 32071 + }, + { + "epoch": 2.52, + "learning_rate": 1.828506448925835e-05, + "loss": 1.4434, + "step": 32072 + }, + { + "epoch": 2.52, + "learning_rate": 1.8279151084796467e-05, + "loss": 1.4129, + "step": 32073 + }, + { + "epoch": 2.52, + "learning_rate": 1.8273238574646427e-05, + "loss": 1.3885, + "step": 32074 + }, + { + "epoch": 2.52, + "learning_rate": 1.8267326958848426e-05, + "loss": 1.4104, + "step": 32075 + }, + { + "epoch": 2.52, + "learning_rate": 1.8261416237442605e-05, + "loss": 1.4688, + "step": 32076 + }, + { + "epoch": 2.52, + "learning_rate": 1.8255506410469013e-05, + "loss": 1.4438, + "step": 32077 + }, + { + "epoch": 2.52, + "learning_rate": 1.8249597477967865e-05, + "loss": 1.4289, + "step": 32078 + }, + { + "epoch": 2.52, + "learning_rate": 1.8243689439979246e-05, + "loss": 1.4367, + "step": 32079 + }, + { + "epoch": 2.52, + "learning_rate": 1.8237782296543247e-05, + "loss": 1.4392, + "step": 32080 + }, + { + "epoch": 2.52, + "learning_rate": 1.823187604770001e-05, + "loss": 1.4579, + "step": 32081 + }, + { + "epoch": 2.52, + "learning_rate": 1.8225970693489627e-05, + "loss": 1.3934, + "step": 32082 + }, + { + "epoch": 2.52, + "learning_rate": 1.8220066233952146e-05, + "loss": 1.4447, + "step": 32083 + }, + { + "epoch": 2.52, + "learning_rate": 1.8214162669127736e-05, + "loss": 1.4449, + "step": 32084 + }, + { + "epoch": 2.52, + "learning_rate": 1.8208259999056396e-05, + "loss": 1.4388, + "step": 32085 + }, + { + "epoch": 2.52, + "learning_rate": 1.8202358223778263e-05, + "loss": 1.4761, + "step": 32086 + }, + { + "epoch": 2.52, + "learning_rate": 1.819645734333337e-05, + "loss": 1.4519, + "step": 32087 + }, + { + "epoch": 2.52, + "learning_rate": 1.819055735776182e-05, + "loss": 1.4626, + "step": 32088 + }, + { + "epoch": 2.52, + "learning_rate": 1.8184658267103665e-05, + "loss": 1.4222, + "step": 32089 + }, + { + "epoch": 2.52, + "learning_rate": 1.8178760071398918e-05, + "loss": 1.4816, + "step": 32090 + }, + { + "epoch": 2.52, + "learning_rate": 1.8172862770687617e-05, + "loss": 1.441, + "step": 32091 + }, + { + "epoch": 2.53, + "learning_rate": 1.8166966365009866e-05, + "loss": 1.4655, + "step": 32092 + }, + { + "epoch": 2.53, + "learning_rate": 1.8161070854405664e-05, + "loss": 1.4725, + "step": 32093 + }, + { + "epoch": 2.53, + "learning_rate": 1.8155176238914994e-05, + "loss": 1.4211, + "step": 32094 + }, + { + "epoch": 2.53, + "learning_rate": 1.8149282518577958e-05, + "loss": 1.4235, + "step": 32095 + }, + { + "epoch": 2.53, + "learning_rate": 1.814338969343454e-05, + "loss": 1.4331, + "step": 32096 + }, + { + "epoch": 2.53, + "learning_rate": 1.8137497763524693e-05, + "loss": 1.4555, + "step": 32097 + }, + { + "epoch": 2.53, + "learning_rate": 1.813160672888852e-05, + "loss": 1.5239, + "step": 32098 + }, + { + "epoch": 2.53, + "learning_rate": 1.8125716589565952e-05, + "loss": 1.4282, + "step": 32099 + }, + { + "epoch": 2.53, + "learning_rate": 1.811982734559696e-05, + "loss": 1.4628, + "step": 32100 + }, + { + "epoch": 2.53, + "learning_rate": 1.8113938997021578e-05, + "loss": 1.4941, + "step": 32101 + }, + { + "epoch": 2.53, + "learning_rate": 1.8108051543879787e-05, + "loss": 1.435, + "step": 32102 + }, + { + "epoch": 2.53, + "learning_rate": 1.8102164986211542e-05, + "loss": 1.4468, + "step": 32103 + }, + { + "epoch": 2.53, + "learning_rate": 1.8096279324056778e-05, + "loss": 1.4733, + "step": 32104 + }, + { + "epoch": 2.53, + "learning_rate": 1.809039455745553e-05, + "loss": 1.4431, + "step": 32105 + }, + { + "epoch": 2.53, + "learning_rate": 1.8084510686447694e-05, + "loss": 1.4467, + "step": 32106 + }, + { + "epoch": 2.53, + "learning_rate": 1.8078627711073247e-05, + "loss": 1.3905, + "step": 32107 + }, + { + "epoch": 2.53, + "learning_rate": 1.807274563137208e-05, + "loss": 1.4156, + "step": 32108 + }, + { + "epoch": 2.53, + "learning_rate": 1.8066864447384205e-05, + "loss": 1.435, + "step": 32109 + }, + { + "epoch": 2.53, + "learning_rate": 1.80609841591495e-05, + "loss": 1.4092, + "step": 32110 + }, + { + "epoch": 2.53, + "learning_rate": 1.8055104766707885e-05, + "loss": 1.4228, + "step": 32111 + }, + { + "epoch": 2.53, + "learning_rate": 1.8049226270099326e-05, + "loss": 1.4628, + "step": 32112 + }, + { + "epoch": 2.53, + "learning_rate": 1.8043348669363696e-05, + "loss": 1.3984, + "step": 32113 + }, + { + "epoch": 2.53, + "learning_rate": 1.803747196454087e-05, + "loss": 1.4489, + "step": 32114 + }, + { + "epoch": 2.53, + "learning_rate": 1.803159615567083e-05, + "loss": 1.5089, + "step": 32115 + }, + { + "epoch": 2.53, + "learning_rate": 1.8025721242793402e-05, + "loss": 1.4625, + "step": 32116 + }, + { + "epoch": 2.53, + "learning_rate": 1.801984722594852e-05, + "loss": 1.4586, + "step": 32117 + }, + { + "epoch": 2.53, + "learning_rate": 1.8013974105176006e-05, + "loss": 1.4351, + "step": 32118 + }, + { + "epoch": 2.53, + "learning_rate": 1.8008101880515808e-05, + "loss": 1.4379, + "step": 32119 + }, + { + "epoch": 2.53, + "learning_rate": 1.8002230552007764e-05, + "loss": 1.4636, + "step": 32120 + }, + { + "epoch": 2.53, + "learning_rate": 1.7996360119691688e-05, + "loss": 1.4226, + "step": 32121 + }, + { + "epoch": 2.53, + "learning_rate": 1.799049058360752e-05, + "loss": 1.4334, + "step": 32122 + }, + { + "epoch": 2.53, + "learning_rate": 1.7984621943795075e-05, + "loss": 1.4219, + "step": 32123 + }, + { + "epoch": 2.53, + "learning_rate": 1.7978754200294153e-05, + "loss": 1.3798, + "step": 32124 + }, + { + "epoch": 2.53, + "learning_rate": 1.7972887353144678e-05, + "loss": 1.4346, + "step": 32125 + }, + { + "epoch": 2.53, + "learning_rate": 1.7967021402386444e-05, + "loss": 1.3801, + "step": 32126 + }, + { + "epoch": 2.53, + "learning_rate": 1.7961156348059258e-05, + "loss": 1.4346, + "step": 32127 + }, + { + "epoch": 2.53, + "learning_rate": 1.7955292190202934e-05, + "loss": 1.4253, + "step": 32128 + }, + { + "epoch": 2.53, + "learning_rate": 1.7949428928857327e-05, + "loss": 1.4455, + "step": 32129 + }, + { + "epoch": 2.53, + "learning_rate": 1.794356656406224e-05, + "loss": 1.4743, + "step": 32130 + }, + { + "epoch": 2.53, + "learning_rate": 1.7937705095857417e-05, + "loss": 1.4475, + "step": 32131 + }, + { + "epoch": 2.53, + "learning_rate": 1.79318445242827e-05, + "loss": 1.4633, + "step": 32132 + }, + { + "epoch": 2.53, + "learning_rate": 1.792598484937792e-05, + "loss": 1.4355, + "step": 32133 + }, + { + "epoch": 2.53, + "learning_rate": 1.7920126071182815e-05, + "loss": 1.4338, + "step": 32134 + }, + { + "epoch": 2.53, + "learning_rate": 1.7914268189737137e-05, + "loss": 1.4294, + "step": 32135 + }, + { + "epoch": 2.53, + "learning_rate": 1.7908411205080713e-05, + "loss": 1.4607, + "step": 32136 + }, + { + "epoch": 2.53, + "learning_rate": 1.7902555117253287e-05, + "loss": 1.4431, + "step": 32137 + }, + { + "epoch": 2.53, + "learning_rate": 1.7896699926294572e-05, + "loss": 1.4576, + "step": 32138 + }, + { + "epoch": 2.53, + "learning_rate": 1.7890845632244404e-05, + "loss": 1.4479, + "step": 32139 + }, + { + "epoch": 2.53, + "learning_rate": 1.7884992235142486e-05, + "loss": 1.4156, + "step": 32140 + }, + { + "epoch": 2.53, + "learning_rate": 1.7879139735028537e-05, + "loss": 1.4654, + "step": 32141 + }, + { + "epoch": 2.53, + "learning_rate": 1.7873288131942354e-05, + "loss": 1.4928, + "step": 32142 + }, + { + "epoch": 2.53, + "learning_rate": 1.7867437425923625e-05, + "loss": 1.4753, + "step": 32143 + }, + { + "epoch": 2.53, + "learning_rate": 1.7861587617012087e-05, + "loss": 1.4714, + "step": 32144 + }, + { + "epoch": 2.53, + "learning_rate": 1.78557387052474e-05, + "loss": 1.4411, + "step": 32145 + }, + { + "epoch": 2.53, + "learning_rate": 1.784989069066936e-05, + "loss": 1.4875, + "step": 32146 + }, + { + "epoch": 2.53, + "learning_rate": 1.7844043573317647e-05, + "loss": 1.444, + "step": 32147 + }, + { + "epoch": 2.53, + "learning_rate": 1.783819735323191e-05, + "loss": 1.4627, + "step": 32148 + }, + { + "epoch": 2.53, + "learning_rate": 1.7832352030451886e-05, + "loss": 1.4882, + "step": 32149 + }, + { + "epoch": 2.53, + "learning_rate": 1.7826507605017276e-05, + "loss": 1.4395, + "step": 32150 + }, + { + "epoch": 2.53, + "learning_rate": 1.782066407696775e-05, + "loss": 1.4295, + "step": 32151 + }, + { + "epoch": 2.53, + "learning_rate": 1.7814821446342943e-05, + "loss": 1.4263, + "step": 32152 + }, + { + "epoch": 2.53, + "learning_rate": 1.780897971318257e-05, + "loss": 1.4443, + "step": 32153 + }, + { + "epoch": 2.53, + "learning_rate": 1.7803138877526285e-05, + "loss": 1.4511, + "step": 32154 + }, + { + "epoch": 2.53, + "learning_rate": 1.7797298939413706e-05, + "loss": 1.4404, + "step": 32155 + }, + { + "epoch": 2.53, + "learning_rate": 1.7791459898884535e-05, + "loss": 1.4692, + "step": 32156 + }, + { + "epoch": 2.53, + "learning_rate": 1.778562175597841e-05, + "loss": 1.4442, + "step": 32157 + }, + { + "epoch": 2.53, + "learning_rate": 1.7779784510734906e-05, + "loss": 1.445, + "step": 32158 + }, + { + "epoch": 2.53, + "learning_rate": 1.7773948163193736e-05, + "loss": 1.4739, + "step": 32159 + }, + { + "epoch": 2.53, + "learning_rate": 1.776811271339448e-05, + "loss": 1.4012, + "step": 32160 + }, + { + "epoch": 2.53, + "learning_rate": 1.776227816137677e-05, + "loss": 1.4935, + "step": 32161 + }, + { + "epoch": 2.53, + "learning_rate": 1.7756444507180197e-05, + "loss": 1.4845, + "step": 32162 + }, + { + "epoch": 2.53, + "learning_rate": 1.7750611750844373e-05, + "loss": 1.4759, + "step": 32163 + }, + { + "epoch": 2.53, + "learning_rate": 1.7744779892408955e-05, + "loss": 1.4559, + "step": 32164 + }, + { + "epoch": 2.53, + "learning_rate": 1.7738948931913494e-05, + "loss": 1.4793, + "step": 32165 + }, + { + "epoch": 2.53, + "learning_rate": 1.7733118869397555e-05, + "loss": 1.4597, + "step": 32166 + }, + { + "epoch": 2.53, + "learning_rate": 1.772728970490076e-05, + "loss": 1.4585, + "step": 32167 + }, + { + "epoch": 2.53, + "learning_rate": 1.772146143846269e-05, + "loss": 1.4295, + "step": 32168 + }, + { + "epoch": 2.53, + "learning_rate": 1.771563407012287e-05, + "loss": 1.4382, + "step": 32169 + }, + { + "epoch": 2.53, + "learning_rate": 1.7709807599920928e-05, + "loss": 1.4443, + "step": 32170 + }, + { + "epoch": 2.53, + "learning_rate": 1.7703982027896386e-05, + "loss": 1.4732, + "step": 32171 + }, + { + "epoch": 2.53, + "learning_rate": 1.769815735408876e-05, + "loss": 1.4485, + "step": 32172 + }, + { + "epoch": 2.53, + "learning_rate": 1.7692333578537672e-05, + "loss": 1.4404, + "step": 32173 + }, + { + "epoch": 2.53, + "learning_rate": 1.7686510701282617e-05, + "loss": 1.4922, + "step": 32174 + }, + { + "epoch": 2.53, + "learning_rate": 1.7680688722363123e-05, + "loss": 1.4543, + "step": 32175 + }, + { + "epoch": 2.53, + "learning_rate": 1.767486764181875e-05, + "loss": 1.4582, + "step": 32176 + }, + { + "epoch": 2.53, + "learning_rate": 1.7669047459689007e-05, + "loss": 1.4081, + "step": 32177 + }, + { + "epoch": 2.53, + "learning_rate": 1.7663228176013406e-05, + "loss": 1.4864, + "step": 32178 + }, + { + "epoch": 2.53, + "learning_rate": 1.76574097908314e-05, + "loss": 1.4739, + "step": 32179 + }, + { + "epoch": 2.53, + "learning_rate": 1.765159230418261e-05, + "loss": 1.4202, + "step": 32180 + }, + { + "epoch": 2.53, + "learning_rate": 1.7645775716106453e-05, + "loss": 1.4946, + "step": 32181 + }, + { + "epoch": 2.53, + "learning_rate": 1.763996002664243e-05, + "loss": 1.434, + "step": 32182 + }, + { + "epoch": 2.53, + "learning_rate": 1.763414523583006e-05, + "loss": 1.4537, + "step": 32183 + }, + { + "epoch": 2.53, + "learning_rate": 1.7628331343708796e-05, + "loss": 1.4246, + "step": 32184 + }, + { + "epoch": 2.53, + "learning_rate": 1.762251835031812e-05, + "loss": 1.4554, + "step": 32185 + }, + { + "epoch": 2.53, + "learning_rate": 1.7616706255697454e-05, + "loss": 1.4636, + "step": 32186 + }, + { + "epoch": 2.53, + "learning_rate": 1.761089505988633e-05, + "loss": 1.4523, + "step": 32187 + }, + { + "epoch": 2.53, + "learning_rate": 1.7605084762924186e-05, + "loss": 1.3838, + "step": 32188 + }, + { + "epoch": 2.53, + "learning_rate": 1.7599275364850407e-05, + "loss": 1.4278, + "step": 32189 + }, + { + "epoch": 2.53, + "learning_rate": 1.759346686570451e-05, + "loss": 1.4498, + "step": 32190 + }, + { + "epoch": 2.53, + "learning_rate": 1.7587659265525912e-05, + "loss": 1.457, + "step": 32191 + }, + { + "epoch": 2.53, + "learning_rate": 1.7581852564354015e-05, + "loss": 1.4394, + "step": 32192 + }, + { + "epoch": 2.53, + "learning_rate": 1.757604676222829e-05, + "loss": 1.4678, + "step": 32193 + }, + { + "epoch": 2.53, + "learning_rate": 1.7570241859188123e-05, + "loss": 1.4002, + "step": 32194 + }, + { + "epoch": 2.53, + "learning_rate": 1.7564437855272913e-05, + "loss": 1.4903, + "step": 32195 + }, + { + "epoch": 2.53, + "learning_rate": 1.7558634750522075e-05, + "loss": 1.4372, + "step": 32196 + }, + { + "epoch": 2.53, + "learning_rate": 1.7552832544975055e-05, + "loss": 1.4761, + "step": 32197 + }, + { + "epoch": 2.53, + "learning_rate": 1.7547031238671213e-05, + "loss": 1.4835, + "step": 32198 + }, + { + "epoch": 2.53, + "learning_rate": 1.75412308316499e-05, + "loss": 1.467, + "step": 32199 + }, + { + "epoch": 2.53, + "learning_rate": 1.7535431323950556e-05, + "loss": 1.4624, + "step": 32200 + }, + { + "epoch": 2.53, + "learning_rate": 1.7529632715612546e-05, + "loss": 1.4798, + "step": 32201 + }, + { + "epoch": 2.53, + "learning_rate": 1.7523835006675225e-05, + "loss": 1.407, + "step": 32202 + }, + { + "epoch": 2.53, + "learning_rate": 1.7518038197177925e-05, + "loss": 1.4468, + "step": 32203 + }, + { + "epoch": 2.53, + "learning_rate": 1.7512242287160066e-05, + "loss": 1.4454, + "step": 32204 + }, + { + "epoch": 2.53, + "learning_rate": 1.7506447276660985e-05, + "loss": 1.4502, + "step": 32205 + }, + { + "epoch": 2.53, + "learning_rate": 1.7500653165719965e-05, + "loss": 1.4651, + "step": 32206 + }, + { + "epoch": 2.53, + "learning_rate": 1.749485995437642e-05, + "loss": 1.4133, + "step": 32207 + }, + { + "epoch": 2.53, + "learning_rate": 1.7489067642669662e-05, + "loss": 1.3928, + "step": 32208 + }, + { + "epoch": 2.53, + "learning_rate": 1.748327623063897e-05, + "loss": 1.4168, + "step": 32209 + }, + { + "epoch": 2.53, + "learning_rate": 1.7477485718323698e-05, + "loss": 1.4815, + "step": 32210 + }, + { + "epoch": 2.53, + "learning_rate": 1.747169610576321e-05, + "loss": 1.4279, + "step": 32211 + }, + { + "epoch": 2.53, + "learning_rate": 1.7465907392996763e-05, + "loss": 1.455, + "step": 32212 + }, + { + "epoch": 2.53, + "learning_rate": 1.746011958006364e-05, + "loss": 1.4751, + "step": 32213 + }, + { + "epoch": 2.53, + "learning_rate": 1.7454332667003197e-05, + "loss": 1.4396, + "step": 32214 + }, + { + "epoch": 2.53, + "learning_rate": 1.744854665385468e-05, + "loss": 1.4287, + "step": 32215 + }, + { + "epoch": 2.53, + "learning_rate": 1.7442761540657358e-05, + "loss": 1.4284, + "step": 32216 + }, + { + "epoch": 2.53, + "learning_rate": 1.7436977327450567e-05, + "loss": 1.4288, + "step": 32217 + }, + { + "epoch": 2.53, + "learning_rate": 1.7431194014273546e-05, + "loss": 1.4065, + "step": 32218 + }, + { + "epoch": 2.54, + "learning_rate": 1.7425411601165562e-05, + "loss": 1.4756, + "step": 32219 + }, + { + "epoch": 2.54, + "learning_rate": 1.741963008816583e-05, + "loss": 1.453, + "step": 32220 + }, + { + "epoch": 2.54, + "learning_rate": 1.741384947531369e-05, + "loss": 1.4597, + "step": 32221 + }, + { + "epoch": 2.54, + "learning_rate": 1.7408069762648342e-05, + "loss": 1.4344, + "step": 32222 + }, + { + "epoch": 2.54, + "learning_rate": 1.7402290950209e-05, + "loss": 1.4442, + "step": 32223 + }, + { + "epoch": 2.54, + "learning_rate": 1.7396513038034958e-05, + "loss": 1.4639, + "step": 32224 + }, + { + "epoch": 2.54, + "learning_rate": 1.7390736026165415e-05, + "loss": 1.4583, + "step": 32225 + }, + { + "epoch": 2.54, + "learning_rate": 1.738495991463955e-05, + "loss": 1.4227, + "step": 32226 + }, + { + "epoch": 2.54, + "learning_rate": 1.737918470349664e-05, + "loss": 1.4048, + "step": 32227 + }, + { + "epoch": 2.54, + "learning_rate": 1.7373410392775916e-05, + "loss": 1.4645, + "step": 32228 + }, + { + "epoch": 2.54, + "learning_rate": 1.736763698251653e-05, + "loss": 1.4652, + "step": 32229 + }, + { + "epoch": 2.54, + "learning_rate": 1.736186447275767e-05, + "loss": 1.431, + "step": 32230 + }, + { + "epoch": 2.54, + "learning_rate": 1.73560928635386e-05, + "loss": 1.4261, + "step": 32231 + }, + { + "epoch": 2.54, + "learning_rate": 1.7350322154898446e-05, + "loss": 1.4589, + "step": 32232 + }, + { + "epoch": 2.54, + "learning_rate": 1.7344552346876365e-05, + "loss": 1.4259, + "step": 32233 + }, + { + "epoch": 2.54, + "learning_rate": 1.733878343951162e-05, + "loss": 1.4086, + "step": 32234 + }, + { + "epoch": 2.54, + "learning_rate": 1.7333015432843312e-05, + "loss": 1.4488, + "step": 32235 + }, + { + "epoch": 2.54, + "learning_rate": 1.7327248326910588e-05, + "loss": 1.4072, + "step": 32236 + }, + { + "epoch": 2.54, + "learning_rate": 1.7321482121752666e-05, + "loss": 1.5135, + "step": 32237 + }, + { + "epoch": 2.54, + "learning_rate": 1.731571681740867e-05, + "loss": 1.4318, + "step": 32238 + }, + { + "epoch": 2.54, + "learning_rate": 1.7309952413917717e-05, + "loss": 1.3922, + "step": 32239 + }, + { + "epoch": 2.54, + "learning_rate": 1.7304188911318957e-05, + "loss": 1.4261, + "step": 32240 + }, + { + "epoch": 2.54, + "learning_rate": 1.7298426309651544e-05, + "loss": 1.512, + "step": 32241 + }, + { + "epoch": 2.54, + "learning_rate": 1.7292664608954543e-05, + "loss": 1.4327, + "step": 32242 + }, + { + "epoch": 2.54, + "learning_rate": 1.728690380926716e-05, + "loss": 1.4269, + "step": 32243 + }, + { + "epoch": 2.54, + "learning_rate": 1.7281143910628432e-05, + "loss": 1.442, + "step": 32244 + }, + { + "epoch": 2.54, + "learning_rate": 1.7275384913077523e-05, + "loss": 1.4772, + "step": 32245 + }, + { + "epoch": 2.54, + "learning_rate": 1.7269626816653503e-05, + "loss": 1.4252, + "step": 32246 + }, + { + "epoch": 2.54, + "learning_rate": 1.7263869621395443e-05, + "loss": 1.4494, + "step": 32247 + }, + { + "epoch": 2.54, + "learning_rate": 1.725811332734249e-05, + "loss": 1.4303, + "step": 32248 + }, + { + "epoch": 2.54, + "learning_rate": 1.7252357934533707e-05, + "loss": 1.3363, + "step": 32249 + }, + { + "epoch": 2.54, + "learning_rate": 1.7246603443008118e-05, + "loss": 1.4312, + "step": 32250 + }, + { + "epoch": 2.54, + "learning_rate": 1.724084985280486e-05, + "loss": 1.4686, + "step": 32251 + }, + { + "epoch": 2.54, + "learning_rate": 1.7235097163962958e-05, + "loss": 1.4769, + "step": 32252 + }, + { + "epoch": 2.54, + "learning_rate": 1.7229345376521474e-05, + "loss": 1.4261, + "step": 32253 + }, + { + "epoch": 2.54, + "learning_rate": 1.7223594490519483e-05, + "loss": 1.4302, + "step": 32254 + }, + { + "epoch": 2.54, + "learning_rate": 1.7217844505996016e-05, + "loss": 1.443, + "step": 32255 + }, + { + "epoch": 2.54, + "learning_rate": 1.7212095422990107e-05, + "loss": 1.4889, + "step": 32256 + }, + { + "epoch": 2.54, + "learning_rate": 1.7206347241540762e-05, + "loss": 1.4858, + "step": 32257 + }, + { + "epoch": 2.54, + "learning_rate": 1.7200599961687035e-05, + "loss": 1.3917, + "step": 32258 + }, + { + "epoch": 2.54, + "learning_rate": 1.719485358346799e-05, + "loss": 1.4643, + "step": 32259 + }, + { + "epoch": 2.54, + "learning_rate": 1.7189108106922578e-05, + "loss": 1.4929, + "step": 32260 + }, + { + "epoch": 2.54, + "learning_rate": 1.7183363532089822e-05, + "loss": 1.44, + "step": 32261 + }, + { + "epoch": 2.54, + "learning_rate": 1.7177619859008758e-05, + "loss": 1.4562, + "step": 32262 + }, + { + "epoch": 2.54, + "learning_rate": 1.717187708771835e-05, + "loss": 1.4345, + "step": 32263 + }, + { + "epoch": 2.54, + "learning_rate": 1.716613521825759e-05, + "loss": 1.4327, + "step": 32264 + }, + { + "epoch": 2.54, + "learning_rate": 1.716039425066547e-05, + "loss": 1.4678, + "step": 32265 + }, + { + "epoch": 2.54, + "learning_rate": 1.715465418498099e-05, + "loss": 1.3999, + "step": 32266 + }, + { + "epoch": 2.54, + "learning_rate": 1.7148915021243036e-05, + "loss": 1.4682, + "step": 32267 + }, + { + "epoch": 2.54, + "learning_rate": 1.714317675949069e-05, + "loss": 1.4621, + "step": 32268 + }, + { + "epoch": 2.54, + "learning_rate": 1.7137439399762864e-05, + "loss": 1.4132, + "step": 32269 + }, + { + "epoch": 2.54, + "learning_rate": 1.7131702942098463e-05, + "loss": 1.4375, + "step": 32270 + }, + { + "epoch": 2.54, + "learning_rate": 1.7125967386536504e-05, + "loss": 1.4347, + "step": 32271 + }, + { + "epoch": 2.54, + "learning_rate": 1.7120232733115906e-05, + "loss": 1.4961, + "step": 32272 + }, + { + "epoch": 2.54, + "learning_rate": 1.7114498981875556e-05, + "loss": 1.3846, + "step": 32273 + }, + { + "epoch": 2.54, + "learning_rate": 1.710876613285444e-05, + "loss": 1.4736, + "step": 32274 + }, + { + "epoch": 2.54, + "learning_rate": 1.710303418609149e-05, + "loss": 1.434, + "step": 32275 + }, + { + "epoch": 2.54, + "learning_rate": 1.7097303141625594e-05, + "loss": 1.4238, + "step": 32276 + }, + { + "epoch": 2.54, + "learning_rate": 1.709157299949569e-05, + "loss": 1.4617, + "step": 32277 + }, + { + "epoch": 2.54, + "learning_rate": 1.7085843759740607e-05, + "loss": 1.4296, + "step": 32278 + }, + { + "epoch": 2.54, + "learning_rate": 1.708011542239934e-05, + "loss": 1.4381, + "step": 32279 + }, + { + "epoch": 2.54, + "learning_rate": 1.707438798751073e-05, + "loss": 1.4415, + "step": 32280 + }, + { + "epoch": 2.54, + "learning_rate": 1.7068661455113653e-05, + "loss": 1.4141, + "step": 32281 + }, + { + "epoch": 2.54, + "learning_rate": 1.7062935825247027e-05, + "loss": 1.4248, + "step": 32282 + }, + { + "epoch": 2.54, + "learning_rate": 1.70572110979497e-05, + "loss": 1.4462, + "step": 32283 + }, + { + "epoch": 2.54, + "learning_rate": 1.7051487273260515e-05, + "loss": 1.4402, + "step": 32284 + }, + { + "epoch": 2.54, + "learning_rate": 1.7045764351218404e-05, + "loss": 1.5021, + "step": 32285 + }, + { + "epoch": 2.54, + "learning_rate": 1.7040042331862187e-05, + "loss": 1.4734, + "step": 32286 + }, + { + "epoch": 2.54, + "learning_rate": 1.7034321215230677e-05, + "loss": 1.4656, + "step": 32287 + }, + { + "epoch": 2.54, + "learning_rate": 1.702860100136277e-05, + "loss": 1.4173, + "step": 32288 + }, + { + "epoch": 2.54, + "learning_rate": 1.7022881690297256e-05, + "loss": 1.4287, + "step": 32289 + }, + { + "epoch": 2.54, + "learning_rate": 1.7017163282073033e-05, + "loss": 1.4601, + "step": 32290 + }, + { + "epoch": 2.54, + "learning_rate": 1.7011445776728844e-05, + "loss": 1.4705, + "step": 32291 + }, + { + "epoch": 2.54, + "learning_rate": 1.7005729174303593e-05, + "loss": 1.5031, + "step": 32292 + }, + { + "epoch": 2.54, + "learning_rate": 1.7000013474836037e-05, + "loss": 1.4429, + "step": 32293 + }, + { + "epoch": 2.54, + "learning_rate": 1.699429867836496e-05, + "loss": 1.4944, + "step": 32294 + }, + { + "epoch": 2.54, + "learning_rate": 1.698858478492923e-05, + "loss": 1.4575, + "step": 32295 + }, + { + "epoch": 2.54, + "learning_rate": 1.6982871794567608e-05, + "loss": 1.3894, + "step": 32296 + }, + { + "epoch": 2.54, + "learning_rate": 1.6977159707318893e-05, + "loss": 1.4613, + "step": 32297 + }, + { + "epoch": 2.54, + "learning_rate": 1.6971448523221816e-05, + "loss": 1.4164, + "step": 32298 + }, + { + "epoch": 2.54, + "learning_rate": 1.6965738242315208e-05, + "loss": 1.4634, + "step": 32299 + }, + { + "epoch": 2.54, + "learning_rate": 1.6960028864637843e-05, + "loss": 1.41, + "step": 32300 + }, + { + "epoch": 2.54, + "learning_rate": 1.695432039022842e-05, + "loss": 1.4144, + "step": 32301 + }, + { + "epoch": 2.54, + "learning_rate": 1.6948612819125778e-05, + "loss": 1.4299, + "step": 32302 + }, + { + "epoch": 2.54, + "learning_rate": 1.6942906151368636e-05, + "loss": 1.497, + "step": 32303 + }, + { + "epoch": 2.54, + "learning_rate": 1.6937200386995707e-05, + "loss": 1.4532, + "step": 32304 + }, + { + "epoch": 2.54, + "learning_rate": 1.693149552604575e-05, + "loss": 1.4833, + "step": 32305 + }, + { + "epoch": 2.54, + "learning_rate": 1.6925791568557535e-05, + "loss": 1.4488, + "step": 32306 + }, + { + "epoch": 2.54, + "learning_rate": 1.692008851456976e-05, + "loss": 1.472, + "step": 32307 + }, + { + "epoch": 2.54, + "learning_rate": 1.6914386364121107e-05, + "loss": 1.4569, + "step": 32308 + }, + { + "epoch": 2.54, + "learning_rate": 1.690868511725037e-05, + "loss": 1.4191, + "step": 32309 + }, + { + "epoch": 2.54, + "learning_rate": 1.6902984773996214e-05, + "loss": 1.4241, + "step": 32310 + }, + { + "epoch": 2.54, + "learning_rate": 1.689728533439731e-05, + "loss": 1.4946, + "step": 32311 + }, + { + "epoch": 2.54, + "learning_rate": 1.6891586798492407e-05, + "loss": 1.3673, + "step": 32312 + }, + { + "epoch": 2.54, + "learning_rate": 1.6885889166320178e-05, + "loss": 1.3875, + "step": 32313 + }, + { + "epoch": 2.54, + "learning_rate": 1.6880192437919303e-05, + "loss": 1.4244, + "step": 32314 + }, + { + "epoch": 2.54, + "learning_rate": 1.687449661332844e-05, + "loss": 1.4481, + "step": 32315 + }, + { + "epoch": 2.54, + "learning_rate": 1.6868801692586308e-05, + "loss": 1.4642, + "step": 32316 + }, + { + "epoch": 2.54, + "learning_rate": 1.6863107675731542e-05, + "loss": 1.4658, + "step": 32317 + }, + { + "epoch": 2.54, + "learning_rate": 1.6857414562802772e-05, + "loss": 1.4626, + "step": 32318 + }, + { + "epoch": 2.54, + "learning_rate": 1.685172235383871e-05, + "loss": 1.4676, + "step": 32319 + }, + { + "epoch": 2.54, + "learning_rate": 1.684603104887795e-05, + "loss": 1.4357, + "step": 32320 + }, + { + "epoch": 2.54, + "learning_rate": 1.6840340647959183e-05, + "loss": 1.4847, + "step": 32321 + }, + { + "epoch": 2.54, + "learning_rate": 1.683465115112101e-05, + "loss": 1.4456, + "step": 32322 + }, + { + "epoch": 2.54, + "learning_rate": 1.682896255840208e-05, + "loss": 1.3916, + "step": 32323 + }, + { + "epoch": 2.54, + "learning_rate": 1.6823274869841e-05, + "loss": 1.4503, + "step": 32324 + }, + { + "epoch": 2.54, + "learning_rate": 1.6817588085476375e-05, + "loss": 1.425, + "step": 32325 + }, + { + "epoch": 2.54, + "learning_rate": 1.681190220534685e-05, + "loss": 1.4485, + "step": 32326 + }, + { + "epoch": 2.54, + "learning_rate": 1.6806217229491016e-05, + "loss": 1.4401, + "step": 32327 + }, + { + "epoch": 2.54, + "learning_rate": 1.6800533157947436e-05, + "loss": 1.4194, + "step": 32328 + }, + { + "epoch": 2.54, + "learning_rate": 1.6794849990754755e-05, + "loss": 1.4368, + "step": 32329 + }, + { + "epoch": 2.54, + "learning_rate": 1.6789167727951534e-05, + "loss": 1.5148, + "step": 32330 + }, + { + "epoch": 2.54, + "learning_rate": 1.678348636957635e-05, + "loss": 1.4447, + "step": 32331 + }, + { + "epoch": 2.54, + "learning_rate": 1.6777805915667764e-05, + "loss": 1.4511, + "step": 32332 + }, + { + "epoch": 2.54, + "learning_rate": 1.6772126366264364e-05, + "loss": 1.4345, + "step": 32333 + }, + { + "epoch": 2.54, + "learning_rate": 1.6766447721404725e-05, + "loss": 1.494, + "step": 32334 + }, + { + "epoch": 2.54, + "learning_rate": 1.6760769981127342e-05, + "loss": 1.4732, + "step": 32335 + }, + { + "epoch": 2.54, + "learning_rate": 1.6755093145470806e-05, + "loss": 1.3974, + "step": 32336 + }, + { + "epoch": 2.54, + "learning_rate": 1.674941721447368e-05, + "loss": 1.4778, + "step": 32337 + }, + { + "epoch": 2.54, + "learning_rate": 1.674374218817449e-05, + "loss": 1.4761, + "step": 32338 + }, + { + "epoch": 2.54, + "learning_rate": 1.6738068066611722e-05, + "loss": 1.4293, + "step": 32339 + }, + { + "epoch": 2.54, + "learning_rate": 1.6732394849823954e-05, + "loss": 1.4756, + "step": 32340 + }, + { + "epoch": 2.54, + "learning_rate": 1.672672253784968e-05, + "loss": 1.454, + "step": 32341 + }, + { + "epoch": 2.54, + "learning_rate": 1.6721051130727397e-05, + "loss": 1.4336, + "step": 32342 + }, + { + "epoch": 2.54, + "learning_rate": 1.6715380628495646e-05, + "loss": 1.4319, + "step": 32343 + }, + { + "epoch": 2.54, + "learning_rate": 1.6709711031192907e-05, + "loss": 1.4593, + "step": 32344 + }, + { + "epoch": 2.54, + "learning_rate": 1.6704042338857654e-05, + "loss": 1.4414, + "step": 32345 + }, + { + "epoch": 2.55, + "learning_rate": 1.6698374551528422e-05, + "loss": 1.4389, + "step": 32346 + }, + { + "epoch": 2.55, + "learning_rate": 1.6692707669243662e-05, + "loss": 1.4522, + "step": 32347 + }, + { + "epoch": 2.55, + "learning_rate": 1.6687041692041825e-05, + "loss": 1.418, + "step": 32348 + }, + { + "epoch": 2.55, + "learning_rate": 1.668137661996142e-05, + "loss": 1.461, + "step": 32349 + }, + { + "epoch": 2.55, + "learning_rate": 1.6675712453040925e-05, + "loss": 1.4604, + "step": 32350 + }, + { + "epoch": 2.55, + "learning_rate": 1.6670049191318748e-05, + "loss": 1.4446, + "step": 32351 + }, + { + "epoch": 2.55, + "learning_rate": 1.6664386834833305e-05, + "loss": 1.4736, + "step": 32352 + }, + { + "epoch": 2.55, + "learning_rate": 1.665872538362315e-05, + "loss": 1.433, + "step": 32353 + }, + { + "epoch": 2.55, + "learning_rate": 1.665306483772667e-05, + "loss": 1.4602, + "step": 32354 + }, + { + "epoch": 2.55, + "learning_rate": 1.66474051971823e-05, + "loss": 1.508, + "step": 32355 + }, + { + "epoch": 2.55, + "learning_rate": 1.664174646202841e-05, + "loss": 1.4707, + "step": 32356 + }, + { + "epoch": 2.55, + "learning_rate": 1.6636088632303517e-05, + "loss": 1.4507, + "step": 32357 + }, + { + "epoch": 2.55, + "learning_rate": 1.6630431708045978e-05, + "loss": 1.4706, + "step": 32358 + }, + { + "epoch": 2.55, + "learning_rate": 1.6624775689294174e-05, + "loss": 1.432, + "step": 32359 + }, + { + "epoch": 2.55, + "learning_rate": 1.6619120576086575e-05, + "loss": 1.4481, + "step": 32360 + }, + { + "epoch": 2.55, + "learning_rate": 1.6613466368461554e-05, + "loss": 1.442, + "step": 32361 + }, + { + "epoch": 2.55, + "learning_rate": 1.6607813066457442e-05, + "loss": 1.5083, + "step": 32362 + }, + { + "epoch": 2.55, + "learning_rate": 1.6602160670112697e-05, + "loss": 1.4707, + "step": 32363 + }, + { + "epoch": 2.55, + "learning_rate": 1.6596509179465665e-05, + "loss": 1.4769, + "step": 32364 + }, + { + "epoch": 2.55, + "learning_rate": 1.6590858594554705e-05, + "loss": 1.4355, + "step": 32365 + }, + { + "epoch": 2.55, + "learning_rate": 1.6585208915418203e-05, + "loss": 1.4771, + "step": 32366 + }, + { + "epoch": 2.55, + "learning_rate": 1.6579560142094524e-05, + "loss": 1.456, + "step": 32367 + }, + { + "epoch": 2.55, + "learning_rate": 1.657391227462197e-05, + "loss": 1.4954, + "step": 32368 + }, + { + "epoch": 2.55, + "learning_rate": 1.6568265313038914e-05, + "loss": 1.3981, + "step": 32369 + }, + { + "epoch": 2.55, + "learning_rate": 1.6562619257383743e-05, + "loss": 1.4977, + "step": 32370 + }, + { + "epoch": 2.55, + "learning_rate": 1.6556974107694737e-05, + "loss": 1.3972, + "step": 32371 + }, + { + "epoch": 2.55, + "learning_rate": 1.6551329864010237e-05, + "loss": 1.3905, + "step": 32372 + }, + { + "epoch": 2.55, + "learning_rate": 1.6545686526368545e-05, + "loss": 1.4192, + "step": 32373 + }, + { + "epoch": 2.55, + "learning_rate": 1.654004409480803e-05, + "loss": 1.452, + "step": 32374 + }, + { + "epoch": 2.55, + "learning_rate": 1.6534402569366946e-05, + "loss": 1.4552, + "step": 32375 + }, + { + "epoch": 2.55, + "learning_rate": 1.652876195008361e-05, + "loss": 1.4369, + "step": 32376 + }, + { + "epoch": 2.55, + "learning_rate": 1.652312223699634e-05, + "loss": 1.4743, + "step": 32377 + }, + { + "epoch": 2.55, + "learning_rate": 1.6517483430143408e-05, + "loss": 1.4393, + "step": 32378 + }, + { + "epoch": 2.55, + "learning_rate": 1.6511845529563084e-05, + "loss": 1.4327, + "step": 32379 + }, + { + "epoch": 2.55, + "learning_rate": 1.6506208535293686e-05, + "loss": 1.4112, + "step": 32380 + }, + { + "epoch": 2.55, + "learning_rate": 1.6500572447373468e-05, + "loss": 1.4282, + "step": 32381 + }, + { + "epoch": 2.55, + "learning_rate": 1.6494937265840662e-05, + "loss": 1.4736, + "step": 32382 + }, + { + "epoch": 2.55, + "learning_rate": 1.648930299073356e-05, + "loss": 1.4524, + "step": 32383 + }, + { + "epoch": 2.55, + "learning_rate": 1.6483669622090427e-05, + "loss": 1.4424, + "step": 32384 + }, + { + "epoch": 2.55, + "learning_rate": 1.647803715994952e-05, + "loss": 1.4716, + "step": 32385 + }, + { + "epoch": 2.55, + "learning_rate": 1.6472405604349004e-05, + "loss": 1.5036, + "step": 32386 + }, + { + "epoch": 2.55, + "learning_rate": 1.6466774955327216e-05, + "loss": 1.4642, + "step": 32387 + }, + { + "epoch": 2.55, + "learning_rate": 1.6461145212922328e-05, + "loss": 1.4372, + "step": 32388 + }, + { + "epoch": 2.55, + "learning_rate": 1.6455516377172573e-05, + "loss": 1.436, + "step": 32389 + }, + { + "epoch": 2.55, + "learning_rate": 1.6449888448116137e-05, + "loss": 1.4397, + "step": 32390 + }, + { + "epoch": 2.55, + "learning_rate": 1.6444261425791294e-05, + "loss": 1.4315, + "step": 32391 + }, + { + "epoch": 2.55, + "learning_rate": 1.643863531023621e-05, + "loss": 1.4753, + "step": 32392 + }, + { + "epoch": 2.55, + "learning_rate": 1.6433010101489052e-05, + "loss": 1.446, + "step": 32393 + }, + { + "epoch": 2.55, + "learning_rate": 1.6427385799588077e-05, + "loss": 1.5026, + "step": 32394 + }, + { + "epoch": 2.55, + "learning_rate": 1.6421762404571452e-05, + "loss": 1.4716, + "step": 32395 + }, + { + "epoch": 2.55, + "learning_rate": 1.64161399164773e-05, + "loss": 1.4526, + "step": 32396 + }, + { + "epoch": 2.55, + "learning_rate": 1.6410518335343885e-05, + "loss": 1.4286, + "step": 32397 + }, + { + "epoch": 2.55, + "learning_rate": 1.6404897661209316e-05, + "loss": 1.4286, + "step": 32398 + }, + { + "epoch": 2.55, + "learning_rate": 1.639927789411174e-05, + "loss": 1.3563, + "step": 32399 + }, + { + "epoch": 2.55, + "learning_rate": 1.6393659034089346e-05, + "loss": 1.4419, + "step": 32400 + }, + { + "epoch": 2.55, + "learning_rate": 1.638804108118032e-05, + "loss": 1.4318, + "step": 32401 + }, + { + "epoch": 2.55, + "learning_rate": 1.638242403542275e-05, + "loss": 1.4249, + "step": 32402 + }, + { + "epoch": 2.55, + "learning_rate": 1.637680789685475e-05, + "loss": 1.4683, + "step": 32403 + }, + { + "epoch": 2.55, + "learning_rate": 1.637119266551451e-05, + "loss": 1.5127, + "step": 32404 + }, + { + "epoch": 2.55, + "learning_rate": 1.6365578341440134e-05, + "loss": 1.4796, + "step": 32405 + }, + { + "epoch": 2.55, + "learning_rate": 1.6359964924669704e-05, + "loss": 1.3922, + "step": 32406 + }, + { + "epoch": 2.55, + "learning_rate": 1.635435241524141e-05, + "loss": 1.4912, + "step": 32407 + }, + { + "epoch": 2.55, + "learning_rate": 1.634874081319329e-05, + "loss": 1.4626, + "step": 32408 + }, + { + "epoch": 2.55, + "learning_rate": 1.6343130118563476e-05, + "loss": 1.4465, + "step": 32409 + }, + { + "epoch": 2.55, + "learning_rate": 1.6337520331390018e-05, + "loss": 1.4062, + "step": 32410 + }, + { + "epoch": 2.55, + "learning_rate": 1.633191145171108e-05, + "loss": 1.3992, + "step": 32411 + }, + { + "epoch": 2.55, + "learning_rate": 1.6326303479564682e-05, + "loss": 1.4629, + "step": 32412 + }, + { + "epoch": 2.55, + "learning_rate": 1.6320696414988875e-05, + "loss": 1.4631, + "step": 32413 + }, + { + "epoch": 2.55, + "learning_rate": 1.6315090258021823e-05, + "loss": 1.4665, + "step": 32414 + }, + { + "epoch": 2.55, + "learning_rate": 1.6309485008701494e-05, + "loss": 1.4488, + "step": 32415 + }, + { + "epoch": 2.55, + "learning_rate": 1.6303880667066012e-05, + "loss": 1.4386, + "step": 32416 + }, + { + "epoch": 2.55, + "learning_rate": 1.629827723315339e-05, + "loss": 1.4185, + "step": 32417 + }, + { + "epoch": 2.55, + "learning_rate": 1.6292674707001684e-05, + "loss": 1.4212, + "step": 32418 + }, + { + "epoch": 2.55, + "learning_rate": 1.628707308864895e-05, + "loss": 1.4094, + "step": 32419 + }, + { + "epoch": 2.55, + "learning_rate": 1.628147237813317e-05, + "loss": 1.4498, + "step": 32420 + }, + { + "epoch": 2.55, + "learning_rate": 1.6275872575492434e-05, + "loss": 1.4646, + "step": 32421 + }, + { + "epoch": 2.55, + "learning_rate": 1.6270273680764705e-05, + "loss": 1.4444, + "step": 32422 + }, + { + "epoch": 2.55, + "learning_rate": 1.626467569398801e-05, + "loss": 1.4508, + "step": 32423 + }, + { + "epoch": 2.55, + "learning_rate": 1.62590786152004e-05, + "loss": 1.4386, + "step": 32424 + }, + { + "epoch": 2.55, + "learning_rate": 1.6253482444439824e-05, + "loss": 1.4427, + "step": 32425 + }, + { + "epoch": 2.55, + "learning_rate": 1.6247887181744307e-05, + "loss": 1.421, + "step": 32426 + }, + { + "epoch": 2.55, + "learning_rate": 1.6242292827151797e-05, + "loss": 1.4525, + "step": 32427 + }, + { + "epoch": 2.55, + "learning_rate": 1.6236699380700317e-05, + "loss": 1.4424, + "step": 32428 + }, + { + "epoch": 2.55, + "learning_rate": 1.6231106842427854e-05, + "loss": 1.4003, + "step": 32429 + }, + { + "epoch": 2.55, + "learning_rate": 1.622551521237231e-05, + "loss": 1.4606, + "step": 32430 + }, + { + "epoch": 2.55, + "learning_rate": 1.62199244905717e-05, + "loss": 1.4367, + "step": 32431 + }, + { + "epoch": 2.55, + "learning_rate": 1.6214334677064017e-05, + "loss": 1.4257, + "step": 32432 + }, + { + "epoch": 2.55, + "learning_rate": 1.620874577188716e-05, + "loss": 1.4184, + "step": 32433 + }, + { + "epoch": 2.55, + "learning_rate": 1.6203157775079067e-05, + "loss": 1.437, + "step": 32434 + }, + { + "epoch": 2.55, + "learning_rate": 1.6197570686677725e-05, + "loss": 1.412, + "step": 32435 + }, + { + "epoch": 2.55, + "learning_rate": 1.6191984506721035e-05, + "loss": 1.4659, + "step": 32436 + }, + { + "epoch": 2.55, + "learning_rate": 1.61863992352469e-05, + "loss": 1.4935, + "step": 32437 + }, + { + "epoch": 2.55, + "learning_rate": 1.618081487229329e-05, + "loss": 1.4292, + "step": 32438 + }, + { + "epoch": 2.55, + "learning_rate": 1.617523141789811e-05, + "loss": 1.4503, + "step": 32439 + }, + { + "epoch": 2.55, + "learning_rate": 1.6169648872099227e-05, + "loss": 1.4613, + "step": 32440 + }, + { + "epoch": 2.55, + "learning_rate": 1.6164067234934613e-05, + "loss": 1.4803, + "step": 32441 + }, + { + "epoch": 2.55, + "learning_rate": 1.615848650644212e-05, + "loss": 1.5, + "step": 32442 + }, + { + "epoch": 2.55, + "learning_rate": 1.6152906686659634e-05, + "loss": 1.4196, + "step": 32443 + }, + { + "epoch": 2.55, + "learning_rate": 1.6147327775625025e-05, + "loss": 1.42, + "step": 32444 + }, + { + "epoch": 2.55, + "learning_rate": 1.614174977337623e-05, + "loss": 1.4866, + "step": 32445 + }, + { + "epoch": 2.55, + "learning_rate": 1.613617267995105e-05, + "loss": 1.4047, + "step": 32446 + }, + { + "epoch": 2.55, + "learning_rate": 1.613059649538739e-05, + "loss": 1.4337, + "step": 32447 + }, + { + "epoch": 2.55, + "learning_rate": 1.6125021219723118e-05, + "loss": 1.4734, + "step": 32448 + }, + { + "epoch": 2.55, + "learning_rate": 1.611944685299609e-05, + "loss": 1.4729, + "step": 32449 + }, + { + "epoch": 2.55, + "learning_rate": 1.6113873395244138e-05, + "loss": 1.4672, + "step": 32450 + }, + { + "epoch": 2.55, + "learning_rate": 1.610830084650507e-05, + "loss": 1.4507, + "step": 32451 + }, + { + "epoch": 2.55, + "learning_rate": 1.6102729206816765e-05, + "loss": 1.4366, + "step": 32452 + }, + { + "epoch": 2.55, + "learning_rate": 1.6097158476217055e-05, + "loss": 1.4576, + "step": 32453 + }, + { + "epoch": 2.55, + "learning_rate": 1.6091588654743716e-05, + "loss": 1.4187, + "step": 32454 + }, + { + "epoch": 2.55, + "learning_rate": 1.6086019742434604e-05, + "loss": 1.4446, + "step": 32455 + }, + { + "epoch": 2.55, + "learning_rate": 1.6080451739327537e-05, + "loss": 1.4436, + "step": 32456 + }, + { + "epoch": 2.55, + "learning_rate": 1.6074884645460255e-05, + "loss": 1.4247, + "step": 32457 + }, + { + "epoch": 2.55, + "learning_rate": 1.6069318460870645e-05, + "loss": 1.4874, + "step": 32458 + }, + { + "epoch": 2.55, + "learning_rate": 1.6063753185596457e-05, + "loss": 1.3946, + "step": 32459 + }, + { + "epoch": 2.55, + "learning_rate": 1.605818881967543e-05, + "loss": 1.4628, + "step": 32460 + }, + { + "epoch": 2.55, + "learning_rate": 1.6052625363145428e-05, + "loss": 1.5079, + "step": 32461 + }, + { + "epoch": 2.55, + "learning_rate": 1.6047062816044142e-05, + "loss": 1.4431, + "step": 32462 + }, + { + "epoch": 2.55, + "learning_rate": 1.604150117840941e-05, + "loss": 1.4601, + "step": 32463 + }, + { + "epoch": 2.55, + "learning_rate": 1.6035940450278916e-05, + "loss": 1.4341, + "step": 32464 + }, + { + "epoch": 2.55, + "learning_rate": 1.6030380631690514e-05, + "loss": 1.431, + "step": 32465 + }, + { + "epoch": 2.55, + "learning_rate": 1.6024821722681873e-05, + "loss": 1.4626, + "step": 32466 + }, + { + "epoch": 2.55, + "learning_rate": 1.601926372329078e-05, + "loss": 1.4429, + "step": 32467 + }, + { + "epoch": 2.55, + "learning_rate": 1.6013706633554907e-05, + "loss": 1.4427, + "step": 32468 + }, + { + "epoch": 2.55, + "learning_rate": 1.600815045351207e-05, + "loss": 1.4196, + "step": 32469 + }, + { + "epoch": 2.55, + "learning_rate": 1.600259518319994e-05, + "loss": 1.4345, + "step": 32470 + }, + { + "epoch": 2.55, + "learning_rate": 1.5997040822656205e-05, + "loss": 1.4658, + "step": 32471 + }, + { + "epoch": 2.55, + "learning_rate": 1.5991487371918647e-05, + "loss": 1.4314, + "step": 32472 + }, + { + "epoch": 2.56, + "learning_rate": 1.5985934831024945e-05, + "loss": 1.4512, + "step": 32473 + }, + { + "epoch": 2.56, + "learning_rate": 1.598038320001276e-05, + "loss": 1.3844, + "step": 32474 + }, + { + "epoch": 2.56, + "learning_rate": 1.5974832478919847e-05, + "loss": 1.5001, + "step": 32475 + }, + { + "epoch": 2.56, + "learning_rate": 1.5969282667783846e-05, + "loss": 1.4566, + "step": 32476 + }, + { + "epoch": 2.56, + "learning_rate": 1.596373376664244e-05, + "loss": 1.4218, + "step": 32477 + }, + { + "epoch": 2.56, + "learning_rate": 1.59581857755333e-05, + "loss": 1.4358, + "step": 32478 + }, + { + "epoch": 2.56, + "learning_rate": 1.5952638694494146e-05, + "loss": 1.4503, + "step": 32479 + }, + { + "epoch": 2.56, + "learning_rate": 1.5947092523562598e-05, + "loss": 1.4503, + "step": 32480 + }, + { + "epoch": 2.56, + "learning_rate": 1.5941547262776276e-05, + "loss": 1.4056, + "step": 32481 + }, + { + "epoch": 2.56, + "learning_rate": 1.593600291217292e-05, + "loss": 1.4782, + "step": 32482 + }, + { + "epoch": 2.56, + "learning_rate": 1.593045947179011e-05, + "loss": 1.4393, + "step": 32483 + }, + { + "epoch": 2.56, + "learning_rate": 1.59249169416655e-05, + "loss": 1.4148, + "step": 32484 + }, + { + "epoch": 2.56, + "learning_rate": 1.5919375321836664e-05, + "loss": 1.4471, + "step": 32485 + }, + { + "epoch": 2.56, + "learning_rate": 1.5913834612341337e-05, + "loss": 1.5213, + "step": 32486 + }, + { + "epoch": 2.56, + "learning_rate": 1.5908294813217053e-05, + "loss": 1.4709, + "step": 32487 + }, + { + "epoch": 2.56, + "learning_rate": 1.5902755924501435e-05, + "loss": 1.4879, + "step": 32488 + }, + { + "epoch": 2.56, + "learning_rate": 1.5897217946232138e-05, + "loss": 1.4663, + "step": 32489 + }, + { + "epoch": 2.56, + "learning_rate": 1.589168087844671e-05, + "loss": 1.4352, + "step": 32490 + }, + { + "epoch": 2.56, + "learning_rate": 1.588614472118274e-05, + "loss": 1.4188, + "step": 32491 + }, + { + "epoch": 2.56, + "learning_rate": 1.588060947447787e-05, + "loss": 1.4922, + "step": 32492 + }, + { + "epoch": 2.56, + "learning_rate": 1.5875075138369627e-05, + "loss": 1.4286, + "step": 32493 + }, + { + "epoch": 2.56, + "learning_rate": 1.5869541712895617e-05, + "loss": 1.4395, + "step": 32494 + }, + { + "epoch": 2.56, + "learning_rate": 1.586400919809338e-05, + "loss": 1.4807, + "step": 32495 + }, + { + "epoch": 2.56, + "learning_rate": 1.5858477594000534e-05, + "loss": 1.3964, + "step": 32496 + }, + { + "epoch": 2.56, + "learning_rate": 1.5852946900654583e-05, + "loss": 1.4342, + "step": 32497 + }, + { + "epoch": 2.56, + "learning_rate": 1.584741711809308e-05, + "loss": 1.4875, + "step": 32498 + }, + { + "epoch": 2.56, + "learning_rate": 1.5841888246353612e-05, + "loss": 1.4361, + "step": 32499 + }, + { + "epoch": 2.56, + "learning_rate": 1.583636028547368e-05, + "loss": 1.4575, + "step": 32500 + }, + { + "epoch": 2.56, + "learning_rate": 1.5830833235490793e-05, + "loss": 1.4611, + "step": 32501 + }, + { + "epoch": 2.56, + "learning_rate": 1.5825307096442546e-05, + "loss": 1.4543, + "step": 32502 + }, + { + "epoch": 2.56, + "learning_rate": 1.5819781868366416e-05, + "loss": 1.4794, + "step": 32503 + }, + { + "epoch": 2.56, + "learning_rate": 1.581425755129992e-05, + "loss": 1.4544, + "step": 32504 + }, + { + "epoch": 2.56, + "learning_rate": 1.5808734145280526e-05, + "loss": 1.449, + "step": 32505 + }, + { + "epoch": 2.56, + "learning_rate": 1.5803211650345827e-05, + "loss": 1.4415, + "step": 32506 + }, + { + "epoch": 2.56, + "learning_rate": 1.5797690066533254e-05, + "loss": 1.4168, + "step": 32507 + }, + { + "epoch": 2.56, + "learning_rate": 1.5792169393880278e-05, + "loss": 1.4822, + "step": 32508 + }, + { + "epoch": 2.56, + "learning_rate": 1.5786649632424404e-05, + "loss": 1.4311, + "step": 32509 + }, + { + "epoch": 2.56, + "learning_rate": 1.578113078220315e-05, + "loss": 1.4255, + "step": 32510 + }, + { + "epoch": 2.56, + "learning_rate": 1.5775612843253938e-05, + "loss": 1.4235, + "step": 32511 + }, + { + "epoch": 2.56, + "learning_rate": 1.577009581561422e-05, + "loss": 1.4604, + "step": 32512 + }, + { + "epoch": 2.56, + "learning_rate": 1.576457969932152e-05, + "loss": 1.4806, + "step": 32513 + }, + { + "epoch": 2.56, + "learning_rate": 1.575906449441323e-05, + "loss": 1.4607, + "step": 32514 + }, + { + "epoch": 2.56, + "learning_rate": 1.5753550200926784e-05, + "loss": 1.4444, + "step": 32515 + }, + { + "epoch": 2.56, + "learning_rate": 1.5748036818899677e-05, + "loss": 1.3905, + "step": 32516 + }, + { + "epoch": 2.56, + "learning_rate": 1.5742524348369333e-05, + "loss": 1.4516, + "step": 32517 + }, + { + "epoch": 2.56, + "learning_rate": 1.5737012789373105e-05, + "loss": 1.3773, + "step": 32518 + }, + { + "epoch": 2.56, + "learning_rate": 1.573150214194851e-05, + "loss": 1.4616, + "step": 32519 + }, + { + "epoch": 2.56, + "learning_rate": 1.572599240613292e-05, + "loss": 1.4408, + "step": 32520 + }, + { + "epoch": 2.56, + "learning_rate": 1.5720483581963737e-05, + "loss": 1.4701, + "step": 32521 + }, + { + "epoch": 2.56, + "learning_rate": 1.571497566947835e-05, + "loss": 1.418, + "step": 32522 + }, + { + "epoch": 2.56, + "learning_rate": 1.5709468668714197e-05, + "loss": 1.4034, + "step": 32523 + }, + { + "epoch": 2.56, + "learning_rate": 1.5703962579708644e-05, + "loss": 1.4345, + "step": 32524 + }, + { + "epoch": 2.56, + "learning_rate": 1.569845740249905e-05, + "loss": 1.4629, + "step": 32525 + }, + { + "epoch": 2.56, + "learning_rate": 1.569295313712281e-05, + "loss": 1.4348, + "step": 32526 + }, + { + "epoch": 2.56, + "learning_rate": 1.5687449783617334e-05, + "loss": 1.4043, + "step": 32527 + }, + { + "epoch": 2.56, + "learning_rate": 1.568194734201994e-05, + "loss": 1.4124, + "step": 32528 + }, + { + "epoch": 2.56, + "learning_rate": 1.5676445812367983e-05, + "loss": 1.4621, + "step": 32529 + }, + { + "epoch": 2.56, + "learning_rate": 1.5670945194698864e-05, + "loss": 1.4156, + "step": 32530 + }, + { + "epoch": 2.56, + "learning_rate": 1.5665445489049906e-05, + "loss": 1.4578, + "step": 32531 + }, + { + "epoch": 2.56, + "learning_rate": 1.565994669545839e-05, + "loss": 1.4174, + "step": 32532 + }, + { + "epoch": 2.56, + "learning_rate": 1.5654448813961744e-05, + "loss": 1.4275, + "step": 32533 + }, + { + "epoch": 2.56, + "learning_rate": 1.5648951844597268e-05, + "loss": 1.466, + "step": 32534 + }, + { + "epoch": 2.56, + "learning_rate": 1.5643455787402214e-05, + "loss": 1.4407, + "step": 32535 + }, + { + "epoch": 2.56, + "learning_rate": 1.5637960642413988e-05, + "loss": 1.4638, + "step": 32536 + }, + { + "epoch": 2.56, + "learning_rate": 1.5632466409669857e-05, + "loss": 1.4693, + "step": 32537 + }, + { + "epoch": 2.56, + "learning_rate": 1.5626973089207146e-05, + "loss": 1.4587, + "step": 32538 + }, + { + "epoch": 2.56, + "learning_rate": 1.5621480681063087e-05, + "loss": 1.3954, + "step": 32539 + }, + { + "epoch": 2.56, + "learning_rate": 1.5615989185275034e-05, + "loss": 1.4322, + "step": 32540 + }, + { + "epoch": 2.56, + "learning_rate": 1.5610498601880277e-05, + "loss": 1.4983, + "step": 32541 + }, + { + "epoch": 2.56, + "learning_rate": 1.560500893091607e-05, + "loss": 1.4489, + "step": 32542 + }, + { + "epoch": 2.56, + "learning_rate": 1.5599520172419662e-05, + "loss": 1.3997, + "step": 32543 + }, + { + "epoch": 2.56, + "learning_rate": 1.559403232642836e-05, + "loss": 1.4291, + "step": 32544 + }, + { + "epoch": 2.56, + "learning_rate": 1.558854539297943e-05, + "loss": 1.507, + "step": 32545 + }, + { + "epoch": 2.56, + "learning_rate": 1.5583059372110045e-05, + "loss": 1.4502, + "step": 32546 + }, + { + "epoch": 2.56, + "learning_rate": 1.5577574263857563e-05, + "loss": 1.4653, + "step": 32547 + }, + { + "epoch": 2.56, + "learning_rate": 1.5572090068259162e-05, + "loss": 1.4489, + "step": 32548 + }, + { + "epoch": 2.56, + "learning_rate": 1.5566606785352053e-05, + "loss": 1.4333, + "step": 32549 + }, + { + "epoch": 2.56, + "learning_rate": 1.5561124415173536e-05, + "loss": 1.4094, + "step": 32550 + }, + { + "epoch": 2.56, + "learning_rate": 1.5555642957760783e-05, + "loss": 1.4405, + "step": 32551 + }, + { + "epoch": 2.56, + "learning_rate": 1.5550162413150998e-05, + "loss": 1.4377, + "step": 32552 + }, + { + "epoch": 2.56, + "learning_rate": 1.5544682781381444e-05, + "loss": 1.4676, + "step": 32553 + }, + { + "epoch": 2.56, + "learning_rate": 1.5539204062489303e-05, + "loss": 1.4286, + "step": 32554 + }, + { + "epoch": 2.56, + "learning_rate": 1.5533726256511752e-05, + "loss": 1.4431, + "step": 32555 + }, + { + "epoch": 2.56, + "learning_rate": 1.552824936348595e-05, + "loss": 1.4988, + "step": 32556 + }, + { + "epoch": 2.56, + "learning_rate": 1.5522773383449165e-05, + "loss": 1.3952, + "step": 32557 + }, + { + "epoch": 2.56, + "learning_rate": 1.5517298316438552e-05, + "loss": 1.466, + "step": 32558 + }, + { + "epoch": 2.56, + "learning_rate": 1.5511824162491248e-05, + "loss": 1.4542, + "step": 32559 + }, + { + "epoch": 2.56, + "learning_rate": 1.5506350921644455e-05, + "loss": 1.4492, + "step": 32560 + }, + { + "epoch": 2.56, + "learning_rate": 1.5500878593935328e-05, + "loss": 1.3659, + "step": 32561 + }, + { + "epoch": 2.56, + "learning_rate": 1.549540717940102e-05, + "loss": 1.5246, + "step": 32562 + }, + { + "epoch": 2.56, + "learning_rate": 1.5489936678078633e-05, + "loss": 1.4515, + "step": 32563 + }, + { + "epoch": 2.56, + "learning_rate": 1.5484467090005376e-05, + "loss": 1.4508, + "step": 32564 + }, + { + "epoch": 2.56, + "learning_rate": 1.5478998415218363e-05, + "loss": 1.4389, + "step": 32565 + }, + { + "epoch": 2.56, + "learning_rate": 1.5473530653754668e-05, + "loss": 1.4443, + "step": 32566 + }, + { + "epoch": 2.56, + "learning_rate": 1.546806380565151e-05, + "loss": 1.426, + "step": 32567 + }, + { + "epoch": 2.56, + "learning_rate": 1.5462597870945943e-05, + "loss": 1.4076, + "step": 32568 + }, + { + "epoch": 2.56, + "learning_rate": 1.5457132849675086e-05, + "loss": 1.5049, + "step": 32569 + }, + { + "epoch": 2.56, + "learning_rate": 1.5451668741876062e-05, + "loss": 1.4308, + "step": 32570 + }, + { + "epoch": 2.56, + "learning_rate": 1.5446205547585955e-05, + "loss": 1.3974, + "step": 32571 + }, + { + "epoch": 2.56, + "learning_rate": 1.5440743266841837e-05, + "loss": 1.4617, + "step": 32572 + }, + { + "epoch": 2.56, + "learning_rate": 1.543528189968081e-05, + "loss": 1.4673, + "step": 32573 + }, + { + "epoch": 2.56, + "learning_rate": 1.5429821446140002e-05, + "loss": 1.4327, + "step": 32574 + }, + { + "epoch": 2.56, + "learning_rate": 1.5424361906256438e-05, + "loss": 1.4748, + "step": 32575 + }, + { + "epoch": 2.56, + "learning_rate": 1.5418903280067162e-05, + "loss": 1.4782, + "step": 32576 + }, + { + "epoch": 2.56, + "learning_rate": 1.5413445567609294e-05, + "loss": 1.4232, + "step": 32577 + }, + { + "epoch": 2.56, + "learning_rate": 1.5407988768919853e-05, + "loss": 1.4735, + "step": 32578 + }, + { + "epoch": 2.56, + "learning_rate": 1.5402532884035894e-05, + "loss": 1.4151, + "step": 32579 + }, + { + "epoch": 2.56, + "learning_rate": 1.5397077912994438e-05, + "loss": 1.4633, + "step": 32580 + }, + { + "epoch": 2.56, + "learning_rate": 1.539162385583257e-05, + "loss": 1.4822, + "step": 32581 + }, + { + "epoch": 2.56, + "learning_rate": 1.5386170712587293e-05, + "loss": 1.4494, + "step": 32582 + }, + { + "epoch": 2.56, + "learning_rate": 1.5380718483295613e-05, + "loss": 1.456, + "step": 32583 + }, + { + "epoch": 2.56, + "learning_rate": 1.537526716799458e-05, + "loss": 1.4293, + "step": 32584 + }, + { + "epoch": 2.56, + "learning_rate": 1.5369816766721187e-05, + "loss": 1.4445, + "step": 32585 + }, + { + "epoch": 2.56, + "learning_rate": 1.5364367279512417e-05, + "loss": 1.4562, + "step": 32586 + }, + { + "epoch": 2.56, + "learning_rate": 1.5358918706405345e-05, + "loss": 1.4641, + "step": 32587 + }, + { + "epoch": 2.56, + "learning_rate": 1.5353471047436866e-05, + "loss": 1.4425, + "step": 32588 + }, + { + "epoch": 2.56, + "learning_rate": 1.534802430264404e-05, + "loss": 1.4029, + "step": 32589 + }, + { + "epoch": 2.56, + "learning_rate": 1.5342578472063805e-05, + "loss": 1.4413, + "step": 32590 + }, + { + "epoch": 2.56, + "learning_rate": 1.533713355573316e-05, + "loss": 1.3982, + "step": 32591 + }, + { + "epoch": 2.56, + "learning_rate": 1.533168955368908e-05, + "loss": 1.4699, + "step": 32592 + }, + { + "epoch": 2.56, + "learning_rate": 1.5326246465968482e-05, + "loss": 1.4329, + "step": 32593 + }, + { + "epoch": 2.56, + "learning_rate": 1.532080429260839e-05, + "loss": 1.5017, + "step": 32594 + }, + { + "epoch": 2.56, + "learning_rate": 1.5315363033645705e-05, + "loss": 1.4083, + "step": 32595 + }, + { + "epoch": 2.56, + "learning_rate": 1.5309922689117384e-05, + "loss": 1.4545, + "step": 32596 + }, + { + "epoch": 2.56, + "learning_rate": 1.5304483259060323e-05, + "loss": 1.451, + "step": 32597 + }, + { + "epoch": 2.56, + "learning_rate": 1.529904474351152e-05, + "loss": 1.4296, + "step": 32598 + }, + { + "epoch": 2.56, + "learning_rate": 1.5293607142507884e-05, + "loss": 1.3928, + "step": 32599 + }, + { + "epoch": 2.57, + "learning_rate": 1.5288170456086278e-05, + "loss": 1.453, + "step": 32600 + }, + { + "epoch": 2.57, + "learning_rate": 1.528273468428367e-05, + "loss": 1.468, + "step": 32601 + }, + { + "epoch": 2.57, + "learning_rate": 1.5277299827136964e-05, + "loss": 1.4668, + "step": 32602 + }, + { + "epoch": 2.57, + "learning_rate": 1.5271865884683026e-05, + "loss": 1.3954, + "step": 32603 + }, + { + "epoch": 2.57, + "learning_rate": 1.5266432856958748e-05, + "loss": 1.4064, + "step": 32604 + }, + { + "epoch": 2.57, + "learning_rate": 1.5261000744001084e-05, + "loss": 1.4432, + "step": 32605 + }, + { + "epoch": 2.57, + "learning_rate": 1.5255569545846868e-05, + "loss": 1.4365, + "step": 32606 + }, + { + "epoch": 2.57, + "learning_rate": 1.525013926253294e-05, + "loss": 1.3994, + "step": 32607 + }, + { + "epoch": 2.57, + "learning_rate": 1.5244709894096252e-05, + "loss": 1.4479, + "step": 32608 + }, + { + "epoch": 2.57, + "learning_rate": 1.523928144057361e-05, + "loss": 1.4556, + "step": 32609 + }, + { + "epoch": 2.57, + "learning_rate": 1.5233853902001846e-05, + "loss": 1.4702, + "step": 32610 + }, + { + "epoch": 2.57, + "learning_rate": 1.522842727841787e-05, + "loss": 1.489, + "step": 32611 + }, + { + "epoch": 2.57, + "learning_rate": 1.52230015698585e-05, + "loss": 1.4529, + "step": 32612 + }, + { + "epoch": 2.57, + "learning_rate": 1.5217576776360558e-05, + "loss": 1.4497, + "step": 32613 + }, + { + "epoch": 2.57, + "learning_rate": 1.521215289796091e-05, + "loss": 1.4605, + "step": 32614 + }, + { + "epoch": 2.57, + "learning_rate": 1.5206729934696348e-05, + "loss": 1.3837, + "step": 32615 + }, + { + "epoch": 2.57, + "learning_rate": 1.5201307886603725e-05, + "loss": 1.3836, + "step": 32616 + }, + { + "epoch": 2.57, + "learning_rate": 1.5195886753719794e-05, + "loss": 1.4036, + "step": 32617 + }, + { + "epoch": 2.57, + "learning_rate": 1.5190466536081442e-05, + "loss": 1.4264, + "step": 32618 + }, + { + "epoch": 2.57, + "learning_rate": 1.5185047233725389e-05, + "loss": 1.4456, + "step": 32619 + }, + { + "epoch": 2.57, + "learning_rate": 1.5179628846688507e-05, + "loss": 1.4703, + "step": 32620 + }, + { + "epoch": 2.57, + "learning_rate": 1.51742113750075e-05, + "loss": 1.4063, + "step": 32621 + }, + { + "epoch": 2.57, + "learning_rate": 1.5168794818719238e-05, + "loss": 1.4358, + "step": 32622 + }, + { + "epoch": 2.57, + "learning_rate": 1.5163379177860441e-05, + "loss": 1.5084, + "step": 32623 + }, + { + "epoch": 2.57, + "learning_rate": 1.5157964452467863e-05, + "loss": 1.5137, + "step": 32624 + }, + { + "epoch": 2.57, + "learning_rate": 1.5152550642578343e-05, + "loss": 1.4284, + "step": 32625 + }, + { + "epoch": 2.57, + "learning_rate": 1.5147137748228565e-05, + "loss": 1.4454, + "step": 32626 + }, + { + "epoch": 2.57, + "learning_rate": 1.5141725769455288e-05, + "loss": 1.452, + "step": 32627 + }, + { + "epoch": 2.57, + "learning_rate": 1.5136314706295293e-05, + "loss": 1.4601, + "step": 32628 + }, + { + "epoch": 2.57, + "learning_rate": 1.5130904558785306e-05, + "loss": 1.4783, + "step": 32629 + }, + { + "epoch": 2.57, + "learning_rate": 1.5125495326962011e-05, + "loss": 1.4196, + "step": 32630 + }, + { + "epoch": 2.57, + "learning_rate": 1.5120087010862214e-05, + "loss": 1.469, + "step": 32631 + }, + { + "epoch": 2.57, + "learning_rate": 1.5114679610522584e-05, + "loss": 1.4634, + "step": 32632 + }, + { + "epoch": 2.57, + "learning_rate": 1.5109273125979843e-05, + "loss": 1.4157, + "step": 32633 + }, + { + "epoch": 2.57, + "learning_rate": 1.5103867557270676e-05, + "loss": 1.4506, + "step": 32634 + }, + { + "epoch": 2.57, + "learning_rate": 1.5098462904431807e-05, + "loss": 1.4786, + "step": 32635 + }, + { + "epoch": 2.57, + "learning_rate": 1.5093059167499955e-05, + "loss": 1.4274, + "step": 32636 + }, + { + "epoch": 2.57, + "learning_rate": 1.5087656346511772e-05, + "loss": 1.4303, + "step": 32637 + }, + { + "epoch": 2.57, + "learning_rate": 1.5082254441503949e-05, + "loss": 1.4143, + "step": 32638 + }, + { + "epoch": 2.57, + "learning_rate": 1.507685345251317e-05, + "loss": 1.412, + "step": 32639 + }, + { + "epoch": 2.57, + "learning_rate": 1.5071453379576109e-05, + "loss": 1.4198, + "step": 32640 + }, + { + "epoch": 2.57, + "learning_rate": 1.5066054222729384e-05, + "loss": 1.465, + "step": 32641 + }, + { + "epoch": 2.57, + "learning_rate": 1.5060655982009734e-05, + "loss": 1.4229, + "step": 32642 + }, + { + "epoch": 2.57, + "learning_rate": 1.5055258657453744e-05, + "loss": 1.4172, + "step": 32643 + }, + { + "epoch": 2.57, + "learning_rate": 1.504986224909807e-05, + "loss": 1.4333, + "step": 32644 + }, + { + "epoch": 2.57, + "learning_rate": 1.5044466756979367e-05, + "loss": 1.5021, + "step": 32645 + }, + { + "epoch": 2.57, + "learning_rate": 1.503907218113427e-05, + "loss": 1.4159, + "step": 32646 + }, + { + "epoch": 2.57, + "learning_rate": 1.5033678521599368e-05, + "loss": 1.4773, + "step": 32647 + }, + { + "epoch": 2.57, + "learning_rate": 1.5028285778411348e-05, + "loss": 1.4405, + "step": 32648 + }, + { + "epoch": 2.57, + "learning_rate": 1.5022893951606763e-05, + "loss": 1.4336, + "step": 32649 + }, + { + "epoch": 2.57, + "learning_rate": 1.5017503041222234e-05, + "loss": 1.4351, + "step": 32650 + }, + { + "epoch": 2.57, + "learning_rate": 1.501211304729435e-05, + "loss": 1.4593, + "step": 32651 + }, + { + "epoch": 2.57, + "learning_rate": 1.5006723969859763e-05, + "loss": 1.4573, + "step": 32652 + }, + { + "epoch": 2.57, + "learning_rate": 1.5001335808955029e-05, + "loss": 1.4541, + "step": 32653 + }, + { + "epoch": 2.57, + "learning_rate": 1.4995948564616717e-05, + "loss": 1.4362, + "step": 32654 + }, + { + "epoch": 2.57, + "learning_rate": 1.4990562236881398e-05, + "loss": 1.4948, + "step": 32655 + }, + { + "epoch": 2.57, + "learning_rate": 1.4985176825785677e-05, + "loss": 1.44, + "step": 32656 + }, + { + "epoch": 2.57, + "learning_rate": 1.4979792331366092e-05, + "loss": 1.4315, + "step": 32657 + }, + { + "epoch": 2.57, + "learning_rate": 1.4974408753659195e-05, + "loss": 1.4124, + "step": 32658 + }, + { + "epoch": 2.57, + "learning_rate": 1.4969026092701559e-05, + "loss": 1.4576, + "step": 32659 + }, + { + "epoch": 2.57, + "learning_rate": 1.4963644348529735e-05, + "loss": 1.4268, + "step": 32660 + }, + { + "epoch": 2.57, + "learning_rate": 1.4958263521180197e-05, + "loss": 1.4586, + "step": 32661 + }, + { + "epoch": 2.57, + "learning_rate": 1.4952883610689581e-05, + "loss": 1.4461, + "step": 32662 + }, + { + "epoch": 2.57, + "learning_rate": 1.494750461709434e-05, + "loss": 1.4177, + "step": 32663 + }, + { + "epoch": 2.57, + "learning_rate": 1.4942126540430998e-05, + "loss": 1.4954, + "step": 32664 + }, + { + "epoch": 2.57, + "learning_rate": 1.4936749380736107e-05, + "loss": 1.4011, + "step": 32665 + }, + { + "epoch": 2.57, + "learning_rate": 1.4931373138046138e-05, + "loss": 1.415, + "step": 32666 + }, + { + "epoch": 2.57, + "learning_rate": 1.4925997812397627e-05, + "loss": 1.4682, + "step": 32667 + }, + { + "epoch": 2.57, + "learning_rate": 1.4920623403827015e-05, + "loss": 1.448, + "step": 32668 + }, + { + "epoch": 2.57, + "learning_rate": 1.491524991237087e-05, + "loss": 1.4346, + "step": 32669 + }, + { + "epoch": 2.57, + "learning_rate": 1.490987733806563e-05, + "loss": 1.4639, + "step": 32670 + }, + { + "epoch": 2.57, + "learning_rate": 1.4904505680947748e-05, + "loss": 1.4541, + "step": 32671 + }, + { + "epoch": 2.57, + "learning_rate": 1.489913494105373e-05, + "loss": 1.4445, + "step": 32672 + }, + { + "epoch": 2.57, + "learning_rate": 1.4893765118420048e-05, + "loss": 1.4469, + "step": 32673 + }, + { + "epoch": 2.57, + "learning_rate": 1.4888396213083137e-05, + "loss": 1.4693, + "step": 32674 + }, + { + "epoch": 2.57, + "learning_rate": 1.4883028225079435e-05, + "loss": 1.4805, + "step": 32675 + }, + { + "epoch": 2.57, + "learning_rate": 1.4877661154445431e-05, + "loss": 1.5403, + "step": 32676 + }, + { + "epoch": 2.57, + "learning_rate": 1.4872295001217526e-05, + "loss": 1.386, + "step": 32677 + }, + { + "epoch": 2.57, + "learning_rate": 1.4866929765432162e-05, + "loss": 1.4953, + "step": 32678 + }, + { + "epoch": 2.57, + "learning_rate": 1.486156544712579e-05, + "loss": 1.52, + "step": 32679 + }, + { + "epoch": 2.57, + "learning_rate": 1.4856202046334814e-05, + "loss": 1.4584, + "step": 32680 + }, + { + "epoch": 2.57, + "learning_rate": 1.4850839563095623e-05, + "loss": 1.4162, + "step": 32681 + }, + { + "epoch": 2.57, + "learning_rate": 1.4845477997444654e-05, + "loss": 1.3912, + "step": 32682 + }, + { + "epoch": 2.57, + "learning_rate": 1.4840117349418328e-05, + "loss": 1.4601, + "step": 32683 + }, + { + "epoch": 2.57, + "learning_rate": 1.4834757619053018e-05, + "loss": 1.4465, + "step": 32684 + }, + { + "epoch": 2.57, + "learning_rate": 1.4829398806385073e-05, + "loss": 1.484, + "step": 32685 + }, + { + "epoch": 2.57, + "learning_rate": 1.4824040911450952e-05, + "loss": 1.4311, + "step": 32686 + }, + { + "epoch": 2.57, + "learning_rate": 1.4818683934287007e-05, + "loss": 1.4932, + "step": 32687 + }, + { + "epoch": 2.57, + "learning_rate": 1.4813327874929559e-05, + "loss": 1.4562, + "step": 32688 + }, + { + "epoch": 2.57, + "learning_rate": 1.4807972733415047e-05, + "loss": 1.4504, + "step": 32689 + }, + { + "epoch": 2.57, + "learning_rate": 1.480261850977979e-05, + "loss": 1.4916, + "step": 32690 + }, + { + "epoch": 2.57, + "learning_rate": 1.479726520406016e-05, + "loss": 1.4083, + "step": 32691 + }, + { + "epoch": 2.57, + "learning_rate": 1.4791912816292445e-05, + "loss": 1.4271, + "step": 32692 + }, + { + "epoch": 2.57, + "learning_rate": 1.4786561346513066e-05, + "loss": 1.4738, + "step": 32693 + }, + { + "epoch": 2.57, + "learning_rate": 1.4781210794758308e-05, + "loss": 1.4875, + "step": 32694 + }, + { + "epoch": 2.57, + "learning_rate": 1.4775861161064494e-05, + "loss": 1.4191, + "step": 32695 + }, + { + "epoch": 2.57, + "learning_rate": 1.477051244546798e-05, + "loss": 1.45, + "step": 32696 + }, + { + "epoch": 2.57, + "learning_rate": 1.4765164648005052e-05, + "loss": 1.4399, + "step": 32697 + }, + { + "epoch": 2.57, + "learning_rate": 1.4759817768712012e-05, + "loss": 1.4387, + "step": 32698 + }, + { + "epoch": 2.57, + "learning_rate": 1.4754471807625168e-05, + "loss": 1.4668, + "step": 32699 + }, + { + "epoch": 2.57, + "learning_rate": 1.4749126764780856e-05, + "loss": 1.4223, + "step": 32700 + }, + { + "epoch": 2.57, + "learning_rate": 1.4743782640215345e-05, + "loss": 1.4498, + "step": 32701 + }, + { + "epoch": 2.57, + "learning_rate": 1.4738439433964877e-05, + "loss": 1.4368, + "step": 32702 + }, + { + "epoch": 2.57, + "learning_rate": 1.4733097146065787e-05, + "loss": 1.4323, + "step": 32703 + }, + { + "epoch": 2.57, + "learning_rate": 1.4727755776554312e-05, + "loss": 1.4922, + "step": 32704 + }, + { + "epoch": 2.57, + "learning_rate": 1.4722415325466707e-05, + "loss": 1.4208, + "step": 32705 + }, + { + "epoch": 2.57, + "learning_rate": 1.4717075792839278e-05, + "loss": 1.4555, + "step": 32706 + }, + { + "epoch": 2.57, + "learning_rate": 1.4711737178708261e-05, + "loss": 1.4616, + "step": 32707 + }, + { + "epoch": 2.57, + "learning_rate": 1.4706399483109876e-05, + "loss": 1.4401, + "step": 32708 + }, + { + "epoch": 2.57, + "learning_rate": 1.4701062706080346e-05, + "loss": 1.4476, + "step": 32709 + }, + { + "epoch": 2.57, + "learning_rate": 1.4695726847655976e-05, + "loss": 1.4431, + "step": 32710 + }, + { + "epoch": 2.57, + "learning_rate": 1.469039190787295e-05, + "loss": 1.4459, + "step": 32711 + }, + { + "epoch": 2.57, + "learning_rate": 1.468505788676746e-05, + "loss": 1.3787, + "step": 32712 + }, + { + "epoch": 2.57, + "learning_rate": 1.4679724784375757e-05, + "loss": 1.4907, + "step": 32713 + }, + { + "epoch": 2.57, + "learning_rate": 1.4674392600734063e-05, + "loss": 1.4337, + "step": 32714 + }, + { + "epoch": 2.57, + "learning_rate": 1.4669061335878584e-05, + "loss": 1.4728, + "step": 32715 + }, + { + "epoch": 2.57, + "learning_rate": 1.4663730989845457e-05, + "loss": 1.4657, + "step": 32716 + }, + { + "epoch": 2.57, + "learning_rate": 1.4658401562670952e-05, + "loss": 1.4542, + "step": 32717 + }, + { + "epoch": 2.57, + "learning_rate": 1.4653073054391207e-05, + "loss": 1.4417, + "step": 32718 + }, + { + "epoch": 2.57, + "learning_rate": 1.464774546504236e-05, + "loss": 1.4393, + "step": 32719 + }, + { + "epoch": 2.57, + "learning_rate": 1.4642418794660681e-05, + "loss": 1.4119, + "step": 32720 + }, + { + "epoch": 2.57, + "learning_rate": 1.463709304328226e-05, + "loss": 1.4319, + "step": 32721 + }, + { + "epoch": 2.57, + "learning_rate": 1.4631768210943268e-05, + "loss": 1.496, + "step": 32722 + }, + { + "epoch": 2.57, + "learning_rate": 1.462644429767989e-05, + "loss": 1.4281, + "step": 32723 + }, + { + "epoch": 2.57, + "learning_rate": 1.462112130352825e-05, + "loss": 1.4594, + "step": 32724 + }, + { + "epoch": 2.57, + "learning_rate": 1.461579922852445e-05, + "loss": 1.4621, + "step": 32725 + }, + { + "epoch": 2.57, + "learning_rate": 1.4610478072704695e-05, + "loss": 1.4547, + "step": 32726 + }, + { + "epoch": 2.58, + "learning_rate": 1.4605157836105092e-05, + "loss": 1.3533, + "step": 32727 + }, + { + "epoch": 2.58, + "learning_rate": 1.4599838518761742e-05, + "loss": 1.3802, + "step": 32728 + }, + { + "epoch": 2.58, + "learning_rate": 1.4594520120710718e-05, + "loss": 1.4193, + "step": 32729 + }, + { + "epoch": 2.58, + "learning_rate": 1.4589202641988224e-05, + "loss": 1.4774, + "step": 32730 + }, + { + "epoch": 2.58, + "learning_rate": 1.4583886082630313e-05, + "loss": 1.4404, + "step": 32731 + }, + { + "epoch": 2.58, + "learning_rate": 1.457857044267311e-05, + "loss": 1.4449, + "step": 32732 + }, + { + "epoch": 2.58, + "learning_rate": 1.4573255722152632e-05, + "loss": 1.4383, + "step": 32733 + }, + { + "epoch": 2.58, + "learning_rate": 1.4567941921105052e-05, + "loss": 1.4543, + "step": 32734 + }, + { + "epoch": 2.58, + "learning_rate": 1.456262903956641e-05, + "loss": 1.5027, + "step": 32735 + }, + { + "epoch": 2.58, + "learning_rate": 1.455731707757274e-05, + "loss": 1.4125, + "step": 32736 + }, + { + "epoch": 2.58, + "learning_rate": 1.455200603516018e-05, + "loss": 1.4157, + "step": 32737 + }, + { + "epoch": 2.58, + "learning_rate": 1.4546695912364753e-05, + "loss": 1.473, + "step": 32738 + }, + { + "epoch": 2.58, + "learning_rate": 1.454138670922248e-05, + "loss": 1.463, + "step": 32739 + }, + { + "epoch": 2.58, + "learning_rate": 1.4536078425769466e-05, + "loss": 1.4087, + "step": 32740 + }, + { + "epoch": 2.58, + "learning_rate": 1.453077106204173e-05, + "loss": 1.4525, + "step": 32741 + }, + { + "epoch": 2.58, + "learning_rate": 1.4525464618075261e-05, + "loss": 1.4227, + "step": 32742 + }, + { + "epoch": 2.58, + "learning_rate": 1.4520159093906164e-05, + "loss": 1.4651, + "step": 32743 + }, + { + "epoch": 2.58, + "learning_rate": 1.4514854489570427e-05, + "loss": 1.5297, + "step": 32744 + }, + { + "epoch": 2.58, + "learning_rate": 1.450955080510402e-05, + "loss": 1.4407, + "step": 32745 + }, + { + "epoch": 2.58, + "learning_rate": 1.4504248040542999e-05, + "loss": 1.4404, + "step": 32746 + }, + { + "epoch": 2.58, + "learning_rate": 1.4498946195923383e-05, + "loss": 1.4225, + "step": 32747 + }, + { + "epoch": 2.58, + "learning_rate": 1.4493645271281162e-05, + "loss": 1.4525, + "step": 32748 + }, + { + "epoch": 2.58, + "learning_rate": 1.448834526665229e-05, + "loss": 1.4915, + "step": 32749 + }, + { + "epoch": 2.58, + "learning_rate": 1.4483046182072755e-05, + "loss": 1.4463, + "step": 32750 + }, + { + "epoch": 2.58, + "learning_rate": 1.4477748017578595e-05, + "loss": 1.43, + "step": 32751 + }, + { + "epoch": 2.58, + "learning_rate": 1.4472450773205712e-05, + "loss": 1.4527, + "step": 32752 + }, + { + "epoch": 2.58, + "learning_rate": 1.4467154448990082e-05, + "loss": 1.4696, + "step": 32753 + }, + { + "epoch": 2.58, + "learning_rate": 1.4461859044967721e-05, + "loss": 1.4066, + "step": 32754 + }, + { + "epoch": 2.58, + "learning_rate": 1.4456564561174521e-05, + "loss": 1.4254, + "step": 32755 + }, + { + "epoch": 2.58, + "learning_rate": 1.4451270997646437e-05, + "loss": 1.4356, + "step": 32756 + }, + { + "epoch": 2.58, + "learning_rate": 1.4445978354419436e-05, + "loss": 1.4659, + "step": 32757 + }, + { + "epoch": 2.58, + "learning_rate": 1.4440686631529441e-05, + "loss": 1.4435, + "step": 32758 + }, + { + "epoch": 2.58, + "learning_rate": 1.4435395829012342e-05, + "loss": 1.4257, + "step": 32759 + }, + { + "epoch": 2.58, + "learning_rate": 1.4430105946904108e-05, + "loss": 1.4447, + "step": 32760 + }, + { + "epoch": 2.58, + "learning_rate": 1.4424816985240662e-05, + "loss": 1.4196, + "step": 32761 + }, + { + "epoch": 2.58, + "learning_rate": 1.441952894405789e-05, + "loss": 1.4606, + "step": 32762 + }, + { + "epoch": 2.58, + "learning_rate": 1.4414241823391665e-05, + "loss": 1.495, + "step": 32763 + }, + { + "epoch": 2.58, + "learning_rate": 1.4408955623277956e-05, + "loss": 1.4353, + "step": 32764 + }, + { + "epoch": 2.58, + "learning_rate": 1.4403670343752604e-05, + "loss": 1.4177, + "step": 32765 + }, + { + "epoch": 2.58, + "learning_rate": 1.4398385984851496e-05, + "loss": 1.4768, + "step": 32766 + }, + { + "epoch": 2.58, + "learning_rate": 1.4393102546610502e-05, + "loss": 1.4719, + "step": 32767 + }, + { + "epoch": 2.58, + "learning_rate": 1.4387820029065528e-05, + "loss": 1.4597, + "step": 32768 + }, + { + "epoch": 2.58, + "learning_rate": 1.4382538432252428e-05, + "loss": 1.4689, + "step": 32769 + }, + { + "epoch": 2.58, + "learning_rate": 1.4377257756207006e-05, + "loss": 1.4613, + "step": 32770 + }, + { + "epoch": 2.58, + "learning_rate": 1.4371978000965201e-05, + "loss": 1.4105, + "step": 32771 + }, + { + "epoch": 2.58, + "learning_rate": 1.4366699166562817e-05, + "loss": 1.4487, + "step": 32772 + }, + { + "epoch": 2.58, + "learning_rate": 1.4361421253035677e-05, + "loss": 1.4292, + "step": 32773 + }, + { + "epoch": 2.58, + "learning_rate": 1.435614426041965e-05, + "loss": 1.4869, + "step": 32774 + }, + { + "epoch": 2.58, + "learning_rate": 1.4350868188750558e-05, + "loss": 1.4802, + "step": 32775 + }, + { + "epoch": 2.58, + "learning_rate": 1.434559303806419e-05, + "loss": 1.4576, + "step": 32776 + }, + { + "epoch": 2.58, + "learning_rate": 1.4340318808396385e-05, + "loss": 1.4122, + "step": 32777 + }, + { + "epoch": 2.58, + "learning_rate": 1.433504549978296e-05, + "loss": 1.3959, + "step": 32778 + }, + { + "epoch": 2.58, + "learning_rate": 1.4329773112259723e-05, + "loss": 1.4512, + "step": 32779 + }, + { + "epoch": 2.58, + "learning_rate": 1.432450164586243e-05, + "loss": 1.3803, + "step": 32780 + }, + { + "epoch": 2.58, + "learning_rate": 1.4319231100626933e-05, + "loss": 1.4137, + "step": 32781 + }, + { + "epoch": 2.58, + "learning_rate": 1.431396147658897e-05, + "loss": 1.4529, + "step": 32782 + }, + { + "epoch": 2.58, + "learning_rate": 1.4308692773784313e-05, + "loss": 1.4088, + "step": 32783 + }, + { + "epoch": 2.58, + "learning_rate": 1.4303424992248786e-05, + "loss": 1.3772, + "step": 32784 + }, + { + "epoch": 2.58, + "learning_rate": 1.4298158132018106e-05, + "loss": 1.4096, + "step": 32785 + }, + { + "epoch": 2.58, + "learning_rate": 1.4292892193128047e-05, + "loss": 1.3887, + "step": 32786 + }, + { + "epoch": 2.58, + "learning_rate": 1.428762717561433e-05, + "loss": 1.4315, + "step": 32787 + }, + { + "epoch": 2.58, + "learning_rate": 1.428236307951276e-05, + "loss": 1.4537, + "step": 32788 + }, + { + "epoch": 2.58, + "learning_rate": 1.4277099904859058e-05, + "loss": 1.421, + "step": 32789 + }, + { + "epoch": 2.58, + "learning_rate": 1.4271837651688927e-05, + "loss": 1.4428, + "step": 32790 + }, + { + "epoch": 2.58, + "learning_rate": 1.4266576320038125e-05, + "loss": 1.4524, + "step": 32791 + }, + { + "epoch": 2.58, + "learning_rate": 1.4261315909942356e-05, + "loss": 1.4353, + "step": 32792 + }, + { + "epoch": 2.58, + "learning_rate": 1.4256056421437357e-05, + "loss": 1.4604, + "step": 32793 + }, + { + "epoch": 2.58, + "learning_rate": 1.4250797854558816e-05, + "loss": 1.4785, + "step": 32794 + }, + { + "epoch": 2.58, + "learning_rate": 1.4245540209342454e-05, + "loss": 1.4112, + "step": 32795 + }, + { + "epoch": 2.58, + "learning_rate": 1.4240283485823978e-05, + "loss": 1.4785, + "step": 32796 + }, + { + "epoch": 2.58, + "learning_rate": 1.4235027684039025e-05, + "loss": 1.4061, + "step": 32797 + }, + { + "epoch": 2.58, + "learning_rate": 1.4229772804023332e-05, + "loss": 1.4784, + "step": 32798 + }, + { + "epoch": 2.58, + "learning_rate": 1.4224518845812554e-05, + "loss": 1.4553, + "step": 32799 + }, + { + "epoch": 2.58, + "learning_rate": 1.4219265809442349e-05, + "loss": 1.4116, + "step": 32800 + }, + { + "epoch": 2.58, + "learning_rate": 1.4214013694948417e-05, + "loss": 1.3998, + "step": 32801 + }, + { + "epoch": 2.58, + "learning_rate": 1.4208762502366416e-05, + "loss": 1.4612, + "step": 32802 + }, + { + "epoch": 2.58, + "learning_rate": 1.4203512231731967e-05, + "loss": 1.4681, + "step": 32803 + }, + { + "epoch": 2.58, + "learning_rate": 1.4198262883080708e-05, + "loss": 1.4606, + "step": 32804 + }, + { + "epoch": 2.58, + "learning_rate": 1.4193014456448326e-05, + "loss": 1.4854, + "step": 32805 + }, + { + "epoch": 2.58, + "learning_rate": 1.4187766951870444e-05, + "loss": 1.4929, + "step": 32806 + }, + { + "epoch": 2.58, + "learning_rate": 1.4182520369382633e-05, + "loss": 1.4351, + "step": 32807 + }, + { + "epoch": 2.58, + "learning_rate": 1.4177274709020565e-05, + "loss": 1.5063, + "step": 32808 + }, + { + "epoch": 2.58, + "learning_rate": 1.4172029970819875e-05, + "loss": 1.4655, + "step": 32809 + }, + { + "epoch": 2.58, + "learning_rate": 1.4166786154816157e-05, + "loss": 1.4275, + "step": 32810 + }, + { + "epoch": 2.58, + "learning_rate": 1.416154326104496e-05, + "loss": 1.4501, + "step": 32811 + }, + { + "epoch": 2.58, + "learning_rate": 1.415630128954196e-05, + "loss": 1.4291, + "step": 32812 + }, + { + "epoch": 2.58, + "learning_rate": 1.415106024034271e-05, + "loss": 1.4457, + "step": 32813 + }, + { + "epoch": 2.58, + "learning_rate": 1.4145820113482748e-05, + "loss": 1.4733, + "step": 32814 + }, + { + "epoch": 2.58, + "learning_rate": 1.4140580908997746e-05, + "loss": 1.4532, + "step": 32815 + }, + { + "epoch": 2.58, + "learning_rate": 1.4135342626923225e-05, + "loss": 1.437, + "step": 32816 + }, + { + "epoch": 2.58, + "learning_rate": 1.4130105267294705e-05, + "loss": 1.4412, + "step": 32817 + }, + { + "epoch": 2.58, + "learning_rate": 1.4124868830147828e-05, + "loss": 1.4527, + "step": 32818 + }, + { + "epoch": 2.58, + "learning_rate": 1.4119633315518114e-05, + "loss": 1.472, + "step": 32819 + }, + { + "epoch": 2.58, + "learning_rate": 1.41143987234411e-05, + "loss": 1.4639, + "step": 32820 + }, + { + "epoch": 2.58, + "learning_rate": 1.4109165053952309e-05, + "loss": 1.4411, + "step": 32821 + }, + { + "epoch": 2.58, + "learning_rate": 1.4103932307087312e-05, + "loss": 1.4443, + "step": 32822 + }, + { + "epoch": 2.58, + "learning_rate": 1.4098700482881614e-05, + "loss": 1.4717, + "step": 32823 + }, + { + "epoch": 2.58, + "learning_rate": 1.409346958137072e-05, + "loss": 1.4801, + "step": 32824 + }, + { + "epoch": 2.58, + "learning_rate": 1.4088239602590218e-05, + "loss": 1.4169, + "step": 32825 + }, + { + "epoch": 2.58, + "learning_rate": 1.4083010546575546e-05, + "loss": 1.4371, + "step": 32826 + }, + { + "epoch": 2.58, + "learning_rate": 1.4077782413362243e-05, + "loss": 1.4871, + "step": 32827 + }, + { + "epoch": 2.58, + "learning_rate": 1.4072555202985747e-05, + "loss": 1.4392, + "step": 32828 + }, + { + "epoch": 2.58, + "learning_rate": 1.4067328915481629e-05, + "loss": 1.4133, + "step": 32829 + }, + { + "epoch": 2.58, + "learning_rate": 1.4062103550885328e-05, + "loss": 1.4238, + "step": 32830 + }, + { + "epoch": 2.58, + "learning_rate": 1.40568791092323e-05, + "loss": 1.4512, + "step": 32831 + }, + { + "epoch": 2.58, + "learning_rate": 1.4051655590558081e-05, + "loss": 1.4269, + "step": 32832 + }, + { + "epoch": 2.58, + "learning_rate": 1.4046432994898094e-05, + "loss": 1.479, + "step": 32833 + }, + { + "epoch": 2.58, + "learning_rate": 1.404121132228776e-05, + "loss": 1.4149, + "step": 32834 + }, + { + "epoch": 2.58, + "learning_rate": 1.4035990572762617e-05, + "loss": 1.3975, + "step": 32835 + }, + { + "epoch": 2.58, + "learning_rate": 1.4030770746358056e-05, + "loss": 1.4556, + "step": 32836 + }, + { + "epoch": 2.58, + "learning_rate": 1.4025551843109512e-05, + "loss": 1.4769, + "step": 32837 + }, + { + "epoch": 2.58, + "learning_rate": 1.4020333863052457e-05, + "loss": 1.4576, + "step": 32838 + }, + { + "epoch": 2.58, + "learning_rate": 1.4015116806222266e-05, + "loss": 1.4371, + "step": 32839 + }, + { + "epoch": 2.58, + "learning_rate": 1.4009900672654406e-05, + "loss": 1.5019, + "step": 32840 + }, + { + "epoch": 2.58, + "learning_rate": 1.4004685462384251e-05, + "loss": 1.4645, + "step": 32841 + }, + { + "epoch": 2.58, + "learning_rate": 1.3999471175447274e-05, + "loss": 1.483, + "step": 32842 + }, + { + "epoch": 2.58, + "learning_rate": 1.3994257811878828e-05, + "loss": 1.4755, + "step": 32843 + }, + { + "epoch": 2.58, + "learning_rate": 1.398904537171432e-05, + "loss": 1.4384, + "step": 32844 + }, + { + "epoch": 2.58, + "learning_rate": 1.39838338549891e-05, + "loss": 1.4331, + "step": 32845 + }, + { + "epoch": 2.58, + "learning_rate": 1.397862326173863e-05, + "loss": 1.4592, + "step": 32846 + }, + { + "epoch": 2.58, + "learning_rate": 1.3973413591998245e-05, + "loss": 1.4338, + "step": 32847 + }, + { + "epoch": 2.58, + "learning_rate": 1.3968204845803283e-05, + "loss": 1.454, + "step": 32848 + }, + { + "epoch": 2.58, + "learning_rate": 1.3962997023189165e-05, + "loss": 1.4748, + "step": 32849 + }, + { + "epoch": 2.58, + "learning_rate": 1.3957790124191232e-05, + "loss": 1.4412, + "step": 32850 + }, + { + "epoch": 2.58, + "learning_rate": 1.3952584148844802e-05, + "loss": 1.4626, + "step": 32851 + }, + { + "epoch": 2.58, + "learning_rate": 1.3947379097185268e-05, + "loss": 1.4744, + "step": 32852 + }, + { + "epoch": 2.58, + "learning_rate": 1.3942174969247949e-05, + "loss": 1.4594, + "step": 32853 + }, + { + "epoch": 2.58, + "learning_rate": 1.3936971765068167e-05, + "loss": 1.3956, + "step": 32854 + }, + { + "epoch": 2.59, + "learning_rate": 1.3931769484681244e-05, + "loss": 1.4763, + "step": 32855 + }, + { + "epoch": 2.59, + "learning_rate": 1.3926568128122567e-05, + "loss": 1.4238, + "step": 32856 + }, + { + "epoch": 2.59, + "learning_rate": 1.3921367695427377e-05, + "loss": 1.4291, + "step": 32857 + }, + { + "epoch": 2.59, + "learning_rate": 1.3916168186630994e-05, + "loss": 1.4082, + "step": 32858 + }, + { + "epoch": 2.59, + "learning_rate": 1.3910969601768757e-05, + "loss": 1.447, + "step": 32859 + }, + { + "epoch": 2.59, + "learning_rate": 1.3905771940875921e-05, + "loss": 1.4523, + "step": 32860 + }, + { + "epoch": 2.59, + "learning_rate": 1.3900575203987808e-05, + "loss": 1.4257, + "step": 32861 + }, + { + "epoch": 2.59, + "learning_rate": 1.3895379391139656e-05, + "loss": 1.4168, + "step": 32862 + }, + { + "epoch": 2.59, + "learning_rate": 1.3890184502366785e-05, + "loss": 1.4892, + "step": 32863 + }, + { + "epoch": 2.59, + "learning_rate": 1.3884990537704454e-05, + "loss": 1.436, + "step": 32864 + }, + { + "epoch": 2.59, + "learning_rate": 1.38797974971879e-05, + "loss": 1.4544, + "step": 32865 + }, + { + "epoch": 2.59, + "learning_rate": 1.3874605380852427e-05, + "loss": 1.4344, + "step": 32866 + }, + { + "epoch": 2.59, + "learning_rate": 1.3869414188733257e-05, + "loss": 1.3928, + "step": 32867 + }, + { + "epoch": 2.59, + "learning_rate": 1.3864223920865631e-05, + "loss": 1.449, + "step": 32868 + }, + { + "epoch": 2.59, + "learning_rate": 1.3859034577284816e-05, + "loss": 1.4041, + "step": 32869 + }, + { + "epoch": 2.59, + "learning_rate": 1.3853846158026021e-05, + "loss": 1.4657, + "step": 32870 + }, + { + "epoch": 2.59, + "learning_rate": 1.3848658663124468e-05, + "loss": 1.4408, + "step": 32871 + }, + { + "epoch": 2.59, + "learning_rate": 1.3843472092615376e-05, + "loss": 1.4285, + "step": 32872 + }, + { + "epoch": 2.59, + "learning_rate": 1.3838286446534002e-05, + "loss": 1.4372, + "step": 32873 + }, + { + "epoch": 2.59, + "learning_rate": 1.3833101724915519e-05, + "loss": 1.4631, + "step": 32874 + }, + { + "epoch": 2.59, + "learning_rate": 1.3827917927795113e-05, + "loss": 1.4606, + "step": 32875 + }, + { + "epoch": 2.59, + "learning_rate": 1.3822735055208006e-05, + "loss": 1.4172, + "step": 32876 + }, + { + "epoch": 2.59, + "learning_rate": 1.3817553107189405e-05, + "loss": 1.488, + "step": 32877 + }, + { + "epoch": 2.59, + "learning_rate": 1.3812372083774432e-05, + "loss": 1.4447, + "step": 32878 + }, + { + "epoch": 2.59, + "learning_rate": 1.3807191984998307e-05, + "loss": 1.5076, + "step": 32879 + }, + { + "epoch": 2.59, + "learning_rate": 1.3802012810896218e-05, + "loss": 1.499, + "step": 32880 + }, + { + "epoch": 2.59, + "learning_rate": 1.379683456150329e-05, + "loss": 1.4639, + "step": 32881 + }, + { + "epoch": 2.59, + "learning_rate": 1.3791657236854659e-05, + "loss": 1.4456, + "step": 32882 + }, + { + "epoch": 2.59, + "learning_rate": 1.3786480836985547e-05, + "loss": 1.4248, + "step": 32883 + }, + { + "epoch": 2.59, + "learning_rate": 1.3781305361931044e-05, + "loss": 1.4349, + "step": 32884 + }, + { + "epoch": 2.59, + "learning_rate": 1.3776130811726289e-05, + "loss": 1.4429, + "step": 32885 + }, + { + "epoch": 2.59, + "learning_rate": 1.3770957186406434e-05, + "loss": 1.413, + "step": 32886 + }, + { + "epoch": 2.59, + "learning_rate": 1.3765784486006637e-05, + "loss": 1.4541, + "step": 32887 + }, + { + "epoch": 2.59, + "learning_rate": 1.376061271056197e-05, + "loss": 1.5028, + "step": 32888 + }, + { + "epoch": 2.59, + "learning_rate": 1.3755441860107535e-05, + "loss": 1.4519, + "step": 32889 + }, + { + "epoch": 2.59, + "learning_rate": 1.3750271934678492e-05, + "loss": 1.4353, + "step": 32890 + }, + { + "epoch": 2.59, + "learning_rate": 1.374510293430991e-05, + "loss": 1.441, + "step": 32891 + }, + { + "epoch": 2.59, + "learning_rate": 1.3739934859036878e-05, + "loss": 1.4583, + "step": 32892 + }, + { + "epoch": 2.59, + "learning_rate": 1.37347677088945e-05, + "loss": 1.4511, + "step": 32893 + }, + { + "epoch": 2.59, + "learning_rate": 1.3729601483917869e-05, + "loss": 1.402, + "step": 32894 + }, + { + "epoch": 2.59, + "learning_rate": 1.3724436184142002e-05, + "loss": 1.4401, + "step": 32895 + }, + { + "epoch": 2.59, + "learning_rate": 1.371927180960204e-05, + "loss": 1.4148, + "step": 32896 + }, + { + "epoch": 2.59, + "learning_rate": 1.371410836033302e-05, + "loss": 1.4375, + "step": 32897 + }, + { + "epoch": 2.59, + "learning_rate": 1.370894583637e-05, + "loss": 1.4858, + "step": 32898 + }, + { + "epoch": 2.59, + "learning_rate": 1.3703784237747983e-05, + "loss": 1.3696, + "step": 32899 + }, + { + "epoch": 2.59, + "learning_rate": 1.3698623564502093e-05, + "loss": 1.4369, + "step": 32900 + }, + { + "epoch": 2.59, + "learning_rate": 1.3693463816667334e-05, + "loss": 1.4227, + "step": 32901 + }, + { + "epoch": 2.59, + "learning_rate": 1.3688304994278709e-05, + "loss": 1.4336, + "step": 32902 + }, + { + "epoch": 2.59, + "learning_rate": 1.3683147097371262e-05, + "loss": 1.4419, + "step": 32903 + }, + { + "epoch": 2.59, + "learning_rate": 1.367799012598006e-05, + "loss": 1.5171, + "step": 32904 + }, + { + "epoch": 2.59, + "learning_rate": 1.3672834080140078e-05, + "loss": 1.4022, + "step": 32905 + }, + { + "epoch": 2.59, + "learning_rate": 1.3667678959886285e-05, + "loss": 1.468, + "step": 32906 + }, + { + "epoch": 2.59, + "learning_rate": 1.3662524765253741e-05, + "loss": 1.4398, + "step": 32907 + }, + { + "epoch": 2.59, + "learning_rate": 1.3657371496277413e-05, + "loss": 1.4594, + "step": 32908 + }, + { + "epoch": 2.59, + "learning_rate": 1.3652219152992278e-05, + "loss": 1.442, + "step": 32909 + }, + { + "epoch": 2.59, + "learning_rate": 1.3647067735433353e-05, + "loss": 1.4239, + "step": 32910 + }, + { + "epoch": 2.59, + "learning_rate": 1.3641917243635597e-05, + "loss": 1.4137, + "step": 32911 + }, + { + "epoch": 2.59, + "learning_rate": 1.3636767677633947e-05, + "loss": 1.4573, + "step": 32912 + }, + { + "epoch": 2.59, + "learning_rate": 1.3631619037463409e-05, + "loss": 1.4662, + "step": 32913 + }, + { + "epoch": 2.59, + "learning_rate": 1.3626471323158939e-05, + "loss": 1.4503, + "step": 32914 + }, + { + "epoch": 2.59, + "learning_rate": 1.3621324534755457e-05, + "loss": 1.474, + "step": 32915 + }, + { + "epoch": 2.59, + "learning_rate": 1.3616178672287902e-05, + "loss": 1.4748, + "step": 32916 + }, + { + "epoch": 2.59, + "learning_rate": 1.3611033735791266e-05, + "loss": 1.4676, + "step": 32917 + }, + { + "epoch": 2.59, + "learning_rate": 1.36058897253004e-05, + "loss": 1.4499, + "step": 32918 + }, + { + "epoch": 2.59, + "learning_rate": 1.3600746640850313e-05, + "loss": 1.455, + "step": 32919 + }, + { + "epoch": 2.59, + "learning_rate": 1.3595604482475859e-05, + "loss": 1.4892, + "step": 32920 + }, + { + "epoch": 2.59, + "learning_rate": 1.3590463250212008e-05, + "loss": 1.4085, + "step": 32921 + }, + { + "epoch": 2.59, + "learning_rate": 1.3585322944093618e-05, + "loss": 1.4884, + "step": 32922 + }, + { + "epoch": 2.59, + "learning_rate": 1.3580183564155594e-05, + "loss": 1.4436, + "step": 32923 + }, + { + "epoch": 2.59, + "learning_rate": 1.3575045110432858e-05, + "loss": 1.3982, + "step": 32924 + }, + { + "epoch": 2.59, + "learning_rate": 1.3569907582960281e-05, + "loss": 1.4398, + "step": 32925 + }, + { + "epoch": 2.59, + "learning_rate": 1.3564770981772722e-05, + "loss": 1.4241, + "step": 32926 + }, + { + "epoch": 2.59, + "learning_rate": 1.3559635306905098e-05, + "loss": 1.459, + "step": 32927 + }, + { + "epoch": 2.59, + "learning_rate": 1.3554500558392268e-05, + "loss": 1.4469, + "step": 32928 + }, + { + "epoch": 2.59, + "learning_rate": 1.3549366736269035e-05, + "loss": 1.4111, + "step": 32929 + }, + { + "epoch": 2.59, + "learning_rate": 1.354423384057034e-05, + "loss": 1.4965, + "step": 32930 + }, + { + "epoch": 2.59, + "learning_rate": 1.3539101871331004e-05, + "loss": 1.4359, + "step": 32931 + }, + { + "epoch": 2.59, + "learning_rate": 1.353397082858585e-05, + "loss": 1.4594, + "step": 32932 + }, + { + "epoch": 2.59, + "learning_rate": 1.3528840712369665e-05, + "loss": 1.4364, + "step": 32933 + }, + { + "epoch": 2.59, + "learning_rate": 1.3523711522717407e-05, + "loss": 1.4338, + "step": 32934 + }, + { + "epoch": 2.59, + "learning_rate": 1.3518583259663828e-05, + "loss": 1.4884, + "step": 32935 + }, + { + "epoch": 2.59, + "learning_rate": 1.3513455923243738e-05, + "loss": 1.4272, + "step": 32936 + }, + { + "epoch": 2.59, + "learning_rate": 1.3508329513491973e-05, + "loss": 1.4486, + "step": 32937 + }, + { + "epoch": 2.59, + "learning_rate": 1.3503204030443337e-05, + "loss": 1.4395, + "step": 32938 + }, + { + "epoch": 2.59, + "learning_rate": 1.3498079474132623e-05, + "loss": 1.3722, + "step": 32939 + }, + { + "epoch": 2.59, + "learning_rate": 1.3492955844594583e-05, + "loss": 1.4616, + "step": 32940 + }, + { + "epoch": 2.59, + "learning_rate": 1.3487833141864073e-05, + "loss": 1.4757, + "step": 32941 + }, + { + "epoch": 2.59, + "learning_rate": 1.348271136597585e-05, + "loss": 1.418, + "step": 32942 + }, + { + "epoch": 2.59, + "learning_rate": 1.3477590516964654e-05, + "loss": 1.4508, + "step": 32943 + }, + { + "epoch": 2.59, + "learning_rate": 1.3472470594865287e-05, + "loss": 1.4017, + "step": 32944 + }, + { + "epoch": 2.59, + "learning_rate": 1.3467351599712522e-05, + "loss": 1.45, + "step": 32945 + }, + { + "epoch": 2.59, + "learning_rate": 1.3462233531541067e-05, + "loss": 1.4985, + "step": 32946 + }, + { + "epoch": 2.59, + "learning_rate": 1.3457116390385709e-05, + "loss": 1.3775, + "step": 32947 + }, + { + "epoch": 2.59, + "learning_rate": 1.3452000176281203e-05, + "loss": 1.4624, + "step": 32948 + }, + { + "epoch": 2.59, + "learning_rate": 1.3446884889262222e-05, + "loss": 1.4347, + "step": 32949 + }, + { + "epoch": 2.59, + "learning_rate": 1.3441770529363539e-05, + "loss": 1.4073, + "step": 32950 + }, + { + "epoch": 2.59, + "learning_rate": 1.343665709661989e-05, + "loss": 1.4304, + "step": 32951 + }, + { + "epoch": 2.59, + "learning_rate": 1.3431544591065984e-05, + "loss": 1.3994, + "step": 32952 + }, + { + "epoch": 2.59, + "learning_rate": 1.342643301273651e-05, + "loss": 1.5001, + "step": 32953 + }, + { + "epoch": 2.59, + "learning_rate": 1.3421322361666204e-05, + "loss": 1.4526, + "step": 32954 + }, + { + "epoch": 2.59, + "learning_rate": 1.3416212637889757e-05, + "loss": 1.4345, + "step": 32955 + }, + { + "epoch": 2.59, + "learning_rate": 1.3411103841441857e-05, + "loss": 1.4068, + "step": 32956 + }, + { + "epoch": 2.59, + "learning_rate": 1.3405995972357142e-05, + "loss": 1.4082, + "step": 32957 + }, + { + "epoch": 2.59, + "learning_rate": 1.3400889030670369e-05, + "loss": 1.4403, + "step": 32958 + }, + { + "epoch": 2.59, + "learning_rate": 1.3395783016416178e-05, + "loss": 1.4523, + "step": 32959 + }, + { + "epoch": 2.59, + "learning_rate": 1.3390677929629223e-05, + "loss": 1.4575, + "step": 32960 + }, + { + "epoch": 2.59, + "learning_rate": 1.3385573770344177e-05, + "loss": 1.4408, + "step": 32961 + }, + { + "epoch": 2.59, + "learning_rate": 1.3380470538595711e-05, + "loss": 1.4386, + "step": 32962 + }, + { + "epoch": 2.59, + "learning_rate": 1.3375368234418431e-05, + "loss": 1.4311, + "step": 32963 + }, + { + "epoch": 2.59, + "learning_rate": 1.3370266857847046e-05, + "loss": 1.442, + "step": 32964 + }, + { + "epoch": 2.59, + "learning_rate": 1.3365166408916106e-05, + "loss": 1.4949, + "step": 32965 + }, + { + "epoch": 2.59, + "learning_rate": 1.3360066887660303e-05, + "loss": 1.4181, + "step": 32966 + }, + { + "epoch": 2.59, + "learning_rate": 1.3354968294114226e-05, + "loss": 1.4883, + "step": 32967 + }, + { + "epoch": 2.59, + "learning_rate": 1.3349870628312532e-05, + "loss": 1.4755, + "step": 32968 + }, + { + "epoch": 2.59, + "learning_rate": 1.3344773890289823e-05, + "loss": 1.4365, + "step": 32969 + }, + { + "epoch": 2.59, + "learning_rate": 1.333967808008064e-05, + "loss": 1.4333, + "step": 32970 + }, + { + "epoch": 2.59, + "learning_rate": 1.3334583197719656e-05, + "loss": 1.4554, + "step": 32971 + }, + { + "epoch": 2.59, + "learning_rate": 1.3329489243241442e-05, + "loss": 1.4559, + "step": 32972 + }, + { + "epoch": 2.59, + "learning_rate": 1.3324396216680572e-05, + "loss": 1.4768, + "step": 32973 + }, + { + "epoch": 2.59, + "learning_rate": 1.33193041180716e-05, + "loss": 1.4664, + "step": 32974 + }, + { + "epoch": 2.59, + "learning_rate": 1.3314212947449149e-05, + "loss": 1.4691, + "step": 32975 + }, + { + "epoch": 2.59, + "learning_rate": 1.3309122704847774e-05, + "loss": 1.4624, + "step": 32976 + }, + { + "epoch": 2.59, + "learning_rate": 1.3304033390301983e-05, + "loss": 1.4173, + "step": 32977 + }, + { + "epoch": 2.59, + "learning_rate": 1.3298945003846396e-05, + "loss": 1.4319, + "step": 32978 + }, + { + "epoch": 2.59, + "learning_rate": 1.3293857545515551e-05, + "loss": 1.477, + "step": 32979 + }, + { + "epoch": 2.59, + "learning_rate": 1.328877101534394e-05, + "loss": 1.4624, + "step": 32980 + }, + { + "epoch": 2.59, + "learning_rate": 1.3283685413366119e-05, + "loss": 1.4423, + "step": 32981 + }, + { + "epoch": 2.6, + "learning_rate": 1.3278600739616657e-05, + "loss": 1.4816, + "step": 32982 + }, + { + "epoch": 2.6, + "learning_rate": 1.3273516994130062e-05, + "loss": 1.4357, + "step": 32983 + }, + { + "epoch": 2.6, + "learning_rate": 1.326843417694079e-05, + "loss": 1.4576, + "step": 32984 + }, + { + "epoch": 2.6, + "learning_rate": 1.3263352288083428e-05, + "loss": 1.384, + "step": 32985 + }, + { + "epoch": 2.6, + "learning_rate": 1.3258271327592451e-05, + "loss": 1.468, + "step": 32986 + }, + { + "epoch": 2.6, + "learning_rate": 1.325319129550233e-05, + "loss": 1.4084, + "step": 32987 + }, + { + "epoch": 2.6, + "learning_rate": 1.3248112191847588e-05, + "loss": 1.4841, + "step": 32988 + }, + { + "epoch": 2.6, + "learning_rate": 1.3243034016662712e-05, + "loss": 1.4281, + "step": 32989 + }, + { + "epoch": 2.6, + "learning_rate": 1.3237956769982128e-05, + "loss": 1.4622, + "step": 32990 + }, + { + "epoch": 2.6, + "learning_rate": 1.3232880451840388e-05, + "loss": 1.4741, + "step": 32991 + }, + { + "epoch": 2.6, + "learning_rate": 1.3227805062271902e-05, + "loss": 1.4394, + "step": 32992 + }, + { + "epoch": 2.6, + "learning_rate": 1.3222730601311154e-05, + "loss": 1.3981, + "step": 32993 + }, + { + "epoch": 2.6, + "learning_rate": 1.3217657068992537e-05, + "loss": 1.4773, + "step": 32994 + }, + { + "epoch": 2.6, + "learning_rate": 1.321258446535059e-05, + "loss": 1.3958, + "step": 32995 + }, + { + "epoch": 2.6, + "learning_rate": 1.3207512790419684e-05, + "loss": 1.4459, + "step": 32996 + }, + { + "epoch": 2.6, + "learning_rate": 1.3202442044234308e-05, + "loss": 1.4609, + "step": 32997 + }, + { + "epoch": 2.6, + "learning_rate": 1.3197372226828817e-05, + "loss": 1.4281, + "step": 32998 + }, + { + "epoch": 2.6, + "learning_rate": 1.3192303338237704e-05, + "loss": 1.4466, + "step": 32999 + }, + { + "epoch": 2.6, + "learning_rate": 1.3187235378495353e-05, + "loss": 1.4055, + "step": 33000 + }, + { + "epoch": 2.6, + "learning_rate": 1.3182168347636157e-05, + "loss": 1.4632, + "step": 33001 + }, + { + "epoch": 2.6, + "learning_rate": 1.3177102245694571e-05, + "loss": 1.4703, + "step": 33002 + }, + { + "epoch": 2.6, + "learning_rate": 1.3172037072704932e-05, + "loss": 1.4172, + "step": 33003 + }, + { + "epoch": 2.6, + "learning_rate": 1.316697282870165e-05, + "loss": 1.4873, + "step": 33004 + }, + { + "epoch": 2.6, + "learning_rate": 1.3161909513719126e-05, + "loss": 1.4586, + "step": 33005 + }, + { + "epoch": 2.6, + "learning_rate": 1.315684712779172e-05, + "loss": 1.4753, + "step": 33006 + }, + { + "epoch": 2.6, + "learning_rate": 1.3151785670953785e-05, + "loss": 1.5135, + "step": 33007 + }, + { + "epoch": 2.6, + "learning_rate": 1.3146725143239728e-05, + "loss": 1.4366, + "step": 33008 + }, + { + "epoch": 2.6, + "learning_rate": 1.3141665544683889e-05, + "loss": 1.4237, + "step": 33009 + }, + { + "epoch": 2.6, + "learning_rate": 1.3136606875320604e-05, + "loss": 1.4215, + "step": 33010 + }, + { + "epoch": 2.6, + "learning_rate": 1.3131549135184216e-05, + "loss": 1.461, + "step": 33011 + }, + { + "epoch": 2.6, + "learning_rate": 1.312649232430908e-05, + "loss": 1.4543, + "step": 33012 + }, + { + "epoch": 2.6, + "learning_rate": 1.3121436442729549e-05, + "loss": 1.4267, + "step": 33013 + }, + { + "epoch": 2.6, + "learning_rate": 1.3116381490479932e-05, + "loss": 1.4683, + "step": 33014 + }, + { + "epoch": 2.6, + "learning_rate": 1.3111327467594535e-05, + "loss": 1.4211, + "step": 33015 + }, + { + "epoch": 2.6, + "learning_rate": 1.3106274374107694e-05, + "loss": 1.484, + "step": 33016 + }, + { + "epoch": 2.6, + "learning_rate": 1.3101222210053703e-05, + "loss": 1.4886, + "step": 33017 + }, + { + "epoch": 2.6, + "learning_rate": 1.3096170975466847e-05, + "loss": 1.4589, + "step": 33018 + }, + { + "epoch": 2.6, + "learning_rate": 1.3091120670381467e-05, + "loss": 1.4149, + "step": 33019 + }, + { + "epoch": 2.6, + "learning_rate": 1.3086071294831819e-05, + "loss": 1.4413, + "step": 33020 + }, + { + "epoch": 2.6, + "learning_rate": 1.3081022848852158e-05, + "loss": 1.4292, + "step": 33021 + }, + { + "epoch": 2.6, + "learning_rate": 1.307597533247684e-05, + "loss": 1.4248, + "step": 33022 + }, + { + "epoch": 2.6, + "learning_rate": 1.3070928745740072e-05, + "loss": 1.4645, + "step": 33023 + }, + { + "epoch": 2.6, + "learning_rate": 1.306588308867611e-05, + "loss": 1.4337, + "step": 33024 + }, + { + "epoch": 2.6, + "learning_rate": 1.3060838361319276e-05, + "loss": 1.4808, + "step": 33025 + }, + { + "epoch": 2.6, + "learning_rate": 1.3055794563703758e-05, + "loss": 1.497, + "step": 33026 + }, + { + "epoch": 2.6, + "learning_rate": 1.305075169586383e-05, + "loss": 1.4767, + "step": 33027 + }, + { + "epoch": 2.6, + "learning_rate": 1.3045709757833684e-05, + "loss": 1.4741, + "step": 33028 + }, + { + "epoch": 2.6, + "learning_rate": 1.3040668749647638e-05, + "loss": 1.4408, + "step": 33029 + }, + { + "epoch": 2.6, + "learning_rate": 1.3035628671339865e-05, + "loss": 1.5025, + "step": 33030 + }, + { + "epoch": 2.6, + "learning_rate": 1.303058952294459e-05, + "loss": 1.4477, + "step": 33031 + }, + { + "epoch": 2.6, + "learning_rate": 1.3025551304496002e-05, + "loss": 1.3662, + "step": 33032 + }, + { + "epoch": 2.6, + "learning_rate": 1.3020514016028355e-05, + "loss": 1.4492, + "step": 33033 + }, + { + "epoch": 2.6, + "learning_rate": 1.301547765757584e-05, + "loss": 1.5008, + "step": 33034 + }, + { + "epoch": 2.6, + "learning_rate": 1.3010442229172597e-05, + "loss": 1.4269, + "step": 33035 + }, + { + "epoch": 2.6, + "learning_rate": 1.300540773085288e-05, + "loss": 1.4358, + "step": 33036 + }, + { + "epoch": 2.6, + "learning_rate": 1.3000374162650862e-05, + "loss": 1.4365, + "step": 33037 + }, + { + "epoch": 2.6, + "learning_rate": 1.299534152460065e-05, + "loss": 1.4536, + "step": 33038 + }, + { + "epoch": 2.6, + "learning_rate": 1.29903098167365e-05, + "loss": 1.4952, + "step": 33039 + }, + { + "epoch": 2.6, + "learning_rate": 1.298527903909255e-05, + "loss": 1.4743, + "step": 33040 + }, + { + "epoch": 2.6, + "learning_rate": 1.2980249191702908e-05, + "loss": 1.4267, + "step": 33041 + }, + { + "epoch": 2.6, + "learning_rate": 1.2975220274601778e-05, + "loss": 1.4297, + "step": 33042 + }, + { + "epoch": 2.6, + "learning_rate": 1.2970192287823267e-05, + "loss": 1.4525, + "step": 33043 + }, + { + "epoch": 2.6, + "learning_rate": 1.2965165231401565e-05, + "loss": 1.4187, + "step": 33044 + }, + { + "epoch": 2.6, + "learning_rate": 1.2960139105370726e-05, + "loss": 1.4263, + "step": 33045 + }, + { + "epoch": 2.6, + "learning_rate": 1.2955113909764957e-05, + "loss": 1.4387, + "step": 33046 + }, + { + "epoch": 2.6, + "learning_rate": 1.2950089644618334e-05, + "loss": 1.4261, + "step": 33047 + }, + { + "epoch": 2.6, + "learning_rate": 1.2945066309964957e-05, + "loss": 1.4532, + "step": 33048 + }, + { + "epoch": 2.6, + "learning_rate": 1.2940043905838954e-05, + "loss": 1.4065, + "step": 33049 + }, + { + "epoch": 2.6, + "learning_rate": 1.2935022432274428e-05, + "loss": 1.4296, + "step": 33050 + }, + { + "epoch": 2.6, + "learning_rate": 1.2930001889305452e-05, + "loss": 1.4486, + "step": 33051 + }, + { + "epoch": 2.6, + "learning_rate": 1.29249822769661e-05, + "loss": 1.448, + "step": 33052 + }, + { + "epoch": 2.6, + "learning_rate": 1.291996359529051e-05, + "loss": 1.4209, + "step": 33053 + }, + { + "epoch": 2.6, + "learning_rate": 1.2914945844312708e-05, + "loss": 1.4668, + "step": 33054 + }, + { + "epoch": 2.6, + "learning_rate": 1.2909929024066745e-05, + "loss": 1.4442, + "step": 33055 + }, + { + "epoch": 2.6, + "learning_rate": 1.2904913134586747e-05, + "loss": 1.4796, + "step": 33056 + }, + { + "epoch": 2.6, + "learning_rate": 1.2899898175906737e-05, + "loss": 1.4795, + "step": 33057 + }, + { + "epoch": 2.6, + "learning_rate": 1.289488414806072e-05, + "loss": 1.4727, + "step": 33058 + }, + { + "epoch": 2.6, + "learning_rate": 1.2889871051082784e-05, + "loss": 1.5212, + "step": 33059 + }, + { + "epoch": 2.6, + "learning_rate": 1.2884858885006987e-05, + "loss": 1.4357, + "step": 33060 + }, + { + "epoch": 2.6, + "learning_rate": 1.2879847649867337e-05, + "loss": 1.4827, + "step": 33061 + }, + { + "epoch": 2.6, + "learning_rate": 1.2874837345697819e-05, + "loss": 1.4437, + "step": 33062 + }, + { + "epoch": 2.6, + "learning_rate": 1.2869827972532509e-05, + "loss": 1.4881, + "step": 33063 + }, + { + "epoch": 2.6, + "learning_rate": 1.2864819530405395e-05, + "loss": 1.4337, + "step": 33064 + }, + { + "epoch": 2.6, + "learning_rate": 1.2859812019350469e-05, + "loss": 1.4623, + "step": 33065 + }, + { + "epoch": 2.6, + "learning_rate": 1.285480543940175e-05, + "loss": 1.4889, + "step": 33066 + }, + { + "epoch": 2.6, + "learning_rate": 1.2849799790593213e-05, + "loss": 1.4127, + "step": 33067 + }, + { + "epoch": 2.6, + "learning_rate": 1.2844795072958847e-05, + "loss": 1.4177, + "step": 33068 + }, + { + "epoch": 2.6, + "learning_rate": 1.2839791286532624e-05, + "loss": 1.4742, + "step": 33069 + }, + { + "epoch": 2.6, + "learning_rate": 1.2834788431348552e-05, + "loss": 1.4704, + "step": 33070 + }, + { + "epoch": 2.6, + "learning_rate": 1.2829786507440554e-05, + "loss": 1.4279, + "step": 33071 + }, + { + "epoch": 2.6, + "learning_rate": 1.28247855148426e-05, + "loss": 1.4858, + "step": 33072 + }, + { + "epoch": 2.6, + "learning_rate": 1.2819785453588682e-05, + "loss": 1.4401, + "step": 33073 + }, + { + "epoch": 2.6, + "learning_rate": 1.2814786323712706e-05, + "loss": 1.4414, + "step": 33074 + }, + { + "epoch": 2.6, + "learning_rate": 1.2809788125248593e-05, + "loss": 1.446, + "step": 33075 + }, + { + "epoch": 2.6, + "learning_rate": 1.2804790858230336e-05, + "loss": 1.5283, + "step": 33076 + }, + { + "epoch": 2.6, + "learning_rate": 1.2799794522691837e-05, + "loss": 1.4332, + "step": 33077 + }, + { + "epoch": 2.6, + "learning_rate": 1.2794799118667038e-05, + "loss": 1.4488, + "step": 33078 + }, + { + "epoch": 2.6, + "learning_rate": 1.278980464618981e-05, + "loss": 1.4109, + "step": 33079 + }, + { + "epoch": 2.6, + "learning_rate": 1.2784811105294113e-05, + "loss": 1.4567, + "step": 33080 + }, + { + "epoch": 2.6, + "learning_rate": 1.2779818496013815e-05, + "loss": 1.4173, + "step": 33081 + }, + { + "epoch": 2.6, + "learning_rate": 1.2774826818382811e-05, + "loss": 1.4541, + "step": 33082 + }, + { + "epoch": 2.6, + "learning_rate": 1.2769836072435035e-05, + "loss": 1.4396, + "step": 33083 + }, + { + "epoch": 2.6, + "learning_rate": 1.2764846258204348e-05, + "loss": 1.4453, + "step": 33084 + }, + { + "epoch": 2.6, + "learning_rate": 1.2759857375724603e-05, + "loss": 1.4878, + "step": 33085 + }, + { + "epoch": 2.6, + "learning_rate": 1.2754869425029673e-05, + "loss": 1.3883, + "step": 33086 + }, + { + "epoch": 2.6, + "learning_rate": 1.2749882406153466e-05, + "loss": 1.4459, + "step": 33087 + }, + { + "epoch": 2.6, + "learning_rate": 1.2744896319129822e-05, + "loss": 1.3688, + "step": 33088 + }, + { + "epoch": 2.6, + "learning_rate": 1.2739911163992561e-05, + "loss": 1.4771, + "step": 33089 + }, + { + "epoch": 2.6, + "learning_rate": 1.2734926940775574e-05, + "loss": 1.5112, + "step": 33090 + }, + { + "epoch": 2.6, + "learning_rate": 1.272994364951267e-05, + "loss": 1.4309, + "step": 33091 + }, + { + "epoch": 2.6, + "learning_rate": 1.2724961290237717e-05, + "loss": 1.4991, + "step": 33092 + }, + { + "epoch": 2.6, + "learning_rate": 1.2719979862984508e-05, + "loss": 1.4131, + "step": 33093 + }, + { + "epoch": 2.6, + "learning_rate": 1.2714999367786883e-05, + "loss": 1.4563, + "step": 33094 + }, + { + "epoch": 2.6, + "learning_rate": 1.2710019804678661e-05, + "loss": 1.4663, + "step": 33095 + }, + { + "epoch": 2.6, + "learning_rate": 1.270504117369362e-05, + "loss": 1.4705, + "step": 33096 + }, + { + "epoch": 2.6, + "learning_rate": 1.2700063474865613e-05, + "loss": 1.4679, + "step": 33097 + }, + { + "epoch": 2.6, + "learning_rate": 1.2695086708228398e-05, + "loss": 1.4518, + "step": 33098 + }, + { + "epoch": 2.6, + "learning_rate": 1.2690110873815746e-05, + "loss": 1.4317, + "step": 33099 + }, + { + "epoch": 2.6, + "learning_rate": 1.2685135971661498e-05, + "loss": 1.4494, + "step": 33100 + }, + { + "epoch": 2.6, + "learning_rate": 1.268016200179941e-05, + "loss": 1.4499, + "step": 33101 + }, + { + "epoch": 2.6, + "learning_rate": 1.2675188964263206e-05, + "loss": 1.4276, + "step": 33102 + }, + { + "epoch": 2.6, + "learning_rate": 1.2670216859086707e-05, + "loss": 1.4306, + "step": 33103 + }, + { + "epoch": 2.6, + "learning_rate": 1.2665245686303655e-05, + "loss": 1.4616, + "step": 33104 + }, + { + "epoch": 2.6, + "learning_rate": 1.2660275445947805e-05, + "loss": 1.4449, + "step": 33105 + }, + { + "epoch": 2.6, + "learning_rate": 1.2655306138052828e-05, + "loss": 1.4769, + "step": 33106 + }, + { + "epoch": 2.6, + "learning_rate": 1.2650337762652602e-05, + "loss": 1.4679, + "step": 33107 + }, + { + "epoch": 2.6, + "learning_rate": 1.2645370319780762e-05, + "loss": 1.4894, + "step": 33108 + }, + { + "epoch": 2.61, + "learning_rate": 1.2640403809471083e-05, + "loss": 1.4347, + "step": 33109 + }, + { + "epoch": 2.61, + "learning_rate": 1.2635438231757222e-05, + "loss": 1.4661, + "step": 33110 + }, + { + "epoch": 2.61, + "learning_rate": 1.2630473586672951e-05, + "loss": 1.4615, + "step": 33111 + }, + { + "epoch": 2.61, + "learning_rate": 1.262550987425196e-05, + "loss": 1.4069, + "step": 33112 + }, + { + "epoch": 2.61, + "learning_rate": 1.262054709452794e-05, + "loss": 1.437, + "step": 33113 + }, + { + "epoch": 2.61, + "learning_rate": 1.2615585247534593e-05, + "loss": 1.4516, + "step": 33114 + }, + { + "epoch": 2.61, + "learning_rate": 1.261062433330563e-05, + "loss": 1.4592, + "step": 33115 + }, + { + "epoch": 2.61, + "learning_rate": 1.2605664351874673e-05, + "loss": 1.4427, + "step": 33116 + }, + { + "epoch": 2.61, + "learning_rate": 1.260070530327546e-05, + "loss": 1.4491, + "step": 33117 + }, + { + "epoch": 2.61, + "learning_rate": 1.2595747187541633e-05, + "loss": 1.463, + "step": 33118 + }, + { + "epoch": 2.61, + "learning_rate": 1.259079000470683e-05, + "loss": 1.4524, + "step": 33119 + }, + { + "epoch": 2.61, + "learning_rate": 1.2585833754804775e-05, + "loss": 1.42, + "step": 33120 + }, + { + "epoch": 2.61, + "learning_rate": 1.2580878437869057e-05, + "loss": 1.3941, + "step": 33121 + }, + { + "epoch": 2.61, + "learning_rate": 1.2575924053933317e-05, + "loss": 1.4379, + "step": 33122 + }, + { + "epoch": 2.61, + "learning_rate": 1.2570970603031227e-05, + "loss": 1.4605, + "step": 33123 + }, + { + "epoch": 2.61, + "learning_rate": 1.2566018085196428e-05, + "loss": 1.4478, + "step": 33124 + }, + { + "epoch": 2.61, + "learning_rate": 1.2561066500462525e-05, + "loss": 1.4409, + "step": 33125 + }, + { + "epoch": 2.61, + "learning_rate": 1.255611584886314e-05, + "loss": 1.4394, + "step": 33126 + }, + { + "epoch": 2.61, + "learning_rate": 1.255116613043185e-05, + "loss": 1.465, + "step": 33127 + }, + { + "epoch": 2.61, + "learning_rate": 1.2546217345202308e-05, + "loss": 1.4051, + "step": 33128 + }, + { + "epoch": 2.61, + "learning_rate": 1.2541269493208107e-05, + "loss": 1.4446, + "step": 33129 + }, + { + "epoch": 2.61, + "learning_rate": 1.2536322574482816e-05, + "loss": 1.4654, + "step": 33130 + }, + { + "epoch": 2.61, + "learning_rate": 1.2531376589060043e-05, + "loss": 1.5024, + "step": 33131 + }, + { + "epoch": 2.61, + "learning_rate": 1.2526431536973363e-05, + "loss": 1.4542, + "step": 33132 + }, + { + "epoch": 2.61, + "learning_rate": 1.2521487418256331e-05, + "loss": 1.4906, + "step": 33133 + }, + { + "epoch": 2.61, + "learning_rate": 1.2516544232942554e-05, + "loss": 1.4667, + "step": 33134 + }, + { + "epoch": 2.61, + "learning_rate": 1.2511601981065572e-05, + "loss": 1.5069, + "step": 33135 + }, + { + "epoch": 2.61, + "learning_rate": 1.2506660662658907e-05, + "loss": 1.4216, + "step": 33136 + }, + { + "epoch": 2.61, + "learning_rate": 1.2501720277756183e-05, + "loss": 1.4554, + "step": 33137 + }, + { + "epoch": 2.61, + "learning_rate": 1.2496780826390857e-05, + "loss": 1.417, + "step": 33138 + }, + { + "epoch": 2.61, + "learning_rate": 1.249184230859655e-05, + "loss": 1.4269, + "step": 33139 + }, + { + "epoch": 2.61, + "learning_rate": 1.248690472440672e-05, + "loss": 1.4377, + "step": 33140 + }, + { + "epoch": 2.61, + "learning_rate": 1.2481968073854941e-05, + "loss": 1.4574, + "step": 33141 + }, + { + "epoch": 2.61, + "learning_rate": 1.2477032356974719e-05, + "loss": 1.4265, + "step": 33142 + }, + { + "epoch": 2.61, + "learning_rate": 1.2472097573799545e-05, + "loss": 1.4202, + "step": 33143 + }, + { + "epoch": 2.61, + "learning_rate": 1.2467163724362922e-05, + "loss": 1.422, + "step": 33144 + }, + { + "epoch": 2.61, + "learning_rate": 1.2462230808698375e-05, + "loss": 1.3917, + "step": 33145 + }, + { + "epoch": 2.61, + "learning_rate": 1.245729882683938e-05, + "loss": 1.4438, + "step": 33146 + }, + { + "epoch": 2.61, + "learning_rate": 1.2452367778819405e-05, + "loss": 1.4446, + "step": 33147 + }, + { + "epoch": 2.61, + "learning_rate": 1.2447437664671978e-05, + "loss": 1.4497, + "step": 33148 + }, + { + "epoch": 2.61, + "learning_rate": 1.2442508484430536e-05, + "loss": 1.4203, + "step": 33149 + }, + { + "epoch": 2.61, + "learning_rate": 1.243758023812852e-05, + "loss": 1.4536, + "step": 33150 + }, + { + "epoch": 2.61, + "learning_rate": 1.2432652925799452e-05, + "loss": 1.4576, + "step": 33151 + }, + { + "epoch": 2.61, + "learning_rate": 1.2427726547476758e-05, + "loss": 1.4422, + "step": 33152 + }, + { + "epoch": 2.61, + "learning_rate": 1.2422801103193841e-05, + "loss": 1.4359, + "step": 33153 + }, + { + "epoch": 2.61, + "learning_rate": 1.2417876592984195e-05, + "loss": 1.4272, + "step": 33154 + }, + { + "epoch": 2.61, + "learning_rate": 1.2412953016881271e-05, + "loss": 1.4939, + "step": 33155 + }, + { + "epoch": 2.61, + "learning_rate": 1.2408030374918466e-05, + "loss": 1.4506, + "step": 33156 + }, + { + "epoch": 2.61, + "learning_rate": 1.240310866712918e-05, + "loss": 1.4867, + "step": 33157 + }, + { + "epoch": 2.61, + "learning_rate": 1.2398187893546874e-05, + "loss": 1.4221, + "step": 33158 + }, + { + "epoch": 2.61, + "learning_rate": 1.2393268054204936e-05, + "loss": 1.4017, + "step": 33159 + }, + { + "epoch": 2.61, + "learning_rate": 1.2388349149136756e-05, + "loss": 1.5081, + "step": 33160 + }, + { + "epoch": 2.61, + "learning_rate": 1.2383431178375757e-05, + "loss": 1.49, + "step": 33161 + }, + { + "epoch": 2.61, + "learning_rate": 1.2378514141955331e-05, + "loss": 1.4922, + "step": 33162 + }, + { + "epoch": 2.61, + "learning_rate": 1.237359803990885e-05, + "loss": 1.4264, + "step": 33163 + }, + { + "epoch": 2.61, + "learning_rate": 1.2368682872269653e-05, + "loss": 1.431, + "step": 33164 + }, + { + "epoch": 2.61, + "learning_rate": 1.236376863907118e-05, + "loss": 1.4905, + "step": 33165 + }, + { + "epoch": 2.61, + "learning_rate": 1.2358855340346757e-05, + "loss": 1.3934, + "step": 33166 + }, + { + "epoch": 2.61, + "learning_rate": 1.2353942976129722e-05, + "loss": 1.4796, + "step": 33167 + }, + { + "epoch": 2.61, + "learning_rate": 1.2349031546453497e-05, + "loss": 1.485, + "step": 33168 + }, + { + "epoch": 2.61, + "learning_rate": 1.234412105135134e-05, + "loss": 1.4431, + "step": 33169 + }, + { + "epoch": 2.61, + "learning_rate": 1.2339211490856676e-05, + "loss": 1.4485, + "step": 33170 + }, + { + "epoch": 2.61, + "learning_rate": 1.2334302865002777e-05, + "loss": 1.4425, + "step": 33171 + }, + { + "epoch": 2.61, + "learning_rate": 1.2329395173822998e-05, + "loss": 1.42, + "step": 33172 + }, + { + "epoch": 2.61, + "learning_rate": 1.2324488417350664e-05, + "loss": 1.4256, + "step": 33173 + }, + { + "epoch": 2.61, + "learning_rate": 1.231958259561905e-05, + "loss": 1.4351, + "step": 33174 + }, + { + "epoch": 2.61, + "learning_rate": 1.2314677708661524e-05, + "loss": 1.4452, + "step": 33175 + }, + { + "epoch": 2.61, + "learning_rate": 1.2309773756511349e-05, + "loss": 1.4181, + "step": 33176 + }, + { + "epoch": 2.61, + "learning_rate": 1.2304870739201795e-05, + "loss": 1.4171, + "step": 33177 + }, + { + "epoch": 2.61, + "learning_rate": 1.2299968656766218e-05, + "loss": 1.461, + "step": 33178 + }, + { + "epoch": 2.61, + "learning_rate": 1.229506750923786e-05, + "loss": 1.4399, + "step": 33179 + }, + { + "epoch": 2.61, + "learning_rate": 1.2290167296650011e-05, + "loss": 1.444, + "step": 33180 + }, + { + "epoch": 2.61, + "learning_rate": 1.2285268019035893e-05, + "loss": 1.3954, + "step": 33181 + }, + { + "epoch": 2.61, + "learning_rate": 1.2280369676428847e-05, + "loss": 1.4186, + "step": 33182 + }, + { + "epoch": 2.61, + "learning_rate": 1.227547226886208e-05, + "loss": 1.4068, + "step": 33183 + }, + { + "epoch": 2.61, + "learning_rate": 1.2270575796368831e-05, + "loss": 1.4515, + "step": 33184 + }, + { + "epoch": 2.61, + "learning_rate": 1.2265680258982357e-05, + "loss": 1.4256, + "step": 33185 + }, + { + "epoch": 2.61, + "learning_rate": 1.2260785656735949e-05, + "loss": 1.4428, + "step": 33186 + }, + { + "epoch": 2.61, + "learning_rate": 1.225589198966278e-05, + "loss": 1.4364, + "step": 33187 + }, + { + "epoch": 2.61, + "learning_rate": 1.2250999257796074e-05, + "loss": 1.466, + "step": 33188 + }, + { + "epoch": 2.61, + "learning_rate": 1.2246107461169103e-05, + "loss": 1.4197, + "step": 33189 + }, + { + "epoch": 2.61, + "learning_rate": 1.2241216599815024e-05, + "loss": 1.4673, + "step": 33190 + }, + { + "epoch": 2.61, + "learning_rate": 1.2236326673767045e-05, + "loss": 1.4725, + "step": 33191 + }, + { + "epoch": 2.61, + "learning_rate": 1.223143768305842e-05, + "loss": 1.4643, + "step": 33192 + }, + { + "epoch": 2.61, + "learning_rate": 1.2226549627722293e-05, + "loss": 1.4298, + "step": 33193 + }, + { + "epoch": 2.61, + "learning_rate": 1.2221662507791835e-05, + "loss": 1.4611, + "step": 33194 + }, + { + "epoch": 2.61, + "learning_rate": 1.2216776323300286e-05, + "loss": 1.4964, + "step": 33195 + }, + { + "epoch": 2.61, + "learning_rate": 1.221189107428079e-05, + "loss": 1.448, + "step": 33196 + }, + { + "epoch": 2.61, + "learning_rate": 1.220700676076653e-05, + "loss": 1.4281, + "step": 33197 + }, + { + "epoch": 2.61, + "learning_rate": 1.2202123382790619e-05, + "loss": 1.4853, + "step": 33198 + }, + { + "epoch": 2.61, + "learning_rate": 1.2197240940386261e-05, + "loss": 1.441, + "step": 33199 + }, + { + "epoch": 2.61, + "learning_rate": 1.2192359433586596e-05, + "loss": 1.4073, + "step": 33200 + }, + { + "epoch": 2.61, + "learning_rate": 1.2187478862424716e-05, + "loss": 1.4335, + "step": 33201 + }, + { + "epoch": 2.61, + "learning_rate": 1.2182599226933858e-05, + "loss": 1.4247, + "step": 33202 + }, + { + "epoch": 2.61, + "learning_rate": 1.21777205271471e-05, + "loss": 1.4896, + "step": 33203 + }, + { + "epoch": 2.61, + "learning_rate": 1.2172842763097545e-05, + "loss": 1.436, + "step": 33204 + }, + { + "epoch": 2.61, + "learning_rate": 1.2167965934818319e-05, + "loss": 1.4253, + "step": 33205 + }, + { + "epoch": 2.61, + "learning_rate": 1.216309004234256e-05, + "loss": 1.4266, + "step": 33206 + }, + { + "epoch": 2.61, + "learning_rate": 1.215821508570336e-05, + "loss": 1.4684, + "step": 33207 + }, + { + "epoch": 2.61, + "learning_rate": 1.2153341064933791e-05, + "loss": 1.4156, + "step": 33208 + }, + { + "epoch": 2.61, + "learning_rate": 1.2148467980066978e-05, + "loss": 1.4743, + "step": 33209 + }, + { + "epoch": 2.61, + "learning_rate": 1.2143595831135994e-05, + "loss": 1.4395, + "step": 33210 + }, + { + "epoch": 2.61, + "learning_rate": 1.2138724618173912e-05, + "loss": 1.4754, + "step": 33211 + }, + { + "epoch": 2.61, + "learning_rate": 1.2133854341213823e-05, + "loss": 1.4355, + "step": 33212 + }, + { + "epoch": 2.61, + "learning_rate": 1.2128985000288782e-05, + "loss": 1.4568, + "step": 33213 + }, + { + "epoch": 2.61, + "learning_rate": 1.2124116595431832e-05, + "loss": 1.4339, + "step": 33214 + }, + { + "epoch": 2.61, + "learning_rate": 1.2119249126676062e-05, + "loss": 1.4409, + "step": 33215 + }, + { + "epoch": 2.61, + "learning_rate": 1.2114382594054478e-05, + "loss": 1.4312, + "step": 33216 + }, + { + "epoch": 2.61, + "learning_rate": 1.2109516997600172e-05, + "loss": 1.4677, + "step": 33217 + }, + { + "epoch": 2.61, + "learning_rate": 1.2104652337346116e-05, + "loss": 1.4893, + "step": 33218 + }, + { + "epoch": 2.61, + "learning_rate": 1.2099788613325418e-05, + "loss": 1.4474, + "step": 33219 + }, + { + "epoch": 2.61, + "learning_rate": 1.209492582557105e-05, + "loss": 1.4716, + "step": 33220 + }, + { + "epoch": 2.61, + "learning_rate": 1.2090063974116021e-05, + "loss": 1.4471, + "step": 33221 + }, + { + "epoch": 2.61, + "learning_rate": 1.2085203058993337e-05, + "loss": 1.4735, + "step": 33222 + }, + { + "epoch": 2.61, + "learning_rate": 1.2080343080236037e-05, + "loss": 1.4579, + "step": 33223 + }, + { + "epoch": 2.61, + "learning_rate": 1.2075484037877099e-05, + "loss": 1.4759, + "step": 33224 + }, + { + "epoch": 2.61, + "learning_rate": 1.207062593194949e-05, + "loss": 1.3864, + "step": 33225 + }, + { + "epoch": 2.61, + "learning_rate": 1.2065768762486238e-05, + "loss": 1.4314, + "step": 33226 + }, + { + "epoch": 2.61, + "learning_rate": 1.20609125295203e-05, + "loss": 1.4382, + "step": 33227 + }, + { + "epoch": 2.61, + "learning_rate": 1.2056057233084614e-05, + "loss": 1.4793, + "step": 33228 + }, + { + "epoch": 2.61, + "learning_rate": 1.2051202873212206e-05, + "loss": 1.4198, + "step": 33229 + }, + { + "epoch": 2.61, + "learning_rate": 1.2046349449936e-05, + "loss": 1.4044, + "step": 33230 + }, + { + "epoch": 2.61, + "learning_rate": 1.2041496963288933e-05, + "loss": 1.4188, + "step": 33231 + }, + { + "epoch": 2.61, + "learning_rate": 1.2036645413303964e-05, + "loss": 1.4771, + "step": 33232 + }, + { + "epoch": 2.61, + "learning_rate": 1.2031794800014066e-05, + "loss": 1.4516, + "step": 33233 + }, + { + "epoch": 2.61, + "learning_rate": 1.2026945123452131e-05, + "loss": 1.4243, + "step": 33234 + }, + { + "epoch": 2.61, + "learning_rate": 1.2022096383651097e-05, + "loss": 1.4097, + "step": 33235 + }, + { + "epoch": 2.62, + "learning_rate": 1.201724858064389e-05, + "loss": 1.4527, + "step": 33236 + }, + { + "epoch": 2.62, + "learning_rate": 1.2012401714463433e-05, + "loss": 1.4675, + "step": 33237 + }, + { + "epoch": 2.62, + "learning_rate": 1.2007555785142613e-05, + "loss": 1.4227, + "step": 33238 + }, + { + "epoch": 2.62, + "learning_rate": 1.2002710792714325e-05, + "loss": 1.4386, + "step": 33239 + }, + { + "epoch": 2.62, + "learning_rate": 1.1997866737211493e-05, + "loss": 1.4632, + "step": 33240 + }, + { + "epoch": 2.62, + "learning_rate": 1.1993023618666986e-05, + "loss": 1.3934, + "step": 33241 + }, + { + "epoch": 2.62, + "learning_rate": 1.1988181437113681e-05, + "loss": 1.4369, + "step": 33242 + }, + { + "epoch": 2.62, + "learning_rate": 1.1983340192584467e-05, + "loss": 1.4635, + "step": 33243 + }, + { + "epoch": 2.62, + "learning_rate": 1.1978499885112236e-05, + "loss": 1.4212, + "step": 33244 + }, + { + "epoch": 2.62, + "learning_rate": 1.1973660514729776e-05, + "loss": 1.4126, + "step": 33245 + }, + { + "epoch": 2.62, + "learning_rate": 1.1968822081470031e-05, + "loss": 1.4785, + "step": 33246 + }, + { + "epoch": 2.62, + "learning_rate": 1.1963984585365805e-05, + "loss": 1.4788, + "step": 33247 + }, + { + "epoch": 2.62, + "learning_rate": 1.1959148026449922e-05, + "loss": 1.4101, + "step": 33248 + }, + { + "epoch": 2.62, + "learning_rate": 1.1954312404755239e-05, + "loss": 1.4699, + "step": 33249 + }, + { + "epoch": 2.62, + "learning_rate": 1.1949477720314631e-05, + "loss": 1.4304, + "step": 33250 + }, + { + "epoch": 2.62, + "learning_rate": 1.194464397316089e-05, + "loss": 1.4212, + "step": 33251 + }, + { + "epoch": 2.62, + "learning_rate": 1.1939811163326801e-05, + "loss": 1.439, + "step": 33252 + }, + { + "epoch": 2.62, + "learning_rate": 1.1934979290845242e-05, + "loss": 1.4203, + "step": 33253 + }, + { + "epoch": 2.62, + "learning_rate": 1.193014835574897e-05, + "loss": 1.402, + "step": 33254 + }, + { + "epoch": 2.62, + "learning_rate": 1.1925318358070773e-05, + "loss": 1.4226, + "step": 33255 + }, + { + "epoch": 2.62, + "learning_rate": 1.1920489297843493e-05, + "loss": 1.4486, + "step": 33256 + }, + { + "epoch": 2.62, + "learning_rate": 1.1915661175099905e-05, + "loss": 1.43, + "step": 33257 + }, + { + "epoch": 2.62, + "learning_rate": 1.1910833989872765e-05, + "loss": 1.4662, + "step": 33258 + }, + { + "epoch": 2.62, + "learning_rate": 1.1906007742194829e-05, + "loss": 1.4458, + "step": 33259 + }, + { + "epoch": 2.62, + "learning_rate": 1.1901182432098921e-05, + "loss": 1.4126, + "step": 33260 + }, + { + "epoch": 2.62, + "learning_rate": 1.1896358059617784e-05, + "loss": 1.4858, + "step": 33261 + }, + { + "epoch": 2.62, + "learning_rate": 1.1891534624784139e-05, + "loss": 1.4244, + "step": 33262 + }, + { + "epoch": 2.62, + "learning_rate": 1.188671212763076e-05, + "loss": 1.4632, + "step": 33263 + }, + { + "epoch": 2.62, + "learning_rate": 1.1881890568190406e-05, + "loss": 1.3876, + "step": 33264 + }, + { + "epoch": 2.62, + "learning_rate": 1.1877069946495798e-05, + "loss": 1.4583, + "step": 33265 + }, + { + "epoch": 2.62, + "learning_rate": 1.187225026257963e-05, + "loss": 1.4568, + "step": 33266 + }, + { + "epoch": 2.62, + "learning_rate": 1.186743151647469e-05, + "loss": 1.5062, + "step": 33267 + }, + { + "epoch": 2.62, + "learning_rate": 1.1862613708213654e-05, + "loss": 1.4513, + "step": 33268 + }, + { + "epoch": 2.62, + "learning_rate": 1.1857796837829225e-05, + "loss": 1.4474, + "step": 33269 + }, + { + "epoch": 2.62, + "learning_rate": 1.1852980905354147e-05, + "loss": 1.4436, + "step": 33270 + }, + { + "epoch": 2.62, + "learning_rate": 1.1848165910821095e-05, + "loss": 1.4899, + "step": 33271 + }, + { + "epoch": 2.62, + "learning_rate": 1.1843351854262723e-05, + "loss": 1.4398, + "step": 33272 + }, + { + "epoch": 2.62, + "learning_rate": 1.1838538735711789e-05, + "loss": 1.452, + "step": 33273 + }, + { + "epoch": 2.62, + "learning_rate": 1.1833726555200918e-05, + "loss": 1.4186, + "step": 33274 + }, + { + "epoch": 2.62, + "learning_rate": 1.1828915312762815e-05, + "loss": 1.4927, + "step": 33275 + }, + { + "epoch": 2.62, + "learning_rate": 1.182410500843009e-05, + "loss": 1.4225, + "step": 33276 + }, + { + "epoch": 2.62, + "learning_rate": 1.1819295642235466e-05, + "loss": 1.4605, + "step": 33277 + }, + { + "epoch": 2.62, + "learning_rate": 1.1814487214211566e-05, + "loss": 1.4552, + "step": 33278 + }, + { + "epoch": 2.62, + "learning_rate": 1.180967972439103e-05, + "loss": 1.4338, + "step": 33279 + }, + { + "epoch": 2.62, + "learning_rate": 1.18048731728065e-05, + "loss": 1.4886, + "step": 33280 + }, + { + "epoch": 2.62, + "learning_rate": 1.1800067559490634e-05, + "loss": 1.439, + "step": 33281 + }, + { + "epoch": 2.62, + "learning_rate": 1.179526288447607e-05, + "loss": 1.4546, + "step": 33282 + }, + { + "epoch": 2.62, + "learning_rate": 1.179045914779535e-05, + "loss": 1.4898, + "step": 33283 + }, + { + "epoch": 2.62, + "learning_rate": 1.1785656349481182e-05, + "loss": 1.3988, + "step": 33284 + }, + { + "epoch": 2.62, + "learning_rate": 1.1780854489566138e-05, + "loss": 1.4108, + "step": 33285 + }, + { + "epoch": 2.62, + "learning_rate": 1.1776053568082777e-05, + "loss": 1.4667, + "step": 33286 + }, + { + "epoch": 2.62, + "learning_rate": 1.1771253585063773e-05, + "loss": 1.4585, + "step": 33287 + }, + { + "epoch": 2.62, + "learning_rate": 1.176645454054168e-05, + "loss": 1.4205, + "step": 33288 + }, + { + "epoch": 2.62, + "learning_rate": 1.1761656434549043e-05, + "loss": 1.4202, + "step": 33289 + }, + { + "epoch": 2.62, + "learning_rate": 1.1756859267118484e-05, + "loss": 1.4947, + "step": 33290 + }, + { + "epoch": 2.62, + "learning_rate": 1.1752063038282578e-05, + "loss": 1.4321, + "step": 33291 + }, + { + "epoch": 2.62, + "learning_rate": 1.174726774807388e-05, + "loss": 1.4811, + "step": 33292 + }, + { + "epoch": 2.62, + "learning_rate": 1.1742473396524899e-05, + "loss": 1.4592, + "step": 33293 + }, + { + "epoch": 2.62, + "learning_rate": 1.1737679983668258e-05, + "loss": 1.4916, + "step": 33294 + }, + { + "epoch": 2.62, + "learning_rate": 1.1732887509536449e-05, + "loss": 1.4682, + "step": 33295 + }, + { + "epoch": 2.62, + "learning_rate": 1.1728095974162044e-05, + "loss": 1.3975, + "step": 33296 + }, + { + "epoch": 2.62, + "learning_rate": 1.1723305377577552e-05, + "loss": 1.4814, + "step": 33297 + }, + { + "epoch": 2.62, + "learning_rate": 1.171851571981553e-05, + "loss": 1.3994, + "step": 33298 + }, + { + "epoch": 2.62, + "learning_rate": 1.1713727000908468e-05, + "loss": 1.4316, + "step": 33299 + }, + { + "epoch": 2.62, + "learning_rate": 1.1708939220888875e-05, + "loss": 1.4791, + "step": 33300 + }, + { + "epoch": 2.62, + "learning_rate": 1.170415237978929e-05, + "loss": 1.4242, + "step": 33301 + }, + { + "epoch": 2.62, + "learning_rate": 1.1699366477642186e-05, + "loss": 1.4108, + "step": 33302 + }, + { + "epoch": 2.62, + "learning_rate": 1.169458151448004e-05, + "loss": 1.4721, + "step": 33303 + }, + { + "epoch": 2.62, + "learning_rate": 1.1689797490335389e-05, + "loss": 1.4121, + "step": 33304 + }, + { + "epoch": 2.62, + "learning_rate": 1.1685014405240695e-05, + "loss": 1.4591, + "step": 33305 + }, + { + "epoch": 2.62, + "learning_rate": 1.1680232259228395e-05, + "loss": 1.472, + "step": 33306 + }, + { + "epoch": 2.62, + "learning_rate": 1.1675451052331015e-05, + "loss": 1.476, + "step": 33307 + }, + { + "epoch": 2.62, + "learning_rate": 1.1670670784580977e-05, + "loss": 1.3924, + "step": 33308 + }, + { + "epoch": 2.62, + "learning_rate": 1.1665891456010756e-05, + "loss": 1.4494, + "step": 33309 + }, + { + "epoch": 2.62, + "learning_rate": 1.1661113066652761e-05, + "loss": 1.433, + "step": 33310 + }, + { + "epoch": 2.62, + "learning_rate": 1.1656335616539481e-05, + "loss": 1.4576, + "step": 33311 + }, + { + "epoch": 2.62, + "learning_rate": 1.165155910570334e-05, + "loss": 1.4676, + "step": 33312 + }, + { + "epoch": 2.62, + "learning_rate": 1.1646783534176763e-05, + "loss": 1.4785, + "step": 33313 + }, + { + "epoch": 2.62, + "learning_rate": 1.1642008901992189e-05, + "loss": 1.4364, + "step": 33314 + }, + { + "epoch": 2.62, + "learning_rate": 1.1637235209182027e-05, + "loss": 1.4317, + "step": 33315 + }, + { + "epoch": 2.62, + "learning_rate": 1.1632462455778685e-05, + "loss": 1.4398, + "step": 33316 + }, + { + "epoch": 2.62, + "learning_rate": 1.1627690641814535e-05, + "loss": 1.428, + "step": 33317 + }, + { + "epoch": 2.62, + "learning_rate": 1.1622919767322036e-05, + "loss": 1.4232, + "step": 33318 + }, + { + "epoch": 2.62, + "learning_rate": 1.1618149832333545e-05, + "loss": 1.4572, + "step": 33319 + }, + { + "epoch": 2.62, + "learning_rate": 1.161338083688142e-05, + "loss": 1.4597, + "step": 33320 + }, + { + "epoch": 2.62, + "learning_rate": 1.16086127809981e-05, + "loss": 1.4017, + "step": 33321 + }, + { + "epoch": 2.62, + "learning_rate": 1.1603845664715928e-05, + "loss": 1.4383, + "step": 33322 + }, + { + "epoch": 2.62, + "learning_rate": 1.1599079488067258e-05, + "loss": 1.4416, + "step": 33323 + }, + { + "epoch": 2.62, + "learning_rate": 1.1594314251084469e-05, + "loss": 1.4559, + "step": 33324 + }, + { + "epoch": 2.62, + "learning_rate": 1.1589549953799914e-05, + "loss": 1.4438, + "step": 33325 + }, + { + "epoch": 2.62, + "learning_rate": 1.158478659624592e-05, + "loss": 1.4809, + "step": 33326 + }, + { + "epoch": 2.62, + "learning_rate": 1.1580024178454827e-05, + "loss": 1.4245, + "step": 33327 + }, + { + "epoch": 2.62, + "learning_rate": 1.1575262700459026e-05, + "loss": 1.4468, + "step": 33328 + }, + { + "epoch": 2.62, + "learning_rate": 1.157050216229079e-05, + "loss": 1.3753, + "step": 33329 + }, + { + "epoch": 2.62, + "learning_rate": 1.1565742563982427e-05, + "loss": 1.4104, + "step": 33330 + }, + { + "epoch": 2.62, + "learning_rate": 1.1560983905566295e-05, + "loss": 1.4581, + "step": 33331 + }, + { + "epoch": 2.62, + "learning_rate": 1.1556226187074701e-05, + "loss": 1.4223, + "step": 33332 + }, + { + "epoch": 2.62, + "learning_rate": 1.1551469408539921e-05, + "loss": 1.4567, + "step": 33333 + }, + { + "epoch": 2.62, + "learning_rate": 1.1546713569994243e-05, + "loss": 1.4615, + "step": 33334 + }, + { + "epoch": 2.62, + "learning_rate": 1.1541958671469993e-05, + "loss": 1.4417, + "step": 33335 + }, + { + "epoch": 2.62, + "learning_rate": 1.1537204712999443e-05, + "loss": 1.4154, + "step": 33336 + }, + { + "epoch": 2.62, + "learning_rate": 1.1532451694614836e-05, + "loss": 1.513, + "step": 33337 + }, + { + "epoch": 2.62, + "learning_rate": 1.1527699616348497e-05, + "loss": 1.4544, + "step": 33338 + }, + { + "epoch": 2.62, + "learning_rate": 1.1522948478232646e-05, + "loss": 1.4393, + "step": 33339 + }, + { + "epoch": 2.62, + "learning_rate": 1.1518198280299545e-05, + "loss": 1.4454, + "step": 33340 + }, + { + "epoch": 2.62, + "learning_rate": 1.1513449022581483e-05, + "loss": 1.4481, + "step": 33341 + }, + { + "epoch": 2.62, + "learning_rate": 1.1508700705110651e-05, + "loss": 1.418, + "step": 33342 + }, + { + "epoch": 2.62, + "learning_rate": 1.1503953327919341e-05, + "loss": 1.4463, + "step": 33343 + }, + { + "epoch": 2.62, + "learning_rate": 1.1499206891039742e-05, + "loss": 1.4844, + "step": 33344 + }, + { + "epoch": 2.62, + "learning_rate": 1.1494461394504113e-05, + "loss": 1.4737, + "step": 33345 + }, + { + "epoch": 2.62, + "learning_rate": 1.1489716838344659e-05, + "loss": 1.4425, + "step": 33346 + }, + { + "epoch": 2.62, + "learning_rate": 1.1484973222593574e-05, + "loss": 1.4269, + "step": 33347 + }, + { + "epoch": 2.62, + "learning_rate": 1.1480230547283098e-05, + "loss": 1.4287, + "step": 33348 + }, + { + "epoch": 2.62, + "learning_rate": 1.1475488812445405e-05, + "loss": 1.4372, + "step": 33349 + }, + { + "epoch": 2.62, + "learning_rate": 1.1470748018112719e-05, + "loss": 1.4578, + "step": 33350 + }, + { + "epoch": 2.62, + "learning_rate": 1.146600816431718e-05, + "loss": 1.486, + "step": 33351 + }, + { + "epoch": 2.62, + "learning_rate": 1.1461269251091015e-05, + "loss": 1.3577, + "step": 33352 + }, + { + "epoch": 2.62, + "learning_rate": 1.145653127846638e-05, + "loss": 1.4566, + "step": 33353 + }, + { + "epoch": 2.62, + "learning_rate": 1.1451794246475415e-05, + "loss": 1.4551, + "step": 33354 + }, + { + "epoch": 2.62, + "learning_rate": 1.144705815515033e-05, + "loss": 1.4771, + "step": 33355 + }, + { + "epoch": 2.62, + "learning_rate": 1.144232300452328e-05, + "loss": 1.4081, + "step": 33356 + }, + { + "epoch": 2.62, + "learning_rate": 1.1437588794626357e-05, + "loss": 1.438, + "step": 33357 + }, + { + "epoch": 2.62, + "learning_rate": 1.1432855525491735e-05, + "loss": 1.5003, + "step": 33358 + }, + { + "epoch": 2.62, + "learning_rate": 1.142812319715159e-05, + "loss": 1.4508, + "step": 33359 + }, + { + "epoch": 2.62, + "learning_rate": 1.142339180963801e-05, + "loss": 1.4584, + "step": 33360 + }, + { + "epoch": 2.62, + "learning_rate": 1.1418661362983106e-05, + "loss": 1.4498, + "step": 33361 + }, + { + "epoch": 2.62, + "learning_rate": 1.141393185721905e-05, + "loss": 1.4418, + "step": 33362 + }, + { + "epoch": 2.63, + "learning_rate": 1.1409203292377917e-05, + "loss": 1.4359, + "step": 33363 + }, + { + "epoch": 2.63, + "learning_rate": 1.140447566849178e-05, + "loss": 1.4076, + "step": 33364 + }, + { + "epoch": 2.63, + "learning_rate": 1.1399748985592799e-05, + "loss": 1.471, + "step": 33365 + }, + { + "epoch": 2.63, + "learning_rate": 1.139502324371303e-05, + "loss": 1.4293, + "step": 33366 + }, + { + "epoch": 2.63, + "learning_rate": 1.1390298442884549e-05, + "loss": 1.4737, + "step": 33367 + }, + { + "epoch": 2.63, + "learning_rate": 1.1385574583139462e-05, + "loss": 1.4161, + "step": 33368 + }, + { + "epoch": 2.63, + "learning_rate": 1.1380851664509843e-05, + "loss": 1.4523, + "step": 33369 + }, + { + "epoch": 2.63, + "learning_rate": 1.1376129687027734e-05, + "loss": 1.4709, + "step": 33370 + }, + { + "epoch": 2.63, + "learning_rate": 1.1371408650725194e-05, + "loss": 1.4369, + "step": 33371 + }, + { + "epoch": 2.63, + "learning_rate": 1.1366688555634296e-05, + "loss": 1.424, + "step": 33372 + }, + { + "epoch": 2.63, + "learning_rate": 1.1361969401787064e-05, + "loss": 1.4266, + "step": 33373 + }, + { + "epoch": 2.63, + "learning_rate": 1.1357251189215588e-05, + "loss": 1.4069, + "step": 33374 + }, + { + "epoch": 2.63, + "learning_rate": 1.1352533917951828e-05, + "loss": 1.4695, + "step": 33375 + }, + { + "epoch": 2.63, + "learning_rate": 1.1347817588027875e-05, + "loss": 1.4601, + "step": 33376 + }, + { + "epoch": 2.63, + "learning_rate": 1.1343102199475734e-05, + "loss": 1.4404, + "step": 33377 + }, + { + "epoch": 2.63, + "learning_rate": 1.1338387752327382e-05, + "loss": 1.5036, + "step": 33378 + }, + { + "epoch": 2.63, + "learning_rate": 1.1333674246614876e-05, + "loss": 1.4573, + "step": 33379 + }, + { + "epoch": 2.63, + "learning_rate": 1.1328961682370208e-05, + "loss": 1.4493, + "step": 33380 + }, + { + "epoch": 2.63, + "learning_rate": 1.1324250059625333e-05, + "loss": 1.4887, + "step": 33381 + }, + { + "epoch": 2.63, + "learning_rate": 1.1319539378412312e-05, + "loss": 1.4427, + "step": 33382 + }, + { + "epoch": 2.63, + "learning_rate": 1.1314829638763085e-05, + "loss": 1.4627, + "step": 33383 + }, + { + "epoch": 2.63, + "learning_rate": 1.131012084070959e-05, + "loss": 1.4002, + "step": 33384 + }, + { + "epoch": 2.63, + "learning_rate": 1.1305412984283874e-05, + "loss": 1.4131, + "step": 33385 + }, + { + "epoch": 2.63, + "learning_rate": 1.1300706069517873e-05, + "loss": 1.4688, + "step": 33386 + }, + { + "epoch": 2.63, + "learning_rate": 1.129600009644353e-05, + "loss": 1.5071, + "step": 33387 + }, + { + "epoch": 2.63, + "learning_rate": 1.129129506509277e-05, + "loss": 1.4567, + "step": 33388 + }, + { + "epoch": 2.63, + "learning_rate": 1.1286590975497583e-05, + "loss": 1.3918, + "step": 33389 + }, + { + "epoch": 2.63, + "learning_rate": 1.1281887827689929e-05, + "loss": 1.4172, + "step": 33390 + }, + { + "epoch": 2.63, + "learning_rate": 1.1277185621701695e-05, + "loss": 1.4397, + "step": 33391 + }, + { + "epoch": 2.63, + "learning_rate": 1.1272484357564776e-05, + "loss": 1.4068, + "step": 33392 + }, + { + "epoch": 2.63, + "learning_rate": 1.1267784035311178e-05, + "loss": 1.3761, + "step": 33393 + }, + { + "epoch": 2.63, + "learning_rate": 1.126308465497276e-05, + "loss": 1.4928, + "step": 33394 + }, + { + "epoch": 2.63, + "learning_rate": 1.125838621658141e-05, + "loss": 1.4341, + "step": 33395 + }, + { + "epoch": 2.63, + "learning_rate": 1.125368872016909e-05, + "loss": 1.4345, + "step": 33396 + }, + { + "epoch": 2.63, + "learning_rate": 1.124899216576764e-05, + "loss": 1.4496, + "step": 33397 + }, + { + "epoch": 2.63, + "learning_rate": 1.124429655340895e-05, + "loss": 1.4106, + "step": 33398 + }, + { + "epoch": 2.63, + "learning_rate": 1.1239601883124944e-05, + "loss": 1.4463, + "step": 33399 + }, + { + "epoch": 2.63, + "learning_rate": 1.1234908154947447e-05, + "loss": 1.4616, + "step": 33400 + }, + { + "epoch": 2.63, + "learning_rate": 1.1230215368908335e-05, + "loss": 1.4866, + "step": 33401 + }, + { + "epoch": 2.63, + "learning_rate": 1.1225523525039514e-05, + "loss": 1.4231, + "step": 33402 + }, + { + "epoch": 2.63, + "learning_rate": 1.1220832623372795e-05, + "loss": 1.4536, + "step": 33403 + }, + { + "epoch": 2.63, + "learning_rate": 1.1216142663940048e-05, + "loss": 1.4557, + "step": 33404 + }, + { + "epoch": 2.63, + "learning_rate": 1.1211453646773033e-05, + "loss": 1.4729, + "step": 33405 + }, + { + "epoch": 2.63, + "learning_rate": 1.1206765571903725e-05, + "loss": 1.4542, + "step": 33406 + }, + { + "epoch": 2.63, + "learning_rate": 1.1202078439363881e-05, + "loss": 1.4813, + "step": 33407 + }, + { + "epoch": 2.63, + "learning_rate": 1.1197392249185343e-05, + "loss": 1.4561, + "step": 33408 + }, + { + "epoch": 2.63, + "learning_rate": 1.119270700139987e-05, + "loss": 1.4532, + "step": 33409 + }, + { + "epoch": 2.63, + "learning_rate": 1.118802269603935e-05, + "loss": 1.389, + "step": 33410 + }, + { + "epoch": 2.63, + "learning_rate": 1.118333933313556e-05, + "loss": 1.4577, + "step": 33411 + }, + { + "epoch": 2.63, + "learning_rate": 1.1178656912720257e-05, + "loss": 1.4325, + "step": 33412 + }, + { + "epoch": 2.63, + "learning_rate": 1.1173975434825283e-05, + "loss": 1.4351, + "step": 33413 + }, + { + "epoch": 2.63, + "learning_rate": 1.1169294899482429e-05, + "loss": 1.4469, + "step": 33414 + }, + { + "epoch": 2.63, + "learning_rate": 1.1164615306723401e-05, + "loss": 1.4283, + "step": 33415 + }, + { + "epoch": 2.63, + "learning_rate": 1.1159936656580059e-05, + "loss": 1.4715, + "step": 33416 + }, + { + "epoch": 2.63, + "learning_rate": 1.1155258949084112e-05, + "loss": 1.4389, + "step": 33417 + }, + { + "epoch": 2.63, + "learning_rate": 1.1150582184267332e-05, + "loss": 1.4504, + "step": 33418 + }, + { + "epoch": 2.63, + "learning_rate": 1.1145906362161477e-05, + "loss": 1.4698, + "step": 33419 + }, + { + "epoch": 2.63, + "learning_rate": 1.1141231482798308e-05, + "loss": 1.4556, + "step": 33420 + }, + { + "epoch": 2.63, + "learning_rate": 1.113655754620953e-05, + "loss": 1.4868, + "step": 33421 + }, + { + "epoch": 2.63, + "learning_rate": 1.1131884552426884e-05, + "loss": 1.4741, + "step": 33422 + }, + { + "epoch": 2.63, + "learning_rate": 1.112721250148213e-05, + "loss": 1.4831, + "step": 33423 + }, + { + "epoch": 2.63, + "learning_rate": 1.1122541393406976e-05, + "loss": 1.4501, + "step": 33424 + }, + { + "epoch": 2.63, + "learning_rate": 1.1117871228233093e-05, + "loss": 1.4348, + "step": 33425 + }, + { + "epoch": 2.63, + "learning_rate": 1.1113202005992244e-05, + "loss": 1.4791, + "step": 33426 + }, + { + "epoch": 2.63, + "learning_rate": 1.1108533726716117e-05, + "loss": 1.4012, + "step": 33427 + }, + { + "epoch": 2.63, + "learning_rate": 1.1103866390436406e-05, + "loss": 1.4088, + "step": 33428 + }, + { + "epoch": 2.63, + "learning_rate": 1.1099199997184766e-05, + "loss": 1.4644, + "step": 33429 + }, + { + "epoch": 2.63, + "learning_rate": 1.1094534546992923e-05, + "loss": 1.4243, + "step": 33430 + }, + { + "epoch": 2.63, + "learning_rate": 1.1089870039892551e-05, + "loss": 1.4119, + "step": 33431 + }, + { + "epoch": 2.63, + "learning_rate": 1.108520647591526e-05, + "loss": 1.4193, + "step": 33432 + }, + { + "epoch": 2.63, + "learning_rate": 1.1080543855092789e-05, + "loss": 1.4311, + "step": 33433 + }, + { + "epoch": 2.63, + "learning_rate": 1.1075882177456763e-05, + "loss": 1.4943, + "step": 33434 + }, + { + "epoch": 2.63, + "learning_rate": 1.1071221443038808e-05, + "loss": 1.4194, + "step": 33435 + }, + { + "epoch": 2.63, + "learning_rate": 1.1066561651870598e-05, + "loss": 1.4426, + "step": 33436 + }, + { + "epoch": 2.63, + "learning_rate": 1.106190280398379e-05, + "loss": 1.4016, + "step": 33437 + }, + { + "epoch": 2.63, + "learning_rate": 1.1057244899409978e-05, + "loss": 1.4096, + "step": 33438 + }, + { + "epoch": 2.63, + "learning_rate": 1.1052587938180785e-05, + "loss": 1.4339, + "step": 33439 + }, + { + "epoch": 2.63, + "learning_rate": 1.1047931920327868e-05, + "loss": 1.4542, + "step": 33440 + }, + { + "epoch": 2.63, + "learning_rate": 1.1043276845882804e-05, + "loss": 1.4467, + "step": 33441 + }, + { + "epoch": 2.63, + "learning_rate": 1.1038622714877183e-05, + "loss": 1.3961, + "step": 33442 + }, + { + "epoch": 2.63, + "learning_rate": 1.1033969527342662e-05, + "loss": 1.4596, + "step": 33443 + }, + { + "epoch": 2.63, + "learning_rate": 1.1029317283310785e-05, + "loss": 1.4611, + "step": 33444 + }, + { + "epoch": 2.63, + "learning_rate": 1.1024665982813175e-05, + "loss": 1.4615, + "step": 33445 + }, + { + "epoch": 2.63, + "learning_rate": 1.102001562588134e-05, + "loss": 1.4447, + "step": 33446 + }, + { + "epoch": 2.63, + "learning_rate": 1.1015366212546955e-05, + "loss": 1.3961, + "step": 33447 + }, + { + "epoch": 2.63, + "learning_rate": 1.1010717742841512e-05, + "loss": 1.4673, + "step": 33448 + }, + { + "epoch": 2.63, + "learning_rate": 1.1006070216796586e-05, + "loss": 1.4965, + "step": 33449 + }, + { + "epoch": 2.63, + "learning_rate": 1.1001423634443751e-05, + "loss": 1.4707, + "step": 33450 + }, + { + "epoch": 2.63, + "learning_rate": 1.0996777995814566e-05, + "loss": 1.465, + "step": 33451 + }, + { + "epoch": 2.63, + "learning_rate": 1.0992133300940502e-05, + "loss": 1.4571, + "step": 33452 + }, + { + "epoch": 2.63, + "learning_rate": 1.0987489549853157e-05, + "loss": 1.4086, + "step": 33453 + }, + { + "epoch": 2.63, + "learning_rate": 1.0982846742584051e-05, + "loss": 1.4663, + "step": 33454 + }, + { + "epoch": 2.63, + "learning_rate": 1.0978204879164726e-05, + "loss": 1.4249, + "step": 33455 + }, + { + "epoch": 2.63, + "learning_rate": 1.0973563959626624e-05, + "loss": 1.4147, + "step": 33456 + }, + { + "epoch": 2.63, + "learning_rate": 1.0968923984001338e-05, + "loss": 1.4653, + "step": 33457 + }, + { + "epoch": 2.63, + "learning_rate": 1.0964284952320324e-05, + "loss": 1.4452, + "step": 33458 + }, + { + "epoch": 2.63, + "learning_rate": 1.0959646864615074e-05, + "loss": 1.5085, + "step": 33459 + }, + { + "epoch": 2.63, + "learning_rate": 1.0955009720917113e-05, + "loss": 1.4832, + "step": 33460 + }, + { + "epoch": 2.63, + "learning_rate": 1.0950373521257915e-05, + "loss": 1.4811, + "step": 33461 + }, + { + "epoch": 2.63, + "learning_rate": 1.0945738265668941e-05, + "loss": 1.4636, + "step": 33462 + }, + { + "epoch": 2.63, + "learning_rate": 1.094110395418163e-05, + "loss": 1.4637, + "step": 33463 + }, + { + "epoch": 2.63, + "learning_rate": 1.0936470586827523e-05, + "loss": 1.4339, + "step": 33464 + }, + { + "epoch": 2.63, + "learning_rate": 1.0931838163638029e-05, + "loss": 1.5104, + "step": 33465 + }, + { + "epoch": 2.63, + "learning_rate": 1.092720668464459e-05, + "loss": 1.4567, + "step": 33466 + }, + { + "epoch": 2.63, + "learning_rate": 1.0922576149878698e-05, + "loss": 1.4559, + "step": 33467 + }, + { + "epoch": 2.63, + "learning_rate": 1.0917946559371743e-05, + "loss": 1.4681, + "step": 33468 + }, + { + "epoch": 2.63, + "learning_rate": 1.0913317913155201e-05, + "loss": 1.4625, + "step": 33469 + }, + { + "epoch": 2.63, + "learning_rate": 1.0908690211260446e-05, + "loss": 1.4705, + "step": 33470 + }, + { + "epoch": 2.63, + "learning_rate": 1.090406345371897e-05, + "loss": 1.4034, + "step": 33471 + }, + { + "epoch": 2.63, + "learning_rate": 1.0899437640562114e-05, + "loss": 1.4446, + "step": 33472 + }, + { + "epoch": 2.63, + "learning_rate": 1.0894812771821321e-05, + "loss": 1.464, + "step": 33473 + }, + { + "epoch": 2.63, + "learning_rate": 1.089018884752798e-05, + "loss": 1.4658, + "step": 33474 + }, + { + "epoch": 2.63, + "learning_rate": 1.0885565867713503e-05, + "loss": 1.4191, + "step": 33475 + }, + { + "epoch": 2.63, + "learning_rate": 1.0880943832409244e-05, + "loss": 1.4176, + "step": 33476 + }, + { + "epoch": 2.63, + "learning_rate": 1.087632274164663e-05, + "loss": 1.4719, + "step": 33477 + }, + { + "epoch": 2.63, + "learning_rate": 1.0871702595457005e-05, + "loss": 1.4867, + "step": 33478 + }, + { + "epoch": 2.63, + "learning_rate": 1.0867083393871723e-05, + "loss": 1.3905, + "step": 33479 + }, + { + "epoch": 2.63, + "learning_rate": 1.0862465136922177e-05, + "loss": 1.4375, + "step": 33480 + }, + { + "epoch": 2.63, + "learning_rate": 1.085784782463971e-05, + "loss": 1.427, + "step": 33481 + }, + { + "epoch": 2.63, + "learning_rate": 1.0853231457055678e-05, + "loss": 1.4633, + "step": 33482 + }, + { + "epoch": 2.63, + "learning_rate": 1.0848616034201375e-05, + "loss": 1.4108, + "step": 33483 + }, + { + "epoch": 2.63, + "learning_rate": 1.0844001556108222e-05, + "loss": 1.3903, + "step": 33484 + }, + { + "epoch": 2.63, + "learning_rate": 1.08393880228075e-05, + "loss": 1.4432, + "step": 33485 + }, + { + "epoch": 2.63, + "learning_rate": 1.0834775434330545e-05, + "loss": 1.4345, + "step": 33486 + }, + { + "epoch": 2.63, + "learning_rate": 1.0830163790708635e-05, + "loss": 1.4307, + "step": 33487 + }, + { + "epoch": 2.63, + "learning_rate": 1.0825553091973143e-05, + "loss": 1.423, + "step": 33488 + }, + { + "epoch": 2.63, + "learning_rate": 1.0820943338155347e-05, + "loss": 1.449, + "step": 33489 + }, + { + "epoch": 2.64, + "learning_rate": 1.081633452928652e-05, + "loss": 1.4319, + "step": 33490 + }, + { + "epoch": 2.64, + "learning_rate": 1.0811726665397985e-05, + "loss": 1.4314, + "step": 33491 + }, + { + "epoch": 2.64, + "learning_rate": 1.080711974652102e-05, + "loss": 1.4301, + "step": 33492 + }, + { + "epoch": 2.64, + "learning_rate": 1.0802513772686866e-05, + "loss": 1.4851, + "step": 33493 + }, + { + "epoch": 2.64, + "learning_rate": 1.0797908743926865e-05, + "loss": 1.4468, + "step": 33494 + }, + { + "epoch": 2.64, + "learning_rate": 1.079330466027224e-05, + "loss": 1.3995, + "step": 33495 + }, + { + "epoch": 2.64, + "learning_rate": 1.0788701521754233e-05, + "loss": 1.4615, + "step": 33496 + }, + { + "epoch": 2.64, + "learning_rate": 1.078409932840414e-05, + "loss": 1.4251, + "step": 33497 + }, + { + "epoch": 2.64, + "learning_rate": 1.0779498080253196e-05, + "loss": 1.4642, + "step": 33498 + }, + { + "epoch": 2.64, + "learning_rate": 1.0774897777332597e-05, + "loss": 1.4842, + "step": 33499 + }, + { + "epoch": 2.64, + "learning_rate": 1.0770298419673618e-05, + "loss": 1.4336, + "step": 33500 + }, + { + "epoch": 2.64, + "learning_rate": 1.0765700007307498e-05, + "loss": 1.4288, + "step": 33501 + }, + { + "epoch": 2.64, + "learning_rate": 1.0761102540265449e-05, + "loss": 1.3825, + "step": 33502 + }, + { + "epoch": 2.64, + "learning_rate": 1.0756506018578676e-05, + "loss": 1.4391, + "step": 33503 + }, + { + "epoch": 2.64, + "learning_rate": 1.0751910442278338e-05, + "loss": 1.4196, + "step": 33504 + }, + { + "epoch": 2.64, + "learning_rate": 1.0747315811395729e-05, + "loss": 1.4621, + "step": 33505 + }, + { + "epoch": 2.64, + "learning_rate": 1.0742722125962005e-05, + "loss": 1.4637, + "step": 33506 + }, + { + "epoch": 2.64, + "learning_rate": 1.0738129386008309e-05, + "loss": 1.4677, + "step": 33507 + }, + { + "epoch": 2.64, + "learning_rate": 1.0733537591565899e-05, + "loss": 1.3819, + "step": 33508 + }, + { + "epoch": 2.64, + "learning_rate": 1.0728946742665917e-05, + "loss": 1.4268, + "step": 33509 + }, + { + "epoch": 2.64, + "learning_rate": 1.0724356839339504e-05, + "loss": 1.4324, + "step": 33510 + }, + { + "epoch": 2.64, + "learning_rate": 1.0719767881617868e-05, + "loss": 1.4499, + "step": 33511 + }, + { + "epoch": 2.64, + "learning_rate": 1.0715179869532153e-05, + "loss": 1.4485, + "step": 33512 + }, + { + "epoch": 2.64, + "learning_rate": 1.0710592803113466e-05, + "loss": 1.4195, + "step": 33513 + }, + { + "epoch": 2.64, + "learning_rate": 1.0706006682393014e-05, + "loss": 1.4504, + "step": 33514 + }, + { + "epoch": 2.64, + "learning_rate": 1.0701421507401892e-05, + "loss": 1.4305, + "step": 33515 + }, + { + "epoch": 2.64, + "learning_rate": 1.0696837278171271e-05, + "loss": 1.4188, + "step": 33516 + }, + { + "epoch": 2.64, + "learning_rate": 1.0692253994732231e-05, + "loss": 1.4695, + "step": 33517 + }, + { + "epoch": 2.64, + "learning_rate": 1.0687671657115926e-05, + "loss": 1.4866, + "step": 33518 + }, + { + "epoch": 2.64, + "learning_rate": 1.068309026535345e-05, + "loss": 1.3972, + "step": 33519 + }, + { + "epoch": 2.64, + "learning_rate": 1.0678509819475927e-05, + "loss": 1.4301, + "step": 33520 + }, + { + "epoch": 2.64, + "learning_rate": 1.06739303195144e-05, + "loss": 1.4208, + "step": 33521 + }, + { + "epoch": 2.64, + "learning_rate": 1.0669351765500011e-05, + "loss": 1.4364, + "step": 33522 + }, + { + "epoch": 2.64, + "learning_rate": 1.066477415746385e-05, + "loss": 1.5127, + "step": 33523 + }, + { + "epoch": 2.64, + "learning_rate": 1.0660197495436962e-05, + "loss": 1.4389, + "step": 33524 + }, + { + "epoch": 2.64, + "learning_rate": 1.0655621779450451e-05, + "loss": 1.5089, + "step": 33525 + }, + { + "epoch": 2.64, + "learning_rate": 1.0651047009535379e-05, + "loss": 1.4454, + "step": 33526 + }, + { + "epoch": 2.64, + "learning_rate": 1.064647318572277e-05, + "loss": 1.488, + "step": 33527 + }, + { + "epoch": 2.64, + "learning_rate": 1.0641900308043732e-05, + "loss": 1.4406, + "step": 33528 + }, + { + "epoch": 2.64, + "learning_rate": 1.0637328376529292e-05, + "loss": 1.4179, + "step": 33529 + }, + { + "epoch": 2.64, + "learning_rate": 1.0632757391210456e-05, + "loss": 1.4248, + "step": 33530 + }, + { + "epoch": 2.64, + "learning_rate": 1.0628187352118283e-05, + "loss": 1.4578, + "step": 33531 + }, + { + "epoch": 2.64, + "learning_rate": 1.062361825928385e-05, + "loss": 1.4475, + "step": 33532 + }, + { + "epoch": 2.64, + "learning_rate": 1.0619050112738115e-05, + "loss": 1.4519, + "step": 33533 + }, + { + "epoch": 2.64, + "learning_rate": 1.0614482912512101e-05, + "loss": 1.4483, + "step": 33534 + }, + { + "epoch": 2.64, + "learning_rate": 1.0609916658636835e-05, + "loss": 1.4718, + "step": 33535 + }, + { + "epoch": 2.64, + "learning_rate": 1.0605351351143327e-05, + "loss": 1.4553, + "step": 33536 + }, + { + "epoch": 2.64, + "learning_rate": 1.0600786990062531e-05, + "loss": 1.4008, + "step": 33537 + }, + { + "epoch": 2.64, + "learning_rate": 1.0596223575425495e-05, + "loss": 1.4646, + "step": 33538 + }, + { + "epoch": 2.64, + "learning_rate": 1.0591661107263173e-05, + "loss": 1.4276, + "step": 33539 + }, + { + "epoch": 2.64, + "learning_rate": 1.058709958560654e-05, + "loss": 1.4623, + "step": 33540 + }, + { + "epoch": 2.64, + "learning_rate": 1.0582539010486524e-05, + "loss": 1.4115, + "step": 33541 + }, + { + "epoch": 2.64, + "learning_rate": 1.0577979381934165e-05, + "loss": 1.4311, + "step": 33542 + }, + { + "epoch": 2.64, + "learning_rate": 1.057342069998039e-05, + "loss": 1.4469, + "step": 33543 + }, + { + "epoch": 2.64, + "learning_rate": 1.0568862964656122e-05, + "loss": 1.4693, + "step": 33544 + }, + { + "epoch": 2.64, + "learning_rate": 1.0564306175992355e-05, + "loss": 1.4524, + "step": 33545 + }, + { + "epoch": 2.64, + "learning_rate": 1.0559750334019979e-05, + "loss": 1.4854, + "step": 33546 + }, + { + "epoch": 2.64, + "learning_rate": 1.055519543876997e-05, + "loss": 1.492, + "step": 33547 + }, + { + "epoch": 2.64, + "learning_rate": 1.0550641490273204e-05, + "loss": 1.4866, + "step": 33548 + }, + { + "epoch": 2.64, + "learning_rate": 1.0546088488560672e-05, + "loss": 1.465, + "step": 33549 + }, + { + "epoch": 2.64, + "learning_rate": 1.0541536433663218e-05, + "loss": 1.4745, + "step": 33550 + }, + { + "epoch": 2.64, + "learning_rate": 1.0536985325611764e-05, + "loss": 1.4601, + "step": 33551 + }, + { + "epoch": 2.64, + "learning_rate": 1.0532435164437237e-05, + "loss": 1.464, + "step": 33552 + }, + { + "epoch": 2.64, + "learning_rate": 1.0527885950170495e-05, + "loss": 1.4665, + "step": 33553 + }, + { + "epoch": 2.64, + "learning_rate": 1.0523337682842432e-05, + "loss": 1.4516, + "step": 33554 + }, + { + "epoch": 2.64, + "learning_rate": 1.0518790362483953e-05, + "loss": 1.5118, + "step": 33555 + }, + { + "epoch": 2.64, + "learning_rate": 1.051424398912592e-05, + "loss": 1.4266, + "step": 33556 + }, + { + "epoch": 2.64, + "learning_rate": 1.0509698562799207e-05, + "loss": 1.4024, + "step": 33557 + }, + { + "epoch": 2.64, + "learning_rate": 1.0505154083534623e-05, + "loss": 1.4867, + "step": 33558 + }, + { + "epoch": 2.64, + "learning_rate": 1.0500610551363093e-05, + "loss": 1.4641, + "step": 33559 + }, + { + "epoch": 2.64, + "learning_rate": 1.0496067966315441e-05, + "loss": 1.4289, + "step": 33560 + }, + { + "epoch": 2.64, + "learning_rate": 1.0491526328422462e-05, + "loss": 1.5082, + "step": 33561 + }, + { + "epoch": 2.64, + "learning_rate": 1.0486985637715045e-05, + "loss": 1.4627, + "step": 33562 + }, + { + "epoch": 2.64, + "learning_rate": 1.0482445894224034e-05, + "loss": 1.424, + "step": 33563 + }, + { + "epoch": 2.64, + "learning_rate": 1.047790709798022e-05, + "loss": 1.4398, + "step": 33564 + }, + { + "epoch": 2.64, + "learning_rate": 1.0473369249014395e-05, + "loss": 1.4279, + "step": 33565 + }, + { + "epoch": 2.64, + "learning_rate": 1.046883234735742e-05, + "loss": 1.4682, + "step": 33566 + }, + { + "epoch": 2.64, + "learning_rate": 1.0464296393040067e-05, + "loss": 1.4287, + "step": 33567 + }, + { + "epoch": 2.64, + "learning_rate": 1.045976138609313e-05, + "loss": 1.4679, + "step": 33568 + }, + { + "epoch": 2.64, + "learning_rate": 1.0455227326547417e-05, + "loss": 1.4072, + "step": 33569 + }, + { + "epoch": 2.64, + "learning_rate": 1.0450694214433702e-05, + "loss": 1.4368, + "step": 33570 + }, + { + "epoch": 2.64, + "learning_rate": 1.0446162049782763e-05, + "loss": 1.4348, + "step": 33571 + }, + { + "epoch": 2.64, + "learning_rate": 1.0441630832625375e-05, + "loss": 1.4418, + "step": 33572 + }, + { + "epoch": 2.64, + "learning_rate": 1.0437100562992295e-05, + "loss": 1.4229, + "step": 33573 + }, + { + "epoch": 2.64, + "learning_rate": 1.04325712409143e-05, + "loss": 1.3811, + "step": 33574 + }, + { + "epoch": 2.64, + "learning_rate": 1.0428042866422098e-05, + "loss": 1.428, + "step": 33575 + }, + { + "epoch": 2.64, + "learning_rate": 1.0423515439546481e-05, + "loss": 1.4425, + "step": 33576 + }, + { + "epoch": 2.64, + "learning_rate": 1.0418988960318175e-05, + "loss": 1.4638, + "step": 33577 + }, + { + "epoch": 2.64, + "learning_rate": 1.0414463428767872e-05, + "loss": 1.4427, + "step": 33578 + }, + { + "epoch": 2.64, + "learning_rate": 1.0409938844926363e-05, + "loss": 1.4013, + "step": 33579 + }, + { + "epoch": 2.64, + "learning_rate": 1.0405415208824341e-05, + "loss": 1.3921, + "step": 33580 + }, + { + "epoch": 2.64, + "learning_rate": 1.0400892520492516e-05, + "loss": 1.3948, + "step": 33581 + }, + { + "epoch": 2.64, + "learning_rate": 1.039637077996156e-05, + "loss": 1.3979, + "step": 33582 + }, + { + "epoch": 2.64, + "learning_rate": 1.0391849987262252e-05, + "loss": 1.432, + "step": 33583 + }, + { + "epoch": 2.64, + "learning_rate": 1.0387330142425216e-05, + "loss": 1.407, + "step": 33584 + }, + { + "epoch": 2.64, + "learning_rate": 1.038281124548116e-05, + "loss": 1.4175, + "step": 33585 + }, + { + "epoch": 2.64, + "learning_rate": 1.0378293296460777e-05, + "loss": 1.4717, + "step": 33586 + }, + { + "epoch": 2.64, + "learning_rate": 1.0373776295394743e-05, + "loss": 1.4757, + "step": 33587 + }, + { + "epoch": 2.64, + "learning_rate": 1.0369260242313681e-05, + "loss": 1.491, + "step": 33588 + }, + { + "epoch": 2.64, + "learning_rate": 1.036474513724832e-05, + "loss": 1.4492, + "step": 33589 + }, + { + "epoch": 2.64, + "learning_rate": 1.0360230980229283e-05, + "loss": 1.4816, + "step": 33590 + }, + { + "epoch": 2.64, + "learning_rate": 1.0355717771287197e-05, + "loss": 1.4347, + "step": 33591 + }, + { + "epoch": 2.64, + "learning_rate": 1.0351205510452737e-05, + "loss": 1.4259, + "step": 33592 + }, + { + "epoch": 2.64, + "learning_rate": 1.0346694197756512e-05, + "loss": 1.41, + "step": 33593 + }, + { + "epoch": 2.64, + "learning_rate": 1.0342183833229194e-05, + "loss": 1.4231, + "step": 33594 + }, + { + "epoch": 2.64, + "learning_rate": 1.0337674416901348e-05, + "loss": 1.449, + "step": 33595 + }, + { + "epoch": 2.64, + "learning_rate": 1.0333165948803646e-05, + "loss": 1.4305, + "step": 33596 + }, + { + "epoch": 2.64, + "learning_rate": 1.032865842896668e-05, + "loss": 1.3954, + "step": 33597 + }, + { + "epoch": 2.64, + "learning_rate": 1.0324151857421042e-05, + "loss": 1.5157, + "step": 33598 + }, + { + "epoch": 2.64, + "learning_rate": 1.0319646234197293e-05, + "loss": 1.4249, + "step": 33599 + }, + { + "epoch": 2.64, + "learning_rate": 1.0315141559326107e-05, + "loss": 1.4449, + "step": 33600 + }, + { + "epoch": 2.64, + "learning_rate": 1.0310637832838026e-05, + "loss": 1.3824, + "step": 33601 + }, + { + "epoch": 2.64, + "learning_rate": 1.0306135054763592e-05, + "loss": 1.432, + "step": 33602 + }, + { + "epoch": 2.64, + "learning_rate": 1.0301633225133433e-05, + "loss": 1.5024, + "step": 33603 + }, + { + "epoch": 2.64, + "learning_rate": 1.0297132343978104e-05, + "loss": 1.4718, + "step": 33604 + }, + { + "epoch": 2.64, + "learning_rate": 1.0292632411328133e-05, + "loss": 1.429, + "step": 33605 + }, + { + "epoch": 2.64, + "learning_rate": 1.0288133427214095e-05, + "loss": 1.4443, + "step": 33606 + }, + { + "epoch": 2.64, + "learning_rate": 1.028363539166655e-05, + "loss": 1.445, + "step": 33607 + }, + { + "epoch": 2.64, + "learning_rate": 1.027913830471599e-05, + "loss": 1.524, + "step": 33608 + }, + { + "epoch": 2.64, + "learning_rate": 1.0274642166392971e-05, + "loss": 1.466, + "step": 33609 + }, + { + "epoch": 2.64, + "learning_rate": 1.0270146976728055e-05, + "loss": 1.4743, + "step": 33610 + }, + { + "epoch": 2.64, + "learning_rate": 1.0265652735751716e-05, + "loss": 1.4548, + "step": 33611 + }, + { + "epoch": 2.64, + "learning_rate": 1.0261159443494481e-05, + "loss": 1.4593, + "step": 33612 + }, + { + "epoch": 2.64, + "learning_rate": 1.0256667099986875e-05, + "loss": 1.4365, + "step": 33613 + }, + { + "epoch": 2.64, + "learning_rate": 1.0252175705259374e-05, + "loss": 1.4388, + "step": 33614 + }, + { + "epoch": 2.64, + "learning_rate": 1.0247685259342487e-05, + "loss": 1.4542, + "step": 33615 + }, + { + "epoch": 2.64, + "learning_rate": 1.024319576226667e-05, + "loss": 1.4485, + "step": 33616 + }, + { + "epoch": 2.65, + "learning_rate": 1.023870721406247e-05, + "loss": 1.4816, + "step": 33617 + }, + { + "epoch": 2.65, + "learning_rate": 1.0234219614760309e-05, + "loss": 1.4611, + "step": 33618 + }, + { + "epoch": 2.65, + "learning_rate": 1.022973296439063e-05, + "loss": 1.4611, + "step": 33619 + }, + { + "epoch": 2.65, + "learning_rate": 1.0225247262983976e-05, + "loss": 1.4654, + "step": 33620 + }, + { + "epoch": 2.65, + "learning_rate": 1.0220762510570757e-05, + "loss": 1.4461, + "step": 33621 + }, + { + "epoch": 2.65, + "learning_rate": 1.021627870718138e-05, + "loss": 1.4513, + "step": 33622 + }, + { + "epoch": 2.65, + "learning_rate": 1.0211795852846372e-05, + "loss": 1.4302, + "step": 33623 + }, + { + "epoch": 2.65, + "learning_rate": 1.0207313947596124e-05, + "loss": 1.4215, + "step": 33624 + }, + { + "epoch": 2.65, + "learning_rate": 1.0202832991461063e-05, + "loss": 1.4597, + "step": 33625 + }, + { + "epoch": 2.65, + "learning_rate": 1.0198352984471598e-05, + "loss": 1.4592, + "step": 33626 + }, + { + "epoch": 2.65, + "learning_rate": 1.0193873926658202e-05, + "loss": 1.4619, + "step": 33627 + }, + { + "epoch": 2.65, + "learning_rate": 1.0189395818051255e-05, + "loss": 1.4387, + "step": 33628 + }, + { + "epoch": 2.65, + "learning_rate": 1.0184918658681113e-05, + "loss": 1.4306, + "step": 33629 + }, + { + "epoch": 2.65, + "learning_rate": 1.0180442448578252e-05, + "loss": 1.4014, + "step": 33630 + }, + { + "epoch": 2.65, + "learning_rate": 1.0175967187773032e-05, + "loss": 1.4816, + "step": 33631 + }, + { + "epoch": 2.65, + "learning_rate": 1.0171492876295812e-05, + "loss": 1.3753, + "step": 33632 + }, + { + "epoch": 2.65, + "learning_rate": 1.0167019514177e-05, + "loss": 1.3818, + "step": 33633 + }, + { + "epoch": 2.65, + "learning_rate": 1.0162547101446971e-05, + "loss": 1.4623, + "step": 33634 + }, + { + "epoch": 2.65, + "learning_rate": 1.0158075638136088e-05, + "loss": 1.4311, + "step": 33635 + }, + { + "epoch": 2.65, + "learning_rate": 1.0153605124274656e-05, + "loss": 1.4541, + "step": 33636 + }, + { + "epoch": 2.65, + "learning_rate": 1.0149135559893118e-05, + "loss": 1.443, + "step": 33637 + }, + { + "epoch": 2.65, + "learning_rate": 1.014466694502175e-05, + "loss": 1.4283, + "step": 33638 + }, + { + "epoch": 2.65, + "learning_rate": 1.0140199279690896e-05, + "loss": 1.4563, + "step": 33639 + }, + { + "epoch": 2.65, + "learning_rate": 1.0135732563930948e-05, + "loss": 1.4468, + "step": 33640 + }, + { + "epoch": 2.65, + "learning_rate": 1.0131266797772148e-05, + "loss": 1.4313, + "step": 33641 + }, + { + "epoch": 2.65, + "learning_rate": 1.0126801981244903e-05, + "loss": 1.4527, + "step": 33642 + }, + { + "epoch": 2.65, + "learning_rate": 1.0122338114379442e-05, + "loss": 1.4695, + "step": 33643 + }, + { + "epoch": 2.65, + "learning_rate": 1.0117875197206155e-05, + "loss": 1.405, + "step": 33644 + }, + { + "epoch": 2.65, + "learning_rate": 1.0113413229755286e-05, + "loss": 1.4257, + "step": 33645 + }, + { + "epoch": 2.65, + "learning_rate": 1.0108952212057143e-05, + "loss": 1.4727, + "step": 33646 + }, + { + "epoch": 2.65, + "learning_rate": 1.0104492144142018e-05, + "loss": 1.422, + "step": 33647 + }, + { + "epoch": 2.65, + "learning_rate": 1.0100033026040205e-05, + "loss": 1.4362, + "step": 33648 + }, + { + "epoch": 2.65, + "learning_rate": 1.009557485778193e-05, + "loss": 1.4615, + "step": 33649 + }, + { + "epoch": 2.65, + "learning_rate": 1.0091117639397534e-05, + "loss": 1.4371, + "step": 33650 + }, + { + "epoch": 2.65, + "learning_rate": 1.0086661370917226e-05, + "loss": 1.4188, + "step": 33651 + }, + { + "epoch": 2.65, + "learning_rate": 1.0082206052371283e-05, + "loss": 1.4549, + "step": 33652 + }, + { + "epoch": 2.65, + "learning_rate": 1.0077751683789932e-05, + "loss": 1.4619, + "step": 33653 + }, + { + "epoch": 2.65, + "learning_rate": 1.0073298265203444e-05, + "loss": 1.4561, + "step": 33654 + }, + { + "epoch": 2.65, + "learning_rate": 1.006884579664205e-05, + "loss": 1.4959, + "step": 33655 + }, + { + "epoch": 2.65, + "learning_rate": 1.006439427813594e-05, + "loss": 1.4351, + "step": 33656 + }, + { + "epoch": 2.65, + "learning_rate": 1.0059943709715374e-05, + "loss": 1.5092, + "step": 33657 + }, + { + "epoch": 2.65, + "learning_rate": 1.0055494091410594e-05, + "loss": 1.4173, + "step": 33658 + }, + { + "epoch": 2.65, + "learning_rate": 1.0051045423251775e-05, + "loss": 1.4087, + "step": 33659 + }, + { + "epoch": 2.65, + "learning_rate": 1.004659770526911e-05, + "loss": 1.4216, + "step": 33660 + }, + { + "epoch": 2.65, + "learning_rate": 1.0042150937492827e-05, + "loss": 1.4428, + "step": 33661 + }, + { + "epoch": 2.65, + "learning_rate": 1.0037705119953115e-05, + "loss": 1.4352, + "step": 33662 + }, + { + "epoch": 2.65, + "learning_rate": 1.003326025268012e-05, + "loss": 1.4552, + "step": 33663 + }, + { + "epoch": 2.65, + "learning_rate": 1.0028816335704065e-05, + "loss": 1.414, + "step": 33664 + }, + { + "epoch": 2.65, + "learning_rate": 1.0024373369055111e-05, + "loss": 1.4497, + "step": 33665 + }, + { + "epoch": 2.65, + "learning_rate": 1.00199313527634e-05, + "loss": 1.4273, + "step": 33666 + }, + { + "epoch": 2.65, + "learning_rate": 1.0015490286859124e-05, + "loss": 1.4574, + "step": 33667 + }, + { + "epoch": 2.65, + "learning_rate": 1.0011050171372409e-05, + "loss": 1.4508, + "step": 33668 + }, + { + "epoch": 2.65, + "learning_rate": 1.0006611006333432e-05, + "loss": 1.431, + "step": 33669 + }, + { + "epoch": 2.65, + "learning_rate": 1.0002172791772268e-05, + "loss": 1.4342, + "step": 33670 + }, + { + "epoch": 2.65, + "learning_rate": 9.997735527719126e-06, + "loss": 1.4086, + "step": 33671 + }, + { + "epoch": 2.65, + "learning_rate": 9.993299214204082e-06, + "loss": 1.4174, + "step": 33672 + }, + { + "epoch": 2.65, + "learning_rate": 9.988863851257294e-06, + "loss": 1.4552, + "step": 33673 + }, + { + "epoch": 2.65, + "learning_rate": 9.984429438908826e-06, + "loss": 1.4408, + "step": 33674 + }, + { + "epoch": 2.65, + "learning_rate": 9.979995977188849e-06, + "loss": 1.4944, + "step": 33675 + }, + { + "epoch": 2.65, + "learning_rate": 9.975563466127423e-06, + "loss": 1.4423, + "step": 33676 + }, + { + "epoch": 2.65, + "learning_rate": 9.971131905754626e-06, + "loss": 1.5106, + "step": 33677 + }, + { + "epoch": 2.65, + "learning_rate": 9.966701296100599e-06, + "loss": 1.471, + "step": 33678 + }, + { + "epoch": 2.65, + "learning_rate": 9.962271637195385e-06, + "loss": 1.4213, + "step": 33679 + }, + { + "epoch": 2.65, + "learning_rate": 9.957842929069043e-06, + "loss": 1.4162, + "step": 33680 + }, + { + "epoch": 2.65, + "learning_rate": 9.9534151717517e-06, + "loss": 1.4055, + "step": 33681 + }, + { + "epoch": 2.65, + "learning_rate": 9.94898836527338e-06, + "loss": 1.4425, + "step": 33682 + }, + { + "epoch": 2.65, + "learning_rate": 9.944562509664111e-06, + "loss": 1.4619, + "step": 33683 + }, + { + "epoch": 2.65, + "learning_rate": 9.940137604954002e-06, + "loss": 1.4498, + "step": 33684 + }, + { + "epoch": 2.65, + "learning_rate": 9.935713651173078e-06, + "loss": 1.4245, + "step": 33685 + }, + { + "epoch": 2.65, + "learning_rate": 9.931290648351348e-06, + "loss": 1.5091, + "step": 33686 + }, + { + "epoch": 2.65, + "learning_rate": 9.926868596518839e-06, + "loss": 1.4291, + "step": 33687 + }, + { + "epoch": 2.65, + "learning_rate": 9.922447495705594e-06, + "loss": 1.4503, + "step": 33688 + }, + { + "epoch": 2.65, + "learning_rate": 9.918027345941653e-06, + "loss": 1.4272, + "step": 33689 + }, + { + "epoch": 2.65, + "learning_rate": 9.913608147256979e-06, + "loss": 1.395, + "step": 33690 + }, + { + "epoch": 2.65, + "learning_rate": 9.90918989968163e-06, + "loss": 1.5035, + "step": 33691 + }, + { + "epoch": 2.65, + "learning_rate": 9.904772603245564e-06, + "loss": 1.4007, + "step": 33692 + }, + { + "epoch": 2.65, + "learning_rate": 9.900356257978792e-06, + "loss": 1.4856, + "step": 33693 + }, + { + "epoch": 2.65, + "learning_rate": 9.895940863911255e-06, + "loss": 1.4612, + "step": 33694 + }, + { + "epoch": 2.65, + "learning_rate": 9.891526421072981e-06, + "loss": 1.3875, + "step": 33695 + }, + { + "epoch": 2.65, + "learning_rate": 9.887112929493946e-06, + "loss": 1.386, + "step": 33696 + }, + { + "epoch": 2.65, + "learning_rate": 9.882700389204056e-06, + "loss": 1.4442, + "step": 33697 + }, + { + "epoch": 2.65, + "learning_rate": 9.878288800233325e-06, + "loss": 1.437, + "step": 33698 + }, + { + "epoch": 2.65, + "learning_rate": 9.873878162611693e-06, + "loss": 1.4654, + "step": 33699 + }, + { + "epoch": 2.65, + "learning_rate": 9.869468476369085e-06, + "loss": 1.4257, + "step": 33700 + }, + { + "epoch": 2.65, + "learning_rate": 9.865059741535464e-06, + "loss": 1.4343, + "step": 33701 + }, + { + "epoch": 2.65, + "learning_rate": 9.860651958140769e-06, + "loss": 1.4852, + "step": 33702 + }, + { + "epoch": 2.65, + "learning_rate": 9.856245126214879e-06, + "loss": 1.4205, + "step": 33703 + }, + { + "epoch": 2.65, + "learning_rate": 9.851839245787751e-06, + "loss": 1.4131, + "step": 33704 + }, + { + "epoch": 2.65, + "learning_rate": 9.847434316889313e-06, + "loss": 1.4988, + "step": 33705 + }, + { + "epoch": 2.65, + "learning_rate": 9.843030339549456e-06, + "loss": 1.4458, + "step": 33706 + }, + { + "epoch": 2.65, + "learning_rate": 9.838627313798058e-06, + "loss": 1.4508, + "step": 33707 + }, + { + "epoch": 2.65, + "learning_rate": 9.834225239665045e-06, + "loss": 1.4675, + "step": 33708 + }, + { + "epoch": 2.65, + "learning_rate": 9.829824117180308e-06, + "loss": 1.4509, + "step": 33709 + }, + { + "epoch": 2.65, + "learning_rate": 9.825423946373707e-06, + "loss": 1.4439, + "step": 33710 + }, + { + "epoch": 2.65, + "learning_rate": 9.821024727275101e-06, + "loss": 1.4086, + "step": 33711 + }, + { + "epoch": 2.65, + "learning_rate": 9.8166264599144e-06, + "loss": 1.453, + "step": 33712 + }, + { + "epoch": 2.65, + "learning_rate": 9.812229144321448e-06, + "loss": 1.4333, + "step": 33713 + }, + { + "epoch": 2.65, + "learning_rate": 9.80783278052607e-06, + "loss": 1.4513, + "step": 33714 + }, + { + "epoch": 2.65, + "learning_rate": 9.803437368558175e-06, + "loss": 1.4936, + "step": 33715 + }, + { + "epoch": 2.65, + "learning_rate": 9.799042908447558e-06, + "loss": 1.4592, + "step": 33716 + }, + { + "epoch": 2.65, + "learning_rate": 9.794649400224059e-06, + "loss": 1.3954, + "step": 33717 + }, + { + "epoch": 2.65, + "learning_rate": 9.790256843917538e-06, + "loss": 1.4496, + "step": 33718 + }, + { + "epoch": 2.65, + "learning_rate": 9.785865239557789e-06, + "loss": 1.4831, + "step": 33719 + }, + { + "epoch": 2.65, + "learning_rate": 9.781474587174654e-06, + "loss": 1.3866, + "step": 33720 + }, + { + "epoch": 2.65, + "learning_rate": 9.777084886797893e-06, + "loss": 1.4452, + "step": 33721 + }, + { + "epoch": 2.65, + "learning_rate": 9.77269613845738e-06, + "loss": 1.4379, + "step": 33722 + }, + { + "epoch": 2.65, + "learning_rate": 9.768308342182862e-06, + "loss": 1.4566, + "step": 33723 + }, + { + "epoch": 2.65, + "learning_rate": 9.763921498004145e-06, + "loss": 1.4048, + "step": 33724 + }, + { + "epoch": 2.65, + "learning_rate": 9.759535605951007e-06, + "loss": 1.3951, + "step": 33725 + }, + { + "epoch": 2.65, + "learning_rate": 9.755150666053258e-06, + "loss": 1.4755, + "step": 33726 + }, + { + "epoch": 2.65, + "learning_rate": 9.750766678340622e-06, + "loss": 1.4148, + "step": 33727 + }, + { + "epoch": 2.65, + "learning_rate": 9.746383642842876e-06, + "loss": 1.5063, + "step": 33728 + }, + { + "epoch": 2.65, + "learning_rate": 9.742001559589796e-06, + "loss": 1.4342, + "step": 33729 + }, + { + "epoch": 2.65, + "learning_rate": 9.737620428611142e-06, + "loss": 1.4151, + "step": 33730 + }, + { + "epoch": 2.65, + "learning_rate": 9.733240249936608e-06, + "loss": 1.4308, + "step": 33731 + }, + { + "epoch": 2.65, + "learning_rate": 9.728861023595986e-06, + "loss": 1.4875, + "step": 33732 + }, + { + "epoch": 2.65, + "learning_rate": 9.724482749619e-06, + "loss": 1.4187, + "step": 33733 + }, + { + "epoch": 2.65, + "learning_rate": 9.720105428035329e-06, + "loss": 1.4724, + "step": 33734 + }, + { + "epoch": 2.65, + "learning_rate": 9.715729058874733e-06, + "loss": 1.4353, + "step": 33735 + }, + { + "epoch": 2.65, + "learning_rate": 9.711353642166953e-06, + "loss": 1.3895, + "step": 33736 + }, + { + "epoch": 2.65, + "learning_rate": 9.706979177941666e-06, + "loss": 1.4741, + "step": 33737 + }, + { + "epoch": 2.65, + "learning_rate": 9.702605666228547e-06, + "loss": 1.4158, + "step": 33738 + }, + { + "epoch": 2.65, + "learning_rate": 9.698233107057324e-06, + "loss": 1.4074, + "step": 33739 + }, + { + "epoch": 2.65, + "learning_rate": 9.693861500457672e-06, + "loss": 1.4527, + "step": 33740 + }, + { + "epoch": 2.65, + "learning_rate": 9.689490846459269e-06, + "loss": 1.4534, + "step": 33741 + }, + { + "epoch": 2.65, + "learning_rate": 9.685121145091806e-06, + "loss": 1.3879, + "step": 33742 + }, + { + "epoch": 2.65, + "learning_rate": 9.680752396384928e-06, + "loss": 1.4525, + "step": 33743 + }, + { + "epoch": 2.66, + "learning_rate": 9.676384600368292e-06, + "loss": 1.4243, + "step": 33744 + }, + { + "epoch": 2.66, + "learning_rate": 9.672017757071594e-06, + "loss": 1.5051, + "step": 33745 + }, + { + "epoch": 2.66, + "learning_rate": 9.667651866524456e-06, + "loss": 1.4702, + "step": 33746 + }, + { + "epoch": 2.66, + "learning_rate": 9.663286928756525e-06, + "loss": 1.4815, + "step": 33747 + }, + { + "epoch": 2.66, + "learning_rate": 9.658922943797393e-06, + "loss": 1.4576, + "step": 33748 + }, + { + "epoch": 2.66, + "learning_rate": 9.654559911676767e-06, + "loss": 1.4475, + "step": 33749 + }, + { + "epoch": 2.66, + "learning_rate": 9.650197832424212e-06, + "loss": 1.4056, + "step": 33750 + }, + { + "epoch": 2.66, + "learning_rate": 9.645836706069348e-06, + "loss": 1.5023, + "step": 33751 + }, + { + "epoch": 2.66, + "learning_rate": 9.641476532641807e-06, + "loss": 1.4431, + "step": 33752 + }, + { + "epoch": 2.66, + "learning_rate": 9.637117312171194e-06, + "loss": 1.4612, + "step": 33753 + }, + { + "epoch": 2.66, + "learning_rate": 9.632759044687105e-06, + "loss": 1.4564, + "step": 33754 + }, + { + "epoch": 2.66, + "learning_rate": 9.628401730219098e-06, + "loss": 1.4569, + "step": 33755 + }, + { + "epoch": 2.66, + "learning_rate": 9.624045368796801e-06, + "loss": 1.481, + "step": 33756 + }, + { + "epoch": 2.66, + "learning_rate": 9.619689960449772e-06, + "loss": 1.4449, + "step": 33757 + }, + { + "epoch": 2.66, + "learning_rate": 9.615335505207555e-06, + "loss": 1.4601, + "step": 33758 + }, + { + "epoch": 2.66, + "learning_rate": 9.61098200309976e-06, + "loss": 1.4478, + "step": 33759 + }, + { + "epoch": 2.66, + "learning_rate": 9.606629454155929e-06, + "loss": 1.4466, + "step": 33760 + }, + { + "epoch": 2.66, + "learning_rate": 9.60227785840557e-06, + "loss": 1.4381, + "step": 33761 + }, + { + "epoch": 2.66, + "learning_rate": 9.597927215878316e-06, + "loss": 1.4527, + "step": 33762 + }, + { + "epoch": 2.66, + "learning_rate": 9.593577526603635e-06, + "loss": 1.4527, + "step": 33763 + }, + { + "epoch": 2.66, + "learning_rate": 9.589228790611093e-06, + "loss": 1.4979, + "step": 33764 + }, + { + "epoch": 2.66, + "learning_rate": 9.584881007930161e-06, + "loss": 1.4267, + "step": 33765 + }, + { + "epoch": 2.66, + "learning_rate": 9.580534178590421e-06, + "loss": 1.4654, + "step": 33766 + }, + { + "epoch": 2.66, + "learning_rate": 9.57618830262138e-06, + "loss": 1.4308, + "step": 33767 + }, + { + "epoch": 2.66, + "learning_rate": 9.571843380052512e-06, + "loss": 1.3759, + "step": 33768 + }, + { + "epoch": 2.66, + "learning_rate": 9.567499410913332e-06, + "loss": 1.4309, + "step": 33769 + }, + { + "epoch": 2.66, + "learning_rate": 9.563156395233345e-06, + "loss": 1.4499, + "step": 33770 + }, + { + "epoch": 2.66, + "learning_rate": 9.55881433304203e-06, + "loss": 1.4162, + "step": 33771 + }, + { + "epoch": 2.66, + "learning_rate": 9.554473224368847e-06, + "loss": 1.4829, + "step": 33772 + }, + { + "epoch": 2.66, + "learning_rate": 9.550133069243304e-06, + "loss": 1.3951, + "step": 33773 + }, + { + "epoch": 2.66, + "learning_rate": 9.545793867694846e-06, + "loss": 1.4609, + "step": 33774 + }, + { + "epoch": 2.66, + "learning_rate": 9.541455619752913e-06, + "loss": 1.4153, + "step": 33775 + }, + { + "epoch": 2.66, + "learning_rate": 9.537118325447019e-06, + "loss": 1.4231, + "step": 33776 + }, + { + "epoch": 2.66, + "learning_rate": 9.53278198480657e-06, + "loss": 1.44, + "step": 33777 + }, + { + "epoch": 2.66, + "learning_rate": 9.528446597860995e-06, + "loss": 1.4643, + "step": 33778 + }, + { + "epoch": 2.66, + "learning_rate": 9.52411216463977e-06, + "loss": 1.4447, + "step": 33779 + }, + { + "epoch": 2.66, + "learning_rate": 9.519778685172303e-06, + "loss": 1.4666, + "step": 33780 + }, + { + "epoch": 2.66, + "learning_rate": 9.515446159488021e-06, + "loss": 1.4658, + "step": 33781 + }, + { + "epoch": 2.66, + "learning_rate": 9.511114587616286e-06, + "loss": 1.478, + "step": 33782 + }, + { + "epoch": 2.66, + "learning_rate": 9.506783969586606e-06, + "loss": 1.4174, + "step": 33783 + }, + { + "epoch": 2.66, + "learning_rate": 9.502454305428326e-06, + "loss": 1.4543, + "step": 33784 + }, + { + "epoch": 2.66, + "learning_rate": 9.498125595170836e-06, + "loss": 1.4167, + "step": 33785 + }, + { + "epoch": 2.66, + "learning_rate": 9.493797838843532e-06, + "loss": 1.4736, + "step": 33786 + }, + { + "epoch": 2.66, + "learning_rate": 9.48947103647582e-06, + "loss": 1.4722, + "step": 33787 + }, + { + "epoch": 2.66, + "learning_rate": 9.485145188097066e-06, + "loss": 1.4287, + "step": 33788 + }, + { + "epoch": 2.66, + "learning_rate": 9.480820293736591e-06, + "loss": 1.4866, + "step": 33789 + }, + { + "epoch": 2.66, + "learning_rate": 9.47649635342384e-06, + "loss": 1.4637, + "step": 33790 + }, + { + "epoch": 2.66, + "learning_rate": 9.472173367188124e-06, + "loss": 1.4414, + "step": 33791 + }, + { + "epoch": 2.66, + "learning_rate": 9.467851335058786e-06, + "loss": 1.4718, + "step": 33792 + }, + { + "epoch": 2.66, + "learning_rate": 9.463530257065217e-06, + "loss": 1.4093, + "step": 33793 + }, + { + "epoch": 2.66, + "learning_rate": 9.45921013323671e-06, + "loss": 1.4375, + "step": 33794 + }, + { + "epoch": 2.66, + "learning_rate": 9.45489096360258e-06, + "loss": 1.4476, + "step": 33795 + }, + { + "epoch": 2.66, + "learning_rate": 9.450572748192214e-06, + "loss": 1.4182, + "step": 33796 + }, + { + "epoch": 2.66, + "learning_rate": 9.446255487034893e-06, + "loss": 1.462, + "step": 33797 + }, + { + "epoch": 2.66, + "learning_rate": 9.441939180159924e-06, + "loss": 1.4321, + "step": 33798 + }, + { + "epoch": 2.66, + "learning_rate": 9.437623827596603e-06, + "loss": 1.4217, + "step": 33799 + }, + { + "epoch": 2.66, + "learning_rate": 9.433309429374285e-06, + "loss": 1.404, + "step": 33800 + }, + { + "epoch": 2.66, + "learning_rate": 9.42899598552222e-06, + "loss": 1.4053, + "step": 33801 + }, + { + "epoch": 2.66, + "learning_rate": 9.424683496069663e-06, + "loss": 1.4788, + "step": 33802 + }, + { + "epoch": 2.66, + "learning_rate": 9.420371961045958e-06, + "loss": 1.4719, + "step": 33803 + }, + { + "epoch": 2.66, + "learning_rate": 9.416061380480367e-06, + "loss": 1.484, + "step": 33804 + }, + { + "epoch": 2.66, + "learning_rate": 9.411751754402113e-06, + "loss": 1.42, + "step": 33805 + }, + { + "epoch": 2.66, + "learning_rate": 9.407443082840476e-06, + "loss": 1.4395, + "step": 33806 + }, + { + "epoch": 2.66, + "learning_rate": 9.403135365824732e-06, + "loss": 1.489, + "step": 33807 + }, + { + "epoch": 2.66, + "learning_rate": 9.398828603384124e-06, + "loss": 1.4397, + "step": 33808 + }, + { + "epoch": 2.66, + "learning_rate": 9.394522795547843e-06, + "loss": 1.4603, + "step": 33809 + }, + { + "epoch": 2.66, + "learning_rate": 9.390217942345186e-06, + "loss": 1.4674, + "step": 33810 + }, + { + "epoch": 2.66, + "learning_rate": 9.385914043805343e-06, + "loss": 1.4888, + "step": 33811 + }, + { + "epoch": 2.66, + "learning_rate": 9.381611099957542e-06, + "loss": 1.4268, + "step": 33812 + }, + { + "epoch": 2.66, + "learning_rate": 9.377309110830994e-06, + "loss": 1.4264, + "step": 33813 + }, + { + "epoch": 2.66, + "learning_rate": 9.373008076454924e-06, + "loss": 1.4241, + "step": 33814 + }, + { + "epoch": 2.66, + "learning_rate": 9.368707996858544e-06, + "loss": 1.4122, + "step": 33815 + }, + { + "epoch": 2.66, + "learning_rate": 9.36440887207101e-06, + "loss": 1.4681, + "step": 33816 + }, + { + "epoch": 2.66, + "learning_rate": 9.360110702121537e-06, + "loss": 1.4156, + "step": 33817 + }, + { + "epoch": 2.66, + "learning_rate": 9.355813487039315e-06, + "loss": 1.4777, + "step": 33818 + }, + { + "epoch": 2.66, + "learning_rate": 9.351517226853472e-06, + "loss": 1.4331, + "step": 33819 + }, + { + "epoch": 2.66, + "learning_rate": 9.347221921593234e-06, + "loss": 1.4742, + "step": 33820 + }, + { + "epoch": 2.66, + "learning_rate": 9.342927571287745e-06, + "loss": 1.4545, + "step": 33821 + }, + { + "epoch": 2.66, + "learning_rate": 9.338634175966164e-06, + "loss": 1.4852, + "step": 33822 + }, + { + "epoch": 2.66, + "learning_rate": 9.334341735657602e-06, + "loss": 1.4178, + "step": 33823 + }, + { + "epoch": 2.66, + "learning_rate": 9.330050250391253e-06, + "loss": 1.4627, + "step": 33824 + }, + { + "epoch": 2.66, + "learning_rate": 9.32575972019624e-06, + "loss": 1.4899, + "step": 33825 + }, + { + "epoch": 2.66, + "learning_rate": 9.321470145101662e-06, + "loss": 1.4348, + "step": 33826 + }, + { + "epoch": 2.66, + "learning_rate": 9.317181525136691e-06, + "loss": 1.4141, + "step": 33827 + }, + { + "epoch": 2.66, + "learning_rate": 9.312893860330439e-06, + "loss": 1.4098, + "step": 33828 + }, + { + "epoch": 2.66, + "learning_rate": 9.308607150711949e-06, + "loss": 1.429, + "step": 33829 + }, + { + "epoch": 2.66, + "learning_rate": 9.3043213963104e-06, + "loss": 1.5152, + "step": 33830 + }, + { + "epoch": 2.66, + "learning_rate": 9.300036597154881e-06, + "loss": 1.4673, + "step": 33831 + }, + { + "epoch": 2.66, + "learning_rate": 9.295752753274471e-06, + "loss": 1.4765, + "step": 33832 + }, + { + "epoch": 2.66, + "learning_rate": 9.29146986469823e-06, + "loss": 1.4199, + "step": 33833 + }, + { + "epoch": 2.66, + "learning_rate": 9.28718793145527e-06, + "loss": 1.4456, + "step": 33834 + }, + { + "epoch": 2.66, + "learning_rate": 9.282906953574664e-06, + "loss": 1.4503, + "step": 33835 + }, + { + "epoch": 2.66, + "learning_rate": 9.278626931085442e-06, + "loss": 1.4645, + "step": 33836 + }, + { + "epoch": 2.66, + "learning_rate": 9.274347864016712e-06, + "loss": 1.4515, + "step": 33837 + }, + { + "epoch": 2.66, + "learning_rate": 9.270069752397485e-06, + "loss": 1.4252, + "step": 33838 + }, + { + "epoch": 2.66, + "learning_rate": 9.265792596256837e-06, + "loss": 1.4553, + "step": 33839 + }, + { + "epoch": 2.66, + "learning_rate": 9.26151639562378e-06, + "loss": 1.4359, + "step": 33840 + }, + { + "epoch": 2.66, + "learning_rate": 9.257241150527373e-06, + "loss": 1.4232, + "step": 33841 + }, + { + "epoch": 2.66, + "learning_rate": 9.252966860996624e-06, + "loss": 1.4105, + "step": 33842 + }, + { + "epoch": 2.66, + "learning_rate": 9.248693527060547e-06, + "loss": 1.4562, + "step": 33843 + }, + { + "epoch": 2.66, + "learning_rate": 9.244421148748183e-06, + "loss": 1.4306, + "step": 33844 + }, + { + "epoch": 2.66, + "learning_rate": 9.240149726088508e-06, + "loss": 1.4233, + "step": 33845 + }, + { + "epoch": 2.66, + "learning_rate": 9.235879259110552e-06, + "loss": 1.4777, + "step": 33846 + }, + { + "epoch": 2.66, + "learning_rate": 9.231609747843288e-06, + "loss": 1.4163, + "step": 33847 + }, + { + "epoch": 2.66, + "learning_rate": 9.22734119231573e-06, + "loss": 1.4229, + "step": 33848 + }, + { + "epoch": 2.66, + "learning_rate": 9.223073592556834e-06, + "loss": 1.4495, + "step": 33849 + }, + { + "epoch": 2.66, + "learning_rate": 9.218806948595547e-06, + "loss": 1.4392, + "step": 33850 + }, + { + "epoch": 2.66, + "learning_rate": 9.214541260460912e-06, + "loss": 1.4415, + "step": 33851 + }, + { + "epoch": 2.66, + "learning_rate": 9.210276528181853e-06, + "loss": 1.4725, + "step": 33852 + }, + { + "epoch": 2.66, + "learning_rate": 9.206012751787285e-06, + "loss": 1.4268, + "step": 33853 + }, + { + "epoch": 2.66, + "learning_rate": 9.20174993130623e-06, + "loss": 1.4577, + "step": 33854 + }, + { + "epoch": 2.66, + "learning_rate": 9.197488066767584e-06, + "loss": 1.4406, + "step": 33855 + }, + { + "epoch": 2.66, + "learning_rate": 9.193227158200273e-06, + "loss": 1.4876, + "step": 33856 + }, + { + "epoch": 2.66, + "learning_rate": 9.188967205633275e-06, + "loss": 1.4151, + "step": 33857 + }, + { + "epoch": 2.66, + "learning_rate": 9.184708209095466e-06, + "loss": 1.4271, + "step": 33858 + }, + { + "epoch": 2.66, + "learning_rate": 9.180450168615806e-06, + "loss": 1.4117, + "step": 33859 + }, + { + "epoch": 2.66, + "learning_rate": 9.176193084223138e-06, + "loss": 1.4436, + "step": 33860 + }, + { + "epoch": 2.66, + "learning_rate": 9.171936955946407e-06, + "loss": 1.4773, + "step": 33861 + }, + { + "epoch": 2.66, + "learning_rate": 9.167681783814523e-06, + "loss": 1.434, + "step": 33862 + }, + { + "epoch": 2.66, + "learning_rate": 9.16342756785638e-06, + "loss": 1.466, + "step": 33863 + }, + { + "epoch": 2.66, + "learning_rate": 9.159174308100819e-06, + "loss": 1.4038, + "step": 33864 + }, + { + "epoch": 2.66, + "learning_rate": 9.154922004576754e-06, + "loss": 1.4842, + "step": 33865 + }, + { + "epoch": 2.66, + "learning_rate": 9.150670657313058e-06, + "loss": 1.3945, + "step": 33866 + }, + { + "epoch": 2.66, + "learning_rate": 9.146420266338544e-06, + "loss": 1.3676, + "step": 33867 + }, + { + "epoch": 2.66, + "learning_rate": 9.142170831682139e-06, + "loss": 1.454, + "step": 33868 + }, + { + "epoch": 2.66, + "learning_rate": 9.137922353372652e-06, + "loss": 1.4671, + "step": 33869 + }, + { + "epoch": 2.66, + "learning_rate": 9.133674831438926e-06, + "loss": 1.4094, + "step": 33870 + }, + { + "epoch": 2.67, + "learning_rate": 9.129428265909838e-06, + "loss": 1.5145, + "step": 33871 + }, + { + "epoch": 2.67, + "learning_rate": 9.125182656814183e-06, + "loss": 1.4715, + "step": 33872 + }, + { + "epoch": 2.67, + "learning_rate": 9.120938004180772e-06, + "loss": 1.4295, + "step": 33873 + }, + { + "epoch": 2.67, + "learning_rate": 9.11669430803848e-06, + "loss": 1.4895, + "step": 33874 + }, + { + "epoch": 2.67, + "learning_rate": 9.112451568416085e-06, + "loss": 1.4451, + "step": 33875 + }, + { + "epoch": 2.67, + "learning_rate": 9.108209785342379e-06, + "loss": 1.451, + "step": 33876 + }, + { + "epoch": 2.67, + "learning_rate": 9.103968958846159e-06, + "loss": 1.4425, + "step": 33877 + }, + { + "epoch": 2.67, + "learning_rate": 9.09972908895628e-06, + "loss": 1.465, + "step": 33878 + }, + { + "epoch": 2.67, + "learning_rate": 9.095490175701475e-06, + "loss": 1.382, + "step": 33879 + }, + { + "epoch": 2.67, + "learning_rate": 9.091252219110535e-06, + "loss": 1.5583, + "step": 33880 + }, + { + "epoch": 2.67, + "learning_rate": 9.087015219212219e-06, + "loss": 1.4632, + "step": 33881 + }, + { + "epoch": 2.67, + "learning_rate": 9.08277917603532e-06, + "loss": 1.4267, + "step": 33882 + }, + { + "epoch": 2.67, + "learning_rate": 9.078544089608586e-06, + "loss": 1.41, + "step": 33883 + }, + { + "epoch": 2.67, + "learning_rate": 9.07430995996074e-06, + "loss": 1.4478, + "step": 33884 + }, + { + "epoch": 2.67, + "learning_rate": 9.070076787120595e-06, + "loss": 1.4152, + "step": 33885 + }, + { + "epoch": 2.67, + "learning_rate": 9.06584457111686e-06, + "loss": 1.4351, + "step": 33886 + }, + { + "epoch": 2.67, + "learning_rate": 9.061613311978244e-06, + "loss": 1.4724, + "step": 33887 + }, + { + "epoch": 2.67, + "learning_rate": 9.05738300973351e-06, + "loss": 1.4401, + "step": 33888 + }, + { + "epoch": 2.67, + "learning_rate": 9.053153664411366e-06, + "loss": 1.454, + "step": 33889 + }, + { + "epoch": 2.67, + "learning_rate": 9.048925276040508e-06, + "loss": 1.4533, + "step": 33890 + }, + { + "epoch": 2.67, + "learning_rate": 9.044697844649695e-06, + "loss": 1.4112, + "step": 33891 + }, + { + "epoch": 2.67, + "learning_rate": 9.040471370267571e-06, + "loss": 1.429, + "step": 33892 + }, + { + "epoch": 2.67, + "learning_rate": 9.03624585292288e-06, + "loss": 1.4109, + "step": 33893 + }, + { + "epoch": 2.67, + "learning_rate": 9.032021292644264e-06, + "loss": 1.4272, + "step": 33894 + }, + { + "epoch": 2.67, + "learning_rate": 9.027797689460454e-06, + "loss": 1.4659, + "step": 33895 + }, + { + "epoch": 2.67, + "learning_rate": 9.023575043400106e-06, + "loss": 1.4599, + "step": 33896 + }, + { + "epoch": 2.67, + "learning_rate": 9.019353354491881e-06, + "loss": 1.4585, + "step": 33897 + }, + { + "epoch": 2.67, + "learning_rate": 9.015132622764442e-06, + "loss": 1.4837, + "step": 33898 + }, + { + "epoch": 2.67, + "learning_rate": 9.010912848246449e-06, + "loss": 1.4603, + "step": 33899 + }, + { + "epoch": 2.67, + "learning_rate": 9.006694030966577e-06, + "loss": 1.4824, + "step": 33900 + }, + { + "epoch": 2.67, + "learning_rate": 9.002476170953404e-06, + "loss": 1.4825, + "step": 33901 + }, + { + "epoch": 2.67, + "learning_rate": 8.998259268235642e-06, + "loss": 1.48, + "step": 33902 + }, + { + "epoch": 2.67, + "learning_rate": 8.994043322841881e-06, + "loss": 1.4388, + "step": 33903 + }, + { + "epoch": 2.67, + "learning_rate": 8.989828334800736e-06, + "loss": 1.4765, + "step": 33904 + }, + { + "epoch": 2.67, + "learning_rate": 8.985614304140865e-06, + "loss": 1.4564, + "step": 33905 + }, + { + "epoch": 2.67, + "learning_rate": 8.981401230890844e-06, + "loss": 1.4368, + "step": 33906 + }, + { + "epoch": 2.67, + "learning_rate": 8.97718911507927e-06, + "loss": 1.4014, + "step": 33907 + }, + { + "epoch": 2.67, + "learning_rate": 8.972977956734767e-06, + "loss": 1.4088, + "step": 33908 + }, + { + "epoch": 2.67, + "learning_rate": 8.96876775588593e-06, + "loss": 1.4411, + "step": 33909 + }, + { + "epoch": 2.67, + "learning_rate": 8.964558512561338e-06, + "loss": 1.4986, + "step": 33910 + }, + { + "epoch": 2.67, + "learning_rate": 8.960350226789548e-06, + "loss": 1.44, + "step": 33911 + }, + { + "epoch": 2.67, + "learning_rate": 8.956142898599156e-06, + "loss": 1.4265, + "step": 33912 + }, + { + "epoch": 2.67, + "learning_rate": 8.951936528018721e-06, + "loss": 1.4357, + "step": 33913 + }, + { + "epoch": 2.67, + "learning_rate": 8.947731115076789e-06, + "loss": 1.4194, + "step": 33914 + }, + { + "epoch": 2.67, + "learning_rate": 8.943526659801936e-06, + "loss": 1.4622, + "step": 33915 + }, + { + "epoch": 2.67, + "learning_rate": 8.939323162222705e-06, + "loss": 1.4341, + "step": 33916 + }, + { + "epoch": 2.67, + "learning_rate": 8.935120622367626e-06, + "loss": 1.4788, + "step": 33917 + }, + { + "epoch": 2.67, + "learning_rate": 8.930919040265205e-06, + "loss": 1.4557, + "step": 33918 + }, + { + "epoch": 2.67, + "learning_rate": 8.926718415944022e-06, + "loss": 1.4196, + "step": 33919 + }, + { + "epoch": 2.67, + "learning_rate": 8.922518749432555e-06, + "loss": 1.3886, + "step": 33920 + }, + { + "epoch": 2.67, + "learning_rate": 8.91832004075933e-06, + "loss": 1.4397, + "step": 33921 + }, + { + "epoch": 2.67, + "learning_rate": 8.914122289952858e-06, + "loss": 1.4943, + "step": 33922 + }, + { + "epoch": 2.67, + "learning_rate": 8.909925497041631e-06, + "loss": 1.4415, + "step": 33923 + }, + { + "epoch": 2.67, + "learning_rate": 8.905729662054178e-06, + "loss": 1.4001, + "step": 33924 + }, + { + "epoch": 2.67, + "learning_rate": 8.901534785018927e-06, + "loss": 1.4875, + "step": 33925 + }, + { + "epoch": 2.67, + "learning_rate": 8.897340865964403e-06, + "loss": 1.4702, + "step": 33926 + }, + { + "epoch": 2.67, + "learning_rate": 8.893147904919084e-06, + "loss": 1.4189, + "step": 33927 + }, + { + "epoch": 2.67, + "learning_rate": 8.888955901911398e-06, + "loss": 1.4648, + "step": 33928 + }, + { + "epoch": 2.67, + "learning_rate": 8.88476485696984e-06, + "loss": 1.4454, + "step": 33929 + }, + { + "epoch": 2.67, + "learning_rate": 8.880574770122867e-06, + "loss": 1.4124, + "step": 33930 + }, + { + "epoch": 2.67, + "learning_rate": 8.876385641398875e-06, + "loss": 1.4193, + "step": 33931 + }, + { + "epoch": 2.67, + "learning_rate": 8.872197470826392e-06, + "loss": 1.4452, + "step": 33932 + }, + { + "epoch": 2.67, + "learning_rate": 8.868010258433794e-06, + "loss": 1.4836, + "step": 33933 + }, + { + "epoch": 2.67, + "learning_rate": 8.863824004249526e-06, + "loss": 1.3934, + "step": 33934 + }, + { + "epoch": 2.67, + "learning_rate": 8.859638708301981e-06, + "loss": 1.3771, + "step": 33935 + }, + { + "epoch": 2.67, + "learning_rate": 8.855454370619636e-06, + "loss": 1.412, + "step": 33936 + }, + { + "epoch": 2.67, + "learning_rate": 8.851270991230853e-06, + "loss": 1.4869, + "step": 33937 + }, + { + "epoch": 2.67, + "learning_rate": 8.847088570164024e-06, + "loss": 1.4451, + "step": 33938 + }, + { + "epoch": 2.67, + "learning_rate": 8.842907107447578e-06, + "loss": 1.4405, + "step": 33939 + }, + { + "epoch": 2.67, + "learning_rate": 8.838726603109908e-06, + "loss": 1.4063, + "step": 33940 + }, + { + "epoch": 2.67, + "learning_rate": 8.834547057179391e-06, + "loss": 1.4162, + "step": 33941 + }, + { + "epoch": 2.67, + "learning_rate": 8.83036846968439e-06, + "loss": 1.3726, + "step": 33942 + }, + { + "epoch": 2.67, + "learning_rate": 8.82619084065328e-06, + "loss": 1.4444, + "step": 33943 + }, + { + "epoch": 2.67, + "learning_rate": 8.82201417011444e-06, + "loss": 1.477, + "step": 33944 + }, + { + "epoch": 2.67, + "learning_rate": 8.817838458096193e-06, + "loss": 1.3904, + "step": 33945 + }, + { + "epoch": 2.67, + "learning_rate": 8.81366370462694e-06, + "loss": 1.4208, + "step": 33946 + }, + { + "epoch": 2.67, + "learning_rate": 8.809489909734984e-06, + "loss": 1.4408, + "step": 33947 + }, + { + "epoch": 2.67, + "learning_rate": 8.805317073448675e-06, + "loss": 1.4483, + "step": 33948 + }, + { + "epoch": 2.67, + "learning_rate": 8.801145195796356e-06, + "loss": 1.4153, + "step": 33949 + }, + { + "epoch": 2.67, + "learning_rate": 8.796974276806335e-06, + "loss": 1.4301, + "step": 33950 + }, + { + "epoch": 2.67, + "learning_rate": 8.79280431650694e-06, + "loss": 1.4691, + "step": 33951 + }, + { + "epoch": 2.67, + "learning_rate": 8.788635314926452e-06, + "loss": 1.459, + "step": 33952 + }, + { + "epoch": 2.67, + "learning_rate": 8.784467272093242e-06, + "loss": 1.4416, + "step": 33953 + }, + { + "epoch": 2.67, + "learning_rate": 8.78030018803556e-06, + "loss": 1.4456, + "step": 33954 + }, + { + "epoch": 2.67, + "learning_rate": 8.776134062781664e-06, + "loss": 1.4754, + "step": 33955 + }, + { + "epoch": 2.67, + "learning_rate": 8.771968896359915e-06, + "loss": 1.443, + "step": 33956 + }, + { + "epoch": 2.67, + "learning_rate": 8.767804688798574e-06, + "loss": 1.5188, + "step": 33957 + }, + { + "epoch": 2.67, + "learning_rate": 8.763641440125901e-06, + "loss": 1.4193, + "step": 33958 + }, + { + "epoch": 2.67, + "learning_rate": 8.759479150370141e-06, + "loss": 1.4194, + "step": 33959 + }, + { + "epoch": 2.67, + "learning_rate": 8.755317819559604e-06, + "loss": 1.4766, + "step": 33960 + }, + { + "epoch": 2.67, + "learning_rate": 8.751157447722501e-06, + "loss": 1.454, + "step": 33961 + }, + { + "epoch": 2.67, + "learning_rate": 8.746998034887075e-06, + "loss": 1.4215, + "step": 33962 + }, + { + "epoch": 2.67, + "learning_rate": 8.742839581081607e-06, + "loss": 1.4162, + "step": 33963 + }, + { + "epoch": 2.67, + "learning_rate": 8.738682086334303e-06, + "loss": 1.4404, + "step": 33964 + }, + { + "epoch": 2.67, + "learning_rate": 8.73452555067336e-06, + "loss": 1.3757, + "step": 33965 + }, + { + "epoch": 2.67, + "learning_rate": 8.730369974127072e-06, + "loss": 1.4283, + "step": 33966 + }, + { + "epoch": 2.67, + "learning_rate": 8.726215356723598e-06, + "loss": 1.4638, + "step": 33967 + }, + { + "epoch": 2.67, + "learning_rate": 8.72206169849115e-06, + "loss": 1.4416, + "step": 33968 + }, + { + "epoch": 2.67, + "learning_rate": 8.717908999457956e-06, + "loss": 1.4336, + "step": 33969 + }, + { + "epoch": 2.67, + "learning_rate": 8.713757259652194e-06, + "loss": 1.4616, + "step": 33970 + }, + { + "epoch": 2.67, + "learning_rate": 8.709606479102022e-06, + "loss": 1.496, + "step": 33971 + }, + { + "epoch": 2.67, + "learning_rate": 8.705456657835668e-06, + "loss": 1.4507, + "step": 33972 + }, + { + "epoch": 2.67, + "learning_rate": 8.701307795881297e-06, + "loss": 1.4758, + "step": 33973 + }, + { + "epoch": 2.67, + "learning_rate": 8.69715989326708e-06, + "loss": 1.3982, + "step": 33974 + }, + { + "epoch": 2.67, + "learning_rate": 8.693012950021167e-06, + "loss": 1.4038, + "step": 33975 + }, + { + "epoch": 2.67, + "learning_rate": 8.688866966171698e-06, + "loss": 1.4439, + "step": 33976 + }, + { + "epoch": 2.67, + "learning_rate": 8.68472194174687e-06, + "loss": 1.4521, + "step": 33977 + }, + { + "epoch": 2.67, + "learning_rate": 8.680577876774774e-06, + "loss": 1.4018, + "step": 33978 + }, + { + "epoch": 2.67, + "learning_rate": 8.676434771283558e-06, + "loss": 1.4616, + "step": 33979 + }, + { + "epoch": 2.67, + "learning_rate": 8.672292625301397e-06, + "loss": 1.4713, + "step": 33980 + }, + { + "epoch": 2.67, + "learning_rate": 8.668151438856353e-06, + "loss": 1.4664, + "step": 33981 + }, + { + "epoch": 2.67, + "learning_rate": 8.664011211976569e-06, + "loss": 1.47, + "step": 33982 + }, + { + "epoch": 2.67, + "learning_rate": 8.659871944690156e-06, + "loss": 1.416, + "step": 33983 + }, + { + "epoch": 2.67, + "learning_rate": 8.655733637025225e-06, + "loss": 1.3994, + "step": 33984 + }, + { + "epoch": 2.67, + "learning_rate": 8.651596289009838e-06, + "loss": 1.3901, + "step": 33985 + }, + { + "epoch": 2.67, + "learning_rate": 8.647459900672104e-06, + "loss": 1.458, + "step": 33986 + }, + { + "epoch": 2.67, + "learning_rate": 8.643324472040136e-06, + "loss": 1.3999, + "step": 33987 + }, + { + "epoch": 2.67, + "learning_rate": 8.639190003141994e-06, + "loss": 1.4568, + "step": 33988 + }, + { + "epoch": 2.67, + "learning_rate": 8.635056494005721e-06, + "loss": 1.4179, + "step": 33989 + }, + { + "epoch": 2.67, + "learning_rate": 8.630923944659412e-06, + "loss": 1.4687, + "step": 33990 + }, + { + "epoch": 2.67, + "learning_rate": 8.62679235513113e-06, + "loss": 1.4466, + "step": 33991 + }, + { + "epoch": 2.67, + "learning_rate": 8.622661725448899e-06, + "loss": 1.4662, + "step": 33992 + }, + { + "epoch": 2.67, + "learning_rate": 8.618532055640764e-06, + "loss": 1.4327, + "step": 33993 + }, + { + "epoch": 2.67, + "learning_rate": 8.614403345734788e-06, + "loss": 1.4501, + "step": 33994 + }, + { + "epoch": 2.67, + "learning_rate": 8.610275595758998e-06, + "loss": 1.4784, + "step": 33995 + }, + { + "epoch": 2.67, + "learning_rate": 8.606148805741402e-06, + "loss": 1.4193, + "step": 33996 + }, + { + "epoch": 2.67, + "learning_rate": 8.602022975710032e-06, + "loss": 1.4649, + "step": 33997 + }, + { + "epoch": 2.68, + "learning_rate": 8.597898105692897e-06, + "loss": 1.3843, + "step": 33998 + }, + { + "epoch": 2.68, + "learning_rate": 8.59377419571799e-06, + "loss": 1.4417, + "step": 33999 + }, + { + "epoch": 2.68, + "learning_rate": 8.58965124581334e-06, + "loss": 1.4643, + "step": 34000 + }, + { + "epoch": 2.68, + "learning_rate": 8.585529256006906e-06, + "loss": 1.4465, + "step": 34001 + }, + { + "epoch": 2.68, + "learning_rate": 8.581408226326686e-06, + "loss": 1.4143, + "step": 34002 + }, + { + "epoch": 2.68, + "learning_rate": 8.577288156800654e-06, + "loss": 1.3868, + "step": 34003 + }, + { + "epoch": 2.68, + "learning_rate": 8.573169047456823e-06, + "loss": 1.4176, + "step": 34004 + }, + { + "epoch": 2.68, + "learning_rate": 8.56905089832312e-06, + "loss": 1.4961, + "step": 34005 + }, + { + "epoch": 2.68, + "learning_rate": 8.56493370942749e-06, + "loss": 1.4255, + "step": 34006 + }, + { + "epoch": 2.68, + "learning_rate": 8.560817480797943e-06, + "loss": 1.4462, + "step": 34007 + }, + { + "epoch": 2.68, + "learning_rate": 8.556702212462375e-06, + "loss": 1.4235, + "step": 34008 + }, + { + "epoch": 2.68, + "learning_rate": 8.552587904448743e-06, + "loss": 1.4221, + "step": 34009 + }, + { + "epoch": 2.68, + "learning_rate": 8.548474556784995e-06, + "loss": 1.407, + "step": 34010 + }, + { + "epoch": 2.68, + "learning_rate": 8.544362169499042e-06, + "loss": 1.4715, + "step": 34011 + }, + { + "epoch": 2.68, + "learning_rate": 8.54025074261881e-06, + "loss": 1.5173, + "step": 34012 + }, + { + "epoch": 2.68, + "learning_rate": 8.536140276172176e-06, + "loss": 1.3925, + "step": 34013 + }, + { + "epoch": 2.68, + "learning_rate": 8.53203077018712e-06, + "loss": 1.4299, + "step": 34014 + }, + { + "epoch": 2.68, + "learning_rate": 8.527922224691519e-06, + "loss": 1.4489, + "step": 34015 + }, + { + "epoch": 2.68, + "learning_rate": 8.523814639713217e-06, + "loss": 1.4843, + "step": 34016 + }, + { + "epoch": 2.68, + "learning_rate": 8.519708015280159e-06, + "loss": 1.4668, + "step": 34017 + }, + { + "epoch": 2.68, + "learning_rate": 8.515602351420186e-06, + "loss": 1.47, + "step": 34018 + }, + { + "epoch": 2.68, + "learning_rate": 8.51149764816123e-06, + "loss": 1.4599, + "step": 34019 + }, + { + "epoch": 2.68, + "learning_rate": 8.507393905531101e-06, + "loss": 1.452, + "step": 34020 + }, + { + "epoch": 2.68, + "learning_rate": 8.50329112355771e-06, + "loss": 1.4885, + "step": 34021 + }, + { + "epoch": 2.68, + "learning_rate": 8.499189302268865e-06, + "loss": 1.528, + "step": 34022 + }, + { + "epoch": 2.68, + "learning_rate": 8.495088441692432e-06, + "loss": 1.4708, + "step": 34023 + }, + { + "epoch": 2.68, + "learning_rate": 8.490988541856286e-06, + "loss": 1.4705, + "step": 34024 + }, + { + "epoch": 2.68, + "learning_rate": 8.486889602788239e-06, + "loss": 1.4567, + "step": 34025 + }, + { + "epoch": 2.68, + "learning_rate": 8.482791624516082e-06, + "loss": 1.4522, + "step": 34026 + }, + { + "epoch": 2.68, + "learning_rate": 8.478694607067715e-06, + "loss": 1.442, + "step": 34027 + }, + { + "epoch": 2.68, + "learning_rate": 8.474598550470896e-06, + "loss": 1.4949, + "step": 34028 + }, + { + "epoch": 2.68, + "learning_rate": 8.47050345475347e-06, + "loss": 1.4755, + "step": 34029 + }, + { + "epoch": 2.68, + "learning_rate": 8.46640931994318e-06, + "loss": 1.4165, + "step": 34030 + }, + { + "epoch": 2.68, + "learning_rate": 8.462316146067905e-06, + "loss": 1.46, + "step": 34031 + }, + { + "epoch": 2.68, + "learning_rate": 8.458223933155389e-06, + "loss": 1.4096, + "step": 34032 + }, + { + "epoch": 2.68, + "learning_rate": 8.454132681233394e-06, + "loss": 1.4248, + "step": 34033 + }, + { + "epoch": 2.68, + "learning_rate": 8.450042390329747e-06, + "loss": 1.4898, + "step": 34034 + }, + { + "epoch": 2.68, + "learning_rate": 8.445953060472194e-06, + "loss": 1.4305, + "step": 34035 + }, + { + "epoch": 2.68, + "learning_rate": 8.441864691688527e-06, + "loss": 1.4882, + "step": 34036 + }, + { + "epoch": 2.68, + "learning_rate": 8.437777284006442e-06, + "loss": 1.4272, + "step": 34037 + }, + { + "epoch": 2.68, + "learning_rate": 8.433690837453766e-06, + "loss": 1.4579, + "step": 34038 + }, + { + "epoch": 2.68, + "learning_rate": 8.429605352058194e-06, + "loss": 1.4212, + "step": 34039 + }, + { + "epoch": 2.68, + "learning_rate": 8.42552082784747e-06, + "loss": 1.4816, + "step": 34040 + }, + { + "epoch": 2.68, + "learning_rate": 8.42143726484934e-06, + "loss": 1.4427, + "step": 34041 + }, + { + "epoch": 2.68, + "learning_rate": 8.417354663091531e-06, + "loss": 1.4812, + "step": 34042 + }, + { + "epoch": 2.68, + "learning_rate": 8.413273022601718e-06, + "loss": 1.4712, + "step": 34043 + }, + { + "epoch": 2.68, + "learning_rate": 8.409192343407667e-06, + "loss": 1.4715, + "step": 34044 + }, + { + "epoch": 2.68, + "learning_rate": 8.405112625537086e-06, + "loss": 1.399, + "step": 34045 + }, + { + "epoch": 2.68, + "learning_rate": 8.401033869017637e-06, + "loss": 1.4944, + "step": 34046 + }, + { + "epoch": 2.68, + "learning_rate": 8.396956073876998e-06, + "loss": 1.4483, + "step": 34047 + }, + { + "epoch": 2.68, + "learning_rate": 8.392879240142914e-06, + "loss": 1.4219, + "step": 34048 + }, + { + "epoch": 2.68, + "learning_rate": 8.38880336784301e-06, + "loss": 1.4446, + "step": 34049 + }, + { + "epoch": 2.68, + "learning_rate": 8.384728457005018e-06, + "loss": 1.4339, + "step": 34050 + }, + { + "epoch": 2.68, + "learning_rate": 8.38065450765653e-06, + "loss": 1.3983, + "step": 34051 + }, + { + "epoch": 2.68, + "learning_rate": 8.376581519825277e-06, + "loss": 1.4326, + "step": 34052 + }, + { + "epoch": 2.68, + "learning_rate": 8.372509493538881e-06, + "loss": 1.4555, + "step": 34053 + }, + { + "epoch": 2.68, + "learning_rate": 8.368438428824975e-06, + "loss": 1.4382, + "step": 34054 + }, + { + "epoch": 2.68, + "learning_rate": 8.364368325711219e-06, + "loss": 1.3781, + "step": 34055 + }, + { + "epoch": 2.68, + "learning_rate": 8.360299184225256e-06, + "loss": 1.4488, + "step": 34056 + }, + { + "epoch": 2.68, + "learning_rate": 8.356231004394664e-06, + "loss": 1.4761, + "step": 34057 + }, + { + "epoch": 2.68, + "learning_rate": 8.352163786247124e-06, + "loss": 1.4228, + "step": 34058 + }, + { + "epoch": 2.68, + "learning_rate": 8.348097529810227e-06, + "loss": 1.4671, + "step": 34059 + }, + { + "epoch": 2.68, + "learning_rate": 8.344032235111553e-06, + "loss": 1.4559, + "step": 34060 + }, + { + "epoch": 2.68, + "learning_rate": 8.339967902178763e-06, + "loss": 1.391, + "step": 34061 + }, + { + "epoch": 2.68, + "learning_rate": 8.3359045310394e-06, + "loss": 1.3934, + "step": 34062 + }, + { + "epoch": 2.68, + "learning_rate": 8.331842121721078e-06, + "loss": 1.4494, + "step": 34063 + }, + { + "epoch": 2.68, + "learning_rate": 8.327780674251339e-06, + "loss": 1.4225, + "step": 34064 + }, + { + "epoch": 2.68, + "learning_rate": 8.323720188657796e-06, + "loss": 1.4551, + "step": 34065 + }, + { + "epoch": 2.68, + "learning_rate": 8.319660664968025e-06, + "loss": 1.3965, + "step": 34066 + }, + { + "epoch": 2.68, + "learning_rate": 8.31560210320954e-06, + "loss": 1.4747, + "step": 34067 + }, + { + "epoch": 2.68, + "learning_rate": 8.311544503409967e-06, + "loss": 1.4747, + "step": 34068 + }, + { + "epoch": 2.68, + "learning_rate": 8.307487865596819e-06, + "loss": 1.486, + "step": 34069 + }, + { + "epoch": 2.68, + "learning_rate": 8.30343218979762e-06, + "loss": 1.4131, + "step": 34070 + }, + { + "epoch": 2.68, + "learning_rate": 8.29937747603992e-06, + "loss": 1.4439, + "step": 34071 + }, + { + "epoch": 2.68, + "learning_rate": 8.295323724351261e-06, + "loss": 1.4243, + "step": 34072 + }, + { + "epoch": 2.68, + "learning_rate": 8.291270934759153e-06, + "loss": 1.4243, + "step": 34073 + }, + { + "epoch": 2.68, + "learning_rate": 8.287219107291093e-06, + "loss": 1.424, + "step": 34074 + }, + { + "epoch": 2.68, + "learning_rate": 8.283168241974641e-06, + "loss": 1.4826, + "step": 34075 + }, + { + "epoch": 2.68, + "learning_rate": 8.27911833883726e-06, + "loss": 1.4302, + "step": 34076 + }, + { + "epoch": 2.68, + "learning_rate": 8.275069397906443e-06, + "loss": 1.4314, + "step": 34077 + }, + { + "epoch": 2.68, + "learning_rate": 8.271021419209716e-06, + "loss": 1.4142, + "step": 34078 + }, + { + "epoch": 2.68, + "learning_rate": 8.266974402774529e-06, + "loss": 1.4427, + "step": 34079 + }, + { + "epoch": 2.68, + "learning_rate": 8.262928348628373e-06, + "loss": 1.4363, + "step": 34080 + }, + { + "epoch": 2.68, + "learning_rate": 8.258883256798694e-06, + "loss": 1.4826, + "step": 34081 + }, + { + "epoch": 2.68, + "learning_rate": 8.254839127313017e-06, + "loss": 1.4482, + "step": 34082 + }, + { + "epoch": 2.68, + "learning_rate": 8.250795960198741e-06, + "loss": 1.4958, + "step": 34083 + }, + { + "epoch": 2.68, + "learning_rate": 8.246753755483326e-06, + "loss": 1.4318, + "step": 34084 + }, + { + "epoch": 2.68, + "learning_rate": 8.24271251319425e-06, + "loss": 1.4146, + "step": 34085 + }, + { + "epoch": 2.68, + "learning_rate": 8.238672233358939e-06, + "loss": 1.4565, + "step": 34086 + }, + { + "epoch": 2.68, + "learning_rate": 8.23463291600479e-06, + "loss": 1.4341, + "step": 34087 + }, + { + "epoch": 2.68, + "learning_rate": 8.230594561159249e-06, + "loss": 1.4797, + "step": 34088 + }, + { + "epoch": 2.68, + "learning_rate": 8.22655716884974e-06, + "loss": 1.3939, + "step": 34089 + }, + { + "epoch": 2.68, + "learning_rate": 8.222520739103693e-06, + "loss": 1.4348, + "step": 34090 + }, + { + "epoch": 2.68, + "learning_rate": 8.218485271948456e-06, + "loss": 1.484, + "step": 34091 + }, + { + "epoch": 2.68, + "learning_rate": 8.214450767411485e-06, + "loss": 1.4366, + "step": 34092 + }, + { + "epoch": 2.68, + "learning_rate": 8.210417225520144e-06, + "loss": 1.4444, + "step": 34093 + }, + { + "epoch": 2.68, + "learning_rate": 8.206384646301812e-06, + "loss": 1.4534, + "step": 34094 + }, + { + "epoch": 2.68, + "learning_rate": 8.202353029783899e-06, + "loss": 1.4918, + "step": 34095 + }, + { + "epoch": 2.68, + "learning_rate": 8.198322375993732e-06, + "loss": 1.4767, + "step": 34096 + }, + { + "epoch": 2.68, + "learning_rate": 8.194292684958726e-06, + "loss": 1.4047, + "step": 34097 + }, + { + "epoch": 2.68, + "learning_rate": 8.190263956706206e-06, + "loss": 1.4581, + "step": 34098 + }, + { + "epoch": 2.68, + "learning_rate": 8.186236191263551e-06, + "loss": 1.4138, + "step": 34099 + }, + { + "epoch": 2.68, + "learning_rate": 8.18220938865809e-06, + "loss": 1.4026, + "step": 34100 + }, + { + "epoch": 2.68, + "learning_rate": 8.17818354891715e-06, + "loss": 1.4662, + "step": 34101 + }, + { + "epoch": 2.68, + "learning_rate": 8.174158672068093e-06, + "loss": 1.4885, + "step": 34102 + }, + { + "epoch": 2.68, + "learning_rate": 8.17013475813823e-06, + "loss": 1.4675, + "step": 34103 + }, + { + "epoch": 2.68, + "learning_rate": 8.166111807154907e-06, + "loss": 1.3854, + "step": 34104 + }, + { + "epoch": 2.68, + "learning_rate": 8.162089819145368e-06, + "loss": 1.4449, + "step": 34105 + }, + { + "epoch": 2.68, + "learning_rate": 8.158068794137007e-06, + "loss": 1.4797, + "step": 34106 + }, + { + "epoch": 2.68, + "learning_rate": 8.15404873215707e-06, + "loss": 1.4773, + "step": 34107 + }, + { + "epoch": 2.68, + "learning_rate": 8.150029633232852e-06, + "loss": 1.4847, + "step": 34108 + }, + { + "epoch": 2.68, + "learning_rate": 8.146011497391663e-06, + "loss": 1.4145, + "step": 34109 + }, + { + "epoch": 2.68, + "learning_rate": 8.141994324660783e-06, + "loss": 1.3793, + "step": 34110 + }, + { + "epoch": 2.68, + "learning_rate": 8.137978115067456e-06, + "loss": 1.4853, + "step": 34111 + }, + { + "epoch": 2.68, + "learning_rate": 8.133962868638977e-06, + "loss": 1.4135, + "step": 34112 + }, + { + "epoch": 2.68, + "learning_rate": 8.129948585402623e-06, + "loss": 1.4135, + "step": 34113 + }, + { + "epoch": 2.68, + "learning_rate": 8.125935265385624e-06, + "loss": 1.4674, + "step": 34114 + }, + { + "epoch": 2.68, + "learning_rate": 8.121922908615208e-06, + "loss": 1.4809, + "step": 34115 + }, + { + "epoch": 2.68, + "learning_rate": 8.117911515118653e-06, + "loss": 1.4769, + "step": 34116 + }, + { + "epoch": 2.68, + "learning_rate": 8.113901084923203e-06, + "loss": 1.4128, + "step": 34117 + }, + { + "epoch": 2.68, + "learning_rate": 8.109891618056035e-06, + "loss": 1.4467, + "step": 34118 + }, + { + "epoch": 2.68, + "learning_rate": 8.105883114544414e-06, + "loss": 1.4636, + "step": 34119 + }, + { + "epoch": 2.68, + "learning_rate": 8.10187557441555e-06, + "loss": 1.4629, + "step": 34120 + }, + { + "epoch": 2.68, + "learning_rate": 8.097868997696622e-06, + "loss": 1.4617, + "step": 34121 + }, + { + "epoch": 2.68, + "learning_rate": 8.09386338441489e-06, + "loss": 1.4305, + "step": 34122 + }, + { + "epoch": 2.68, + "learning_rate": 8.089858734597498e-06, + "loss": 1.4643, + "step": 34123 + }, + { + "epoch": 2.68, + "learning_rate": 8.08585504827166e-06, + "loss": 1.4319, + "step": 34124 + }, + { + "epoch": 2.68, + "learning_rate": 8.081852325464522e-06, + "loss": 1.4056, + "step": 34125 + }, + { + "epoch": 2.69, + "learning_rate": 8.077850566203325e-06, + "loss": 1.4447, + "step": 34126 + }, + { + "epoch": 2.69, + "learning_rate": 8.0738497705152e-06, + "loss": 1.4268, + "step": 34127 + }, + { + "epoch": 2.69, + "learning_rate": 8.069849938427275e-06, + "loss": 1.4066, + "step": 34128 + }, + { + "epoch": 2.69, + "learning_rate": 8.06585106996676e-06, + "loss": 1.3602, + "step": 34129 + }, + { + "epoch": 2.69, + "learning_rate": 8.06185316516082e-06, + "loss": 1.435, + "step": 34130 + }, + { + "epoch": 2.69, + "learning_rate": 8.057856224036563e-06, + "loss": 1.4544, + "step": 34131 + }, + { + "epoch": 2.69, + "learning_rate": 8.053860246621101e-06, + "loss": 1.4421, + "step": 34132 + }, + { + "epoch": 2.69, + "learning_rate": 8.049865232941633e-06, + "loss": 1.455, + "step": 34133 + }, + { + "epoch": 2.69, + "learning_rate": 8.045871183025232e-06, + "loss": 1.4632, + "step": 34134 + }, + { + "epoch": 2.69, + "learning_rate": 8.041878096899012e-06, + "loss": 1.4533, + "step": 34135 + }, + { + "epoch": 2.69, + "learning_rate": 8.03788597459012e-06, + "loss": 1.3713, + "step": 34136 + }, + { + "epoch": 2.69, + "learning_rate": 8.033894816125646e-06, + "loss": 1.4694, + "step": 34137 + }, + { + "epoch": 2.69, + "learning_rate": 8.029904621532656e-06, + "loss": 1.4352, + "step": 34138 + }, + { + "epoch": 2.69, + "learning_rate": 8.025915390838295e-06, + "loss": 1.479, + "step": 34139 + }, + { + "epoch": 2.69, + "learning_rate": 8.021927124069621e-06, + "loss": 1.4129, + "step": 34140 + }, + { + "epoch": 2.69, + "learning_rate": 8.0179398212537e-06, + "loss": 1.4279, + "step": 34141 + }, + { + "epoch": 2.69, + "learning_rate": 8.013953482417606e-06, + "loss": 1.4306, + "step": 34142 + }, + { + "epoch": 2.69, + "learning_rate": 8.009968107588404e-06, + "loss": 1.4482, + "step": 34143 + }, + { + "epoch": 2.69, + "learning_rate": 8.005983696793188e-06, + "loss": 1.5042, + "step": 34144 + }, + { + "epoch": 2.69, + "learning_rate": 8.002000250058987e-06, + "loss": 1.4825, + "step": 34145 + }, + { + "epoch": 2.69, + "learning_rate": 7.99801776741283e-06, + "loss": 1.4806, + "step": 34146 + }, + { + "epoch": 2.69, + "learning_rate": 7.994036248881775e-06, + "loss": 1.4511, + "step": 34147 + }, + { + "epoch": 2.69, + "learning_rate": 7.990055694492852e-06, + "loss": 1.4365, + "step": 34148 + }, + { + "epoch": 2.69, + "learning_rate": 7.986076104273075e-06, + "loss": 1.4353, + "step": 34149 + }, + { + "epoch": 2.69, + "learning_rate": 7.982097478249472e-06, + "loss": 1.4534, + "step": 34150 + }, + { + "epoch": 2.69, + "learning_rate": 7.978119816449069e-06, + "loss": 1.451, + "step": 34151 + }, + { + "epoch": 2.69, + "learning_rate": 7.97414311889883e-06, + "loss": 1.491, + "step": 34152 + }, + { + "epoch": 2.69, + "learning_rate": 7.970167385625813e-06, + "loss": 1.4862, + "step": 34153 + }, + { + "epoch": 2.69, + "learning_rate": 7.966192616656968e-06, + "loss": 1.4649, + "step": 34154 + }, + { + "epoch": 2.69, + "learning_rate": 7.96221881201929e-06, + "loss": 1.442, + "step": 34155 + }, + { + "epoch": 2.69, + "learning_rate": 7.95824597173977e-06, + "loss": 1.4696, + "step": 34156 + }, + { + "epoch": 2.69, + "learning_rate": 7.954274095845386e-06, + "loss": 1.4465, + "step": 34157 + }, + { + "epoch": 2.69, + "learning_rate": 7.950303184363088e-06, + "loss": 1.4526, + "step": 34158 + }, + { + "epoch": 2.69, + "learning_rate": 7.946333237319801e-06, + "loss": 1.4481, + "step": 34159 + }, + { + "epoch": 2.69, + "learning_rate": 7.942364254742555e-06, + "loss": 1.4288, + "step": 34160 + }, + { + "epoch": 2.69, + "learning_rate": 7.938396236658262e-06, + "loss": 1.4903, + "step": 34161 + }, + { + "epoch": 2.69, + "learning_rate": 7.934429183093865e-06, + "loss": 1.4646, + "step": 34162 + }, + { + "epoch": 2.69, + "learning_rate": 7.930463094076279e-06, + "loss": 1.4852, + "step": 34163 + }, + { + "epoch": 2.69, + "learning_rate": 7.926497969632479e-06, + "loss": 1.4487, + "step": 34164 + }, + { + "epoch": 2.69, + "learning_rate": 7.922533809789328e-06, + "loss": 1.4699, + "step": 34165 + }, + { + "epoch": 2.69, + "learning_rate": 7.918570614573771e-06, + "loss": 1.3873, + "step": 34166 + }, + { + "epoch": 2.69, + "learning_rate": 7.914608384012721e-06, + "loss": 1.4349, + "step": 34167 + }, + { + "epoch": 2.69, + "learning_rate": 7.910647118133073e-06, + "loss": 1.4452, + "step": 34168 + }, + { + "epoch": 2.69, + "learning_rate": 7.906686816961706e-06, + "loss": 1.4433, + "step": 34169 + }, + { + "epoch": 2.69, + "learning_rate": 7.902727480525528e-06, + "loss": 1.4549, + "step": 34170 + }, + { + "epoch": 2.69, + "learning_rate": 7.898769108851421e-06, + "loss": 1.4224, + "step": 34171 + }, + { + "epoch": 2.69, + "learning_rate": 7.894811701966247e-06, + "loss": 1.447, + "step": 34172 + }, + { + "epoch": 2.69, + "learning_rate": 7.890855259896884e-06, + "loss": 1.4588, + "step": 34173 + }, + { + "epoch": 2.69, + "learning_rate": 7.886899782670208e-06, + "loss": 1.4352, + "step": 34174 + }, + { + "epoch": 2.69, + "learning_rate": 7.882945270313018e-06, + "loss": 1.4507, + "step": 34175 + }, + { + "epoch": 2.69, + "learning_rate": 7.878991722852207e-06, + "loss": 1.4712, + "step": 34176 + }, + { + "epoch": 2.69, + "learning_rate": 7.875039140314638e-06, + "loss": 1.4248, + "step": 34177 + }, + { + "epoch": 2.69, + "learning_rate": 7.871087522727138e-06, + "loss": 1.4181, + "step": 34178 + }, + { + "epoch": 2.69, + "learning_rate": 7.86713687011647e-06, + "loss": 1.4847, + "step": 34179 + }, + { + "epoch": 2.69, + "learning_rate": 7.863187182509544e-06, + "loss": 1.4288, + "step": 34180 + }, + { + "epoch": 2.69, + "learning_rate": 7.859238459933142e-06, + "loss": 1.452, + "step": 34181 + }, + { + "epoch": 2.69, + "learning_rate": 7.855290702414074e-06, + "loss": 1.4422, + "step": 34182 + }, + { + "epoch": 2.69, + "learning_rate": 7.851343909979118e-06, + "loss": 1.4452, + "step": 34183 + }, + { + "epoch": 2.69, + "learning_rate": 7.847398082655105e-06, + "loss": 1.446, + "step": 34184 + }, + { + "epoch": 2.69, + "learning_rate": 7.843453220468809e-06, + "loss": 1.5013, + "step": 34185 + }, + { + "epoch": 2.69, + "learning_rate": 7.839509323447013e-06, + "loss": 1.4731, + "step": 34186 + }, + { + "epoch": 2.69, + "learning_rate": 7.83556639161651e-06, + "loss": 1.4183, + "step": 34187 + }, + { + "epoch": 2.69, + "learning_rate": 7.831624425004047e-06, + "loss": 1.494, + "step": 34188 + }, + { + "epoch": 2.69, + "learning_rate": 7.8276834236364e-06, + "loss": 1.4819, + "step": 34189 + }, + { + "epoch": 2.69, + "learning_rate": 7.823743387540332e-06, + "loss": 1.4632, + "step": 34190 + }, + { + "epoch": 2.69, + "learning_rate": 7.819804316742574e-06, + "loss": 1.4457, + "step": 34191 + }, + { + "epoch": 2.69, + "learning_rate": 7.8158662112699e-06, + "loss": 1.4844, + "step": 34192 + }, + { + "epoch": 2.69, + "learning_rate": 7.811929071149009e-06, + "loss": 1.4602, + "step": 34193 + }, + { + "epoch": 2.69, + "learning_rate": 7.807992896406662e-06, + "loss": 1.4196, + "step": 34194 + }, + { + "epoch": 2.69, + "learning_rate": 7.804057687069604e-06, + "loss": 1.4562, + "step": 34195 + }, + { + "epoch": 2.69, + "learning_rate": 7.80012344316448e-06, + "loss": 1.4388, + "step": 34196 + }, + { + "epoch": 2.69, + "learning_rate": 7.79619016471807e-06, + "loss": 1.4679, + "step": 34197 + }, + { + "epoch": 2.69, + "learning_rate": 7.792257851757066e-06, + "loss": 1.4233, + "step": 34198 + }, + { + "epoch": 2.69, + "learning_rate": 7.788326504308134e-06, + "loss": 1.4322, + "step": 34199 + }, + { + "epoch": 2.69, + "learning_rate": 7.784396122397984e-06, + "loss": 1.4592, + "step": 34200 + }, + { + "epoch": 2.69, + "learning_rate": 7.780466706053312e-06, + "loss": 1.4335, + "step": 34201 + }, + { + "epoch": 2.69, + "learning_rate": 7.776538255300795e-06, + "loss": 1.4456, + "step": 34202 + }, + { + "epoch": 2.69, + "learning_rate": 7.772610770167082e-06, + "loss": 1.4232, + "step": 34203 + }, + { + "epoch": 2.69, + "learning_rate": 7.768684250678864e-06, + "loss": 1.4889, + "step": 34204 + }, + { + "epoch": 2.69, + "learning_rate": 7.764758696862805e-06, + "loss": 1.4405, + "step": 34205 + }, + { + "epoch": 2.69, + "learning_rate": 7.7608341087455e-06, + "loss": 1.4552, + "step": 34206 + }, + { + "epoch": 2.69, + "learning_rate": 7.756910486353663e-06, + "loss": 1.4076, + "step": 34207 + }, + { + "epoch": 2.69, + "learning_rate": 7.752987829713903e-06, + "loss": 1.4256, + "step": 34208 + }, + { + "epoch": 2.69, + "learning_rate": 7.749066138852883e-06, + "loss": 1.4658, + "step": 34209 + }, + { + "epoch": 2.69, + "learning_rate": 7.745145413797166e-06, + "loss": 1.4429, + "step": 34210 + }, + { + "epoch": 2.69, + "learning_rate": 7.74122565457343e-06, + "loss": 1.4974, + "step": 34211 + }, + { + "epoch": 2.69, + "learning_rate": 7.73730686120827e-06, + "loss": 1.3935, + "step": 34212 + }, + { + "epoch": 2.69, + "learning_rate": 7.733389033728265e-06, + "loss": 1.4721, + "step": 34213 + }, + { + "epoch": 2.69, + "learning_rate": 7.729472172160061e-06, + "loss": 1.5133, + "step": 34214 + }, + { + "epoch": 2.69, + "learning_rate": 7.725556276530237e-06, + "loss": 1.467, + "step": 34215 + }, + { + "epoch": 2.69, + "learning_rate": 7.721641346865353e-06, + "loss": 1.4576, + "step": 34216 + }, + { + "epoch": 2.69, + "learning_rate": 7.717727383192008e-06, + "loss": 1.4077, + "step": 34217 + }, + { + "epoch": 2.69, + "learning_rate": 7.713814385536792e-06, + "loss": 1.4164, + "step": 34218 + }, + { + "epoch": 2.69, + "learning_rate": 7.709902353926257e-06, + "loss": 1.4104, + "step": 34219 + }, + { + "epoch": 2.69, + "learning_rate": 7.705991288386942e-06, + "loss": 1.4841, + "step": 34220 + }, + { + "epoch": 2.69, + "learning_rate": 7.70208118894543e-06, + "loss": 1.4827, + "step": 34221 + }, + { + "epoch": 2.69, + "learning_rate": 7.698172055628249e-06, + "loss": 1.5171, + "step": 34222 + }, + { + "epoch": 2.69, + "learning_rate": 7.694263888461976e-06, + "loss": 1.4176, + "step": 34223 + }, + { + "epoch": 2.69, + "learning_rate": 7.690356687473092e-06, + "loss": 1.4279, + "step": 34224 + }, + { + "epoch": 2.69, + "learning_rate": 7.686450452688192e-06, + "loss": 1.4202, + "step": 34225 + }, + { + "epoch": 2.69, + "learning_rate": 7.682545184133737e-06, + "loss": 1.3891, + "step": 34226 + }, + { + "epoch": 2.69, + "learning_rate": 7.678640881836256e-06, + "loss": 1.4172, + "step": 34227 + }, + { + "epoch": 2.69, + "learning_rate": 7.674737545822279e-06, + "loss": 1.4763, + "step": 34228 + }, + { + "epoch": 2.69, + "learning_rate": 7.670835176118284e-06, + "loss": 1.521, + "step": 34229 + }, + { + "epoch": 2.69, + "learning_rate": 7.666933772750766e-06, + "loss": 1.4635, + "step": 34230 + }, + { + "epoch": 2.69, + "learning_rate": 7.663033335746238e-06, + "loss": 1.4923, + "step": 34231 + }, + { + "epoch": 2.69, + "learning_rate": 7.659133865131163e-06, + "loss": 1.4208, + "step": 34232 + }, + { + "epoch": 2.69, + "learning_rate": 7.655235360932e-06, + "loss": 1.4379, + "step": 34233 + }, + { + "epoch": 2.69, + "learning_rate": 7.651337823175263e-06, + "loss": 1.4792, + "step": 34234 + }, + { + "epoch": 2.69, + "learning_rate": 7.647441251887381e-06, + "loss": 1.3961, + "step": 34235 + }, + { + "epoch": 2.69, + "learning_rate": 7.643545647094817e-06, + "loss": 1.4944, + "step": 34236 + }, + { + "epoch": 2.69, + "learning_rate": 7.639651008824e-06, + "loss": 1.4588, + "step": 34237 + }, + { + "epoch": 2.69, + "learning_rate": 7.63575733710139e-06, + "loss": 1.4158, + "step": 34238 + }, + { + "epoch": 2.69, + "learning_rate": 7.631864631953449e-06, + "loss": 1.4166, + "step": 34239 + }, + { + "epoch": 2.69, + "learning_rate": 7.627972893406575e-06, + "loss": 1.4654, + "step": 34240 + }, + { + "epoch": 2.69, + "learning_rate": 7.624082121487196e-06, + "loss": 1.3941, + "step": 34241 + }, + { + "epoch": 2.69, + "learning_rate": 7.6201923162217236e-06, + "loss": 1.4068, + "step": 34242 + }, + { + "epoch": 2.69, + "learning_rate": 7.616303477636587e-06, + "loss": 1.4086, + "step": 34243 + }, + { + "epoch": 2.69, + "learning_rate": 7.6124156057581656e-06, + "loss": 1.4634, + "step": 34244 + }, + { + "epoch": 2.69, + "learning_rate": 7.60852870061287e-06, + "loss": 1.5052, + "step": 34245 + }, + { + "epoch": 2.69, + "learning_rate": 7.604642762227098e-06, + "loss": 1.417, + "step": 34246 + }, + { + "epoch": 2.69, + "learning_rate": 7.600757790627193e-06, + "loss": 1.4182, + "step": 34247 + }, + { + "epoch": 2.69, + "learning_rate": 7.596873785839586e-06, + "loss": 1.4479, + "step": 34248 + }, + { + "epoch": 2.69, + "learning_rate": 7.592990747890621e-06, + "loss": 1.5166, + "step": 34249 + }, + { + "epoch": 2.69, + "learning_rate": 7.5891086768066265e-06, + "loss": 1.4651, + "step": 34250 + }, + { + "epoch": 2.69, + "learning_rate": 7.585227572614033e-06, + "loss": 1.3815, + "step": 34251 + }, + { + "epoch": 2.69, + "learning_rate": 7.581347435339152e-06, + "loss": 1.4222, + "step": 34252 + }, + { + "epoch": 2.7, + "learning_rate": 7.57746826500833e-06, + "loss": 1.5019, + "step": 34253 + }, + { + "epoch": 2.7, + "learning_rate": 7.573590061647844e-06, + "loss": 1.4448, + "step": 34254 + }, + { + "epoch": 2.7, + "learning_rate": 7.569712825284141e-06, + "loss": 1.4308, + "step": 34255 + }, + { + "epoch": 2.7, + "learning_rate": 7.565836555943483e-06, + "loss": 1.3866, + "step": 34256 + }, + { + "epoch": 2.7, + "learning_rate": 7.561961253652199e-06, + "loss": 1.4655, + "step": 34257 + }, + { + "epoch": 2.7, + "learning_rate": 7.5580869184365674e-06, + "loss": 1.4377, + "step": 34258 + }, + { + "epoch": 2.7, + "learning_rate": 7.5542135503229515e-06, + "loss": 1.4504, + "step": 34259 + }, + { + "epoch": 2.7, + "learning_rate": 7.550341149337613e-06, + "loss": 1.5038, + "step": 34260 + }, + { + "epoch": 2.7, + "learning_rate": 7.5464697155068146e-06, + "loss": 1.4515, + "step": 34261 + }, + { + "epoch": 2.7, + "learning_rate": 7.542599248856917e-06, + "loss": 1.4173, + "step": 34262 + }, + { + "epoch": 2.7, + "learning_rate": 7.538729749414135e-06, + "loss": 1.4746, + "step": 34263 + }, + { + "epoch": 2.7, + "learning_rate": 7.534861217204746e-06, + "loss": 1.4482, + "step": 34264 + }, + { + "epoch": 2.7, + "learning_rate": 7.530993652255063e-06, + "loss": 1.4818, + "step": 34265 + }, + { + "epoch": 2.7, + "learning_rate": 7.527127054591298e-06, + "loss": 1.4638, + "step": 34266 + }, + { + "epoch": 2.7, + "learning_rate": 7.523261424239712e-06, + "loss": 1.4167, + "step": 34267 + }, + { + "epoch": 2.7, + "learning_rate": 7.519396761226554e-06, + "loss": 1.461, + "step": 34268 + }, + { + "epoch": 2.7, + "learning_rate": 7.515533065578066e-06, + "loss": 1.4564, + "step": 34269 + }, + { + "epoch": 2.7, + "learning_rate": 7.51167033732048e-06, + "loss": 1.4128, + "step": 34270 + }, + { + "epoch": 2.7, + "learning_rate": 7.507808576480023e-06, + "loss": 1.4694, + "step": 34271 + }, + { + "epoch": 2.7, + "learning_rate": 7.503947783082909e-06, + "loss": 1.4849, + "step": 34272 + }, + { + "epoch": 2.7, + "learning_rate": 7.500087957155365e-06, + "loss": 1.4034, + "step": 34273 + }, + { + "epoch": 2.7, + "learning_rate": 7.496229098723589e-06, + "loss": 1.4389, + "step": 34274 + }, + { + "epoch": 2.7, + "learning_rate": 7.492371207813758e-06, + "loss": 1.4347, + "step": 34275 + }, + { + "epoch": 2.7, + "learning_rate": 7.488514284452101e-06, + "loss": 1.4382, + "step": 34276 + }, + { + "epoch": 2.7, + "learning_rate": 7.484658328664783e-06, + "loss": 1.4984, + "step": 34277 + }, + { + "epoch": 2.7, + "learning_rate": 7.480803340477981e-06, + "loss": 1.4236, + "step": 34278 + }, + { + "epoch": 2.7, + "learning_rate": 7.476949319917874e-06, + "loss": 1.4603, + "step": 34279 + }, + { + "epoch": 2.7, + "learning_rate": 7.473096267010659e-06, + "loss": 1.48, + "step": 34280 + }, + { + "epoch": 2.7, + "learning_rate": 7.46924418178243e-06, + "loss": 1.3811, + "step": 34281 + }, + { + "epoch": 2.7, + "learning_rate": 7.4653930642594e-06, + "loss": 1.4549, + "step": 34282 + }, + { + "epoch": 2.7, + "learning_rate": 7.461542914467683e-06, + "loss": 1.5273, + "step": 34283 + }, + { + "epoch": 2.7, + "learning_rate": 7.457693732433423e-06, + "loss": 1.4807, + "step": 34284 + }, + { + "epoch": 2.7, + "learning_rate": 7.453845518182766e-06, + "loss": 1.4382, + "step": 34285 + }, + { + "epoch": 2.7, + "learning_rate": 7.449998271741842e-06, + "loss": 1.4729, + "step": 34286 + }, + { + "epoch": 2.7, + "learning_rate": 7.446151993136779e-06, + "loss": 1.4708, + "step": 34287 + }, + { + "epoch": 2.7, + "learning_rate": 7.442306682393639e-06, + "loss": 1.4852, + "step": 34288 + }, + { + "epoch": 2.7, + "learning_rate": 7.4384623395386036e-06, + "loss": 1.428, + "step": 34289 + }, + { + "epoch": 2.7, + "learning_rate": 7.434618964597733e-06, + "loss": 1.4733, + "step": 34290 + }, + { + "epoch": 2.7, + "learning_rate": 7.43077655759709e-06, + "loss": 1.4596, + "step": 34291 + }, + { + "epoch": 2.7, + "learning_rate": 7.426935118562838e-06, + "loss": 1.4681, + "step": 34292 + }, + { + "epoch": 2.7, + "learning_rate": 7.423094647521005e-06, + "loss": 1.5197, + "step": 34293 + }, + { + "epoch": 2.7, + "learning_rate": 7.419255144497688e-06, + "loss": 1.4142, + "step": 34294 + }, + { + "epoch": 2.7, + "learning_rate": 7.415416609518915e-06, + "loss": 1.4315, + "step": 34295 + }, + { + "epoch": 2.7, + "learning_rate": 7.411579042610799e-06, + "loss": 1.4475, + "step": 34296 + }, + { + "epoch": 2.7, + "learning_rate": 7.407742443799386e-06, + "loss": 1.5093, + "step": 34297 + }, + { + "epoch": 2.7, + "learning_rate": 7.403906813110688e-06, + "loss": 1.4151, + "step": 34298 + }, + { + "epoch": 2.7, + "learning_rate": 7.400072150570785e-06, + "loss": 1.4439, + "step": 34299 + }, + { + "epoch": 2.7, + "learning_rate": 7.3962384562057055e-06, + "loss": 1.4239, + "step": 34300 + }, + { + "epoch": 2.7, + "learning_rate": 7.392405730041462e-06, + "loss": 1.458, + "step": 34301 + }, + { + "epoch": 2.7, + "learning_rate": 7.388573972104067e-06, + "loss": 1.4718, + "step": 34302 + }, + { + "epoch": 2.7, + "learning_rate": 7.384743182419584e-06, + "loss": 1.4661, + "step": 34303 + }, + { + "epoch": 2.7, + "learning_rate": 7.38091336101399e-06, + "loss": 1.4426, + "step": 34304 + }, + { + "epoch": 2.7, + "learning_rate": 7.3770845079132835e-06, + "loss": 1.4188, + "step": 34305 + }, + { + "epoch": 2.7, + "learning_rate": 7.373256623143476e-06, + "loss": 1.4922, + "step": 34306 + }, + { + "epoch": 2.7, + "learning_rate": 7.369429706730545e-06, + "loss": 1.4861, + "step": 34307 + }, + { + "epoch": 2.7, + "learning_rate": 7.365603758700456e-06, + "loss": 1.4668, + "step": 34308 + }, + { + "epoch": 2.7, + "learning_rate": 7.361778779079236e-06, + "loss": 1.4323, + "step": 34309 + }, + { + "epoch": 2.7, + "learning_rate": 7.3579547678928155e-06, + "loss": 1.4543, + "step": 34310 + }, + { + "epoch": 2.7, + "learning_rate": 7.354131725167172e-06, + "loss": 1.472, + "step": 34311 + }, + { + "epoch": 2.7, + "learning_rate": 7.350309650928238e-06, + "loss": 1.389, + "step": 34312 + }, + { + "epoch": 2.7, + "learning_rate": 7.3464885452019896e-06, + "loss": 1.3844, + "step": 34313 + }, + { + "epoch": 2.7, + "learning_rate": 7.342668408014357e-06, + "loss": 1.4205, + "step": 34314 + }, + { + "epoch": 2.7, + "learning_rate": 7.33884923939127e-06, + "loss": 1.4407, + "step": 34315 + }, + { + "epoch": 2.7, + "learning_rate": 7.335031039358674e-06, + "loss": 1.4669, + "step": 34316 + }, + { + "epoch": 2.7, + "learning_rate": 7.331213807942499e-06, + "loss": 1.4685, + "step": 34317 + }, + { + "epoch": 2.7, + "learning_rate": 7.327397545168656e-06, + "loss": 1.4783, + "step": 34318 + }, + { + "epoch": 2.7, + "learning_rate": 7.323582251063043e-06, + "loss": 1.4591, + "step": 34319 + }, + { + "epoch": 2.7, + "learning_rate": 7.319767925651571e-06, + "loss": 1.4139, + "step": 34320 + }, + { + "epoch": 2.7, + "learning_rate": 7.315954568960153e-06, + "loss": 1.4495, + "step": 34321 + }, + { + "epoch": 2.7, + "learning_rate": 7.312142181014635e-06, + "loss": 1.4645, + "step": 34322 + }, + { + "epoch": 2.7, + "learning_rate": 7.308330761840947e-06, + "loss": 1.434, + "step": 34323 + }, + { + "epoch": 2.7, + "learning_rate": 7.3045203114649506e-06, + "loss": 1.4141, + "step": 34324 + }, + { + "epoch": 2.7, + "learning_rate": 7.300710829912493e-06, + "loss": 1.4524, + "step": 34325 + }, + { + "epoch": 2.7, + "learning_rate": 7.296902317209485e-06, + "loss": 1.4236, + "step": 34326 + }, + { + "epoch": 2.7, + "learning_rate": 7.293094773381775e-06, + "loss": 1.4182, + "step": 34327 + }, + { + "epoch": 2.7, + "learning_rate": 7.289288198455173e-06, + "loss": 1.498, + "step": 34328 + }, + { + "epoch": 2.7, + "learning_rate": 7.285482592455544e-06, + "loss": 1.4143, + "step": 34329 + }, + { + "epoch": 2.7, + "learning_rate": 7.281677955408749e-06, + "loss": 1.4968, + "step": 34330 + }, + { + "epoch": 2.7, + "learning_rate": 7.277874287340602e-06, + "loss": 1.4415, + "step": 34331 + }, + { + "epoch": 2.7, + "learning_rate": 7.274071588276897e-06, + "loss": 1.4496, + "step": 34332 + }, + { + "epoch": 2.7, + "learning_rate": 7.270269858243516e-06, + "loss": 1.4497, + "step": 34333 + }, + { + "epoch": 2.7, + "learning_rate": 7.266469097266237e-06, + "loss": 1.424, + "step": 34334 + }, + { + "epoch": 2.7, + "learning_rate": 7.2626693053708716e-06, + "loss": 1.4196, + "step": 34335 + }, + { + "epoch": 2.7, + "learning_rate": 7.258870482583184e-06, + "loss": 1.421, + "step": 34336 + }, + { + "epoch": 2.7, + "learning_rate": 7.25507262892902e-06, + "loss": 1.4492, + "step": 34337 + }, + { + "epoch": 2.7, + "learning_rate": 7.251275744434126e-06, + "loss": 1.4419, + "step": 34338 + }, + { + "epoch": 2.7, + "learning_rate": 7.247479829124297e-06, + "loss": 1.4301, + "step": 34339 + }, + { + "epoch": 2.7, + "learning_rate": 7.243684883025314e-06, + "loss": 1.4191, + "step": 34340 + }, + { + "epoch": 2.7, + "learning_rate": 7.239890906162921e-06, + "loss": 1.4675, + "step": 34341 + }, + { + "epoch": 2.7, + "learning_rate": 7.236097898562881e-06, + "loss": 1.4513, + "step": 34342 + }, + { + "epoch": 2.7, + "learning_rate": 7.232305860250959e-06, + "loss": 1.4544, + "step": 34343 + }, + { + "epoch": 2.7, + "learning_rate": 7.228514791252898e-06, + "loss": 1.431, + "step": 34344 + }, + { + "epoch": 2.7, + "learning_rate": 7.22472469159443e-06, + "loss": 1.5101, + "step": 34345 + }, + { + "epoch": 2.7, + "learning_rate": 7.2209355613013e-06, + "loss": 1.4196, + "step": 34346 + }, + { + "epoch": 2.7, + "learning_rate": 7.21714740039922e-06, + "loss": 1.459, + "step": 34347 + }, + { + "epoch": 2.7, + "learning_rate": 7.213360208913904e-06, + "loss": 1.4564, + "step": 34348 + }, + { + "epoch": 2.7, + "learning_rate": 7.209573986871065e-06, + "loss": 1.4645, + "step": 34349 + }, + { + "epoch": 2.7, + "learning_rate": 7.205788734296447e-06, + "loss": 1.3994, + "step": 34350 + }, + { + "epoch": 2.7, + "learning_rate": 7.202004451215732e-06, + "loss": 1.4744, + "step": 34351 + }, + { + "epoch": 2.7, + "learning_rate": 7.198221137654597e-06, + "loss": 1.3785, + "step": 34352 + }, + { + "epoch": 2.7, + "learning_rate": 7.194438793638707e-06, + "loss": 1.4803, + "step": 34353 + }, + { + "epoch": 2.7, + "learning_rate": 7.190657419193807e-06, + "loss": 1.4479, + "step": 34354 + }, + { + "epoch": 2.7, + "learning_rate": 7.186877014345526e-06, + "loss": 1.462, + "step": 34355 + }, + { + "epoch": 2.7, + "learning_rate": 7.183097579119513e-06, + "loss": 1.4693, + "step": 34356 + }, + { + "epoch": 2.7, + "learning_rate": 7.179319113541476e-06, + "loss": 1.4424, + "step": 34357 + }, + { + "epoch": 2.7, + "learning_rate": 7.175541617637065e-06, + "loss": 1.4041, + "step": 34358 + }, + { + "epoch": 2.7, + "learning_rate": 7.171765091431874e-06, + "loss": 1.4635, + "step": 34359 + }, + { + "epoch": 2.7, + "learning_rate": 7.167989534951601e-06, + "loss": 1.4399, + "step": 34360 + }, + { + "epoch": 2.7, + "learning_rate": 7.164214948221858e-06, + "loss": 1.4221, + "step": 34361 + }, + { + "epoch": 2.7, + "learning_rate": 7.160441331268257e-06, + "loss": 1.4959, + "step": 34362 + }, + { + "epoch": 2.7, + "learning_rate": 7.156668684116446e-06, + "loss": 1.4332, + "step": 34363 + }, + { + "epoch": 2.7, + "learning_rate": 7.152897006792002e-06, + "loss": 1.4939, + "step": 34364 + }, + { + "epoch": 2.7, + "learning_rate": 7.14912629932059e-06, + "loss": 1.43, + "step": 34365 + }, + { + "epoch": 2.7, + "learning_rate": 7.145356561727755e-06, + "loss": 1.4311, + "step": 34366 + }, + { + "epoch": 2.7, + "learning_rate": 7.141587794039144e-06, + "loss": 1.4558, + "step": 34367 + }, + { + "epoch": 2.7, + "learning_rate": 7.1378199962803025e-06, + "loss": 1.5395, + "step": 34368 + }, + { + "epoch": 2.7, + "learning_rate": 7.134053168476827e-06, + "loss": 1.4752, + "step": 34369 + }, + { + "epoch": 2.7, + "learning_rate": 7.130287310654281e-06, + "loss": 1.4175, + "step": 34370 + }, + { + "epoch": 2.7, + "learning_rate": 7.126522422838243e-06, + "loss": 1.3812, + "step": 34371 + }, + { + "epoch": 2.7, + "learning_rate": 7.1227585050542935e-06, + "loss": 1.4671, + "step": 34372 + }, + { + "epoch": 2.7, + "learning_rate": 7.118995557327945e-06, + "loss": 1.4731, + "step": 34373 + }, + { + "epoch": 2.7, + "learning_rate": 7.115233579684776e-06, + "loss": 1.463, + "step": 34374 + }, + { + "epoch": 2.7, + "learning_rate": 7.111472572150334e-06, + "loss": 1.445, + "step": 34375 + }, + { + "epoch": 2.7, + "learning_rate": 7.107712534750115e-06, + "loss": 1.4187, + "step": 34376 + }, + { + "epoch": 2.7, + "learning_rate": 7.103953467509682e-06, + "loss": 1.5177, + "step": 34377 + }, + { + "epoch": 2.7, + "learning_rate": 7.100195370454565e-06, + "loss": 1.4026, + "step": 34378 + }, + { + "epoch": 2.7, + "learning_rate": 7.096438243610242e-06, + "loss": 1.4581, + "step": 34379 + }, + { + "epoch": 2.71, + "learning_rate": 7.092682087002244e-06, + "loss": 1.4267, + "step": 34380 + }, + { + "epoch": 2.71, + "learning_rate": 7.0889269006560835e-06, + "loss": 1.4425, + "step": 34381 + }, + { + "epoch": 2.71, + "learning_rate": 7.08517268459724e-06, + "loss": 1.4898, + "step": 34382 + }, + { + "epoch": 2.71, + "learning_rate": 7.081419438851194e-06, + "loss": 1.4447, + "step": 34383 + }, + { + "epoch": 2.71, + "learning_rate": 7.077667163443457e-06, + "loss": 1.4034, + "step": 34384 + }, + { + "epoch": 2.71, + "learning_rate": 7.073915858399493e-06, + "loss": 1.4366, + "step": 34385 + }, + { + "epoch": 2.71, + "learning_rate": 7.070165523744747e-06, + "loss": 1.4224, + "step": 34386 + }, + { + "epoch": 2.71, + "learning_rate": 7.066416159504734e-06, + "loss": 1.4556, + "step": 34387 + }, + { + "epoch": 2.71, + "learning_rate": 7.062667765704866e-06, + "loss": 1.4341, + "step": 34388 + }, + { + "epoch": 2.71, + "learning_rate": 7.0589203423706055e-06, + "loss": 1.4685, + "step": 34389 + }, + { + "epoch": 2.71, + "learning_rate": 7.0551738895273655e-06, + "loss": 1.4826, + "step": 34390 + }, + { + "epoch": 2.71, + "learning_rate": 7.051428407200644e-06, + "loss": 1.4417, + "step": 34391 + }, + { + "epoch": 2.71, + "learning_rate": 7.047683895415835e-06, + "loss": 1.4074, + "step": 34392 + }, + { + "epoch": 2.71, + "learning_rate": 7.043940354198335e-06, + "loss": 1.4879, + "step": 34393 + }, + { + "epoch": 2.71, + "learning_rate": 7.040197783573626e-06, + "loss": 1.4634, + "step": 34394 + }, + { + "epoch": 2.71, + "learning_rate": 7.0364561835670516e-06, + "loss": 1.4459, + "step": 34395 + }, + { + "epoch": 2.71, + "learning_rate": 7.03271555420406e-06, + "loss": 1.4032, + "step": 34396 + }, + { + "epoch": 2.71, + "learning_rate": 7.028975895510031e-06, + "loss": 1.3912, + "step": 34397 + }, + { + "epoch": 2.71, + "learning_rate": 7.0252372075103594e-06, + "loss": 1.4857, + "step": 34398 + }, + { + "epoch": 2.71, + "learning_rate": 7.021499490230442e-06, + "loss": 1.4302, + "step": 34399 + }, + { + "epoch": 2.71, + "learning_rate": 7.017762743695627e-06, + "loss": 1.4552, + "step": 34400 + }, + { + "epoch": 2.71, + "learning_rate": 7.014026967931308e-06, + "loss": 1.4508, + "step": 34401 + }, + { + "epoch": 2.71, + "learning_rate": 7.010292162962833e-06, + "loss": 1.3938, + "step": 34402 + }, + { + "epoch": 2.71, + "learning_rate": 7.006558328815548e-06, + "loss": 1.4704, + "step": 34403 + }, + { + "epoch": 2.71, + "learning_rate": 7.00282546551485e-06, + "loss": 1.4439, + "step": 34404 + }, + { + "epoch": 2.71, + "learning_rate": 6.999093573086051e-06, + "loss": 1.4194, + "step": 34405 + }, + { + "epoch": 2.71, + "learning_rate": 6.995362651554498e-06, + "loss": 1.4204, + "step": 34406 + }, + { + "epoch": 2.71, + "learning_rate": 6.9916327009454875e-06, + "loss": 1.4517, + "step": 34407 + }, + { + "epoch": 2.71, + "learning_rate": 6.987903721284399e-06, + "loss": 1.4524, + "step": 34408 + }, + { + "epoch": 2.71, + "learning_rate": 6.984175712596513e-06, + "loss": 1.4665, + "step": 34409 + }, + { + "epoch": 2.71, + "learning_rate": 6.980448674907141e-06, + "loss": 1.4458, + "step": 34410 + }, + { + "epoch": 2.71, + "learning_rate": 6.976722608241597e-06, + "loss": 1.4165, + "step": 34411 + }, + { + "epoch": 2.71, + "learning_rate": 6.9729975126251944e-06, + "loss": 1.4713, + "step": 34412 + }, + { + "epoch": 2.71, + "learning_rate": 6.969273388083213e-06, + "loss": 1.4509, + "step": 34413 + }, + { + "epoch": 2.71, + "learning_rate": 6.9655502346409155e-06, + "loss": 1.4205, + "step": 34414 + }, + { + "epoch": 2.71, + "learning_rate": 6.9618280523236145e-06, + "loss": 1.456, + "step": 34415 + }, + { + "epoch": 2.71, + "learning_rate": 6.958106841156574e-06, + "loss": 1.414, + "step": 34416 + }, + { + "epoch": 2.71, + "learning_rate": 6.954386601165024e-06, + "loss": 1.448, + "step": 34417 + }, + { + "epoch": 2.71, + "learning_rate": 6.950667332374277e-06, + "loss": 1.446, + "step": 34418 + }, + { + "epoch": 2.71, + "learning_rate": 6.946949034809546e-06, + "loss": 1.3927, + "step": 34419 + }, + { + "epoch": 2.71, + "learning_rate": 6.943231708496078e-06, + "loss": 1.3902, + "step": 34420 + }, + { + "epoch": 2.71, + "learning_rate": 6.939515353459135e-06, + "loss": 1.4326, + "step": 34421 + }, + { + "epoch": 2.71, + "learning_rate": 6.935799969723949e-06, + "loss": 1.4442, + "step": 34422 + }, + { + "epoch": 2.71, + "learning_rate": 6.932085557315714e-06, + "loss": 1.4567, + "step": 34423 + }, + { + "epoch": 2.71, + "learning_rate": 6.928372116259662e-06, + "loss": 1.4171, + "step": 34424 + }, + { + "epoch": 2.71, + "learning_rate": 6.924659646581021e-06, + "loss": 1.4447, + "step": 34425 + }, + { + "epoch": 2.71, + "learning_rate": 6.920948148304972e-06, + "loss": 1.4648, + "step": 34426 + }, + { + "epoch": 2.71, + "learning_rate": 6.917237621456745e-06, + "loss": 1.4578, + "step": 34427 + }, + { + "epoch": 2.71, + "learning_rate": 6.913528066061485e-06, + "loss": 1.4919, + "step": 34428 + }, + { + "epoch": 2.71, + "learning_rate": 6.909819482144441e-06, + "loss": 1.45, + "step": 34429 + }, + { + "epoch": 2.71, + "learning_rate": 6.906111869730741e-06, + "loss": 1.4477, + "step": 34430 + }, + { + "epoch": 2.71, + "learning_rate": 6.902405228845581e-06, + "loss": 1.4273, + "step": 34431 + }, + { + "epoch": 2.71, + "learning_rate": 6.898699559514126e-06, + "loss": 1.458, + "step": 34432 + }, + { + "epoch": 2.71, + "learning_rate": 6.8949948617615215e-06, + "loss": 1.4557, + "step": 34433 + }, + { + "epoch": 2.71, + "learning_rate": 6.891291135612931e-06, + "loss": 1.4482, + "step": 34434 + }, + { + "epoch": 2.71, + "learning_rate": 6.8875883810935175e-06, + "loss": 1.4131, + "step": 34435 + }, + { + "epoch": 2.71, + "learning_rate": 6.883886598228394e-06, + "loss": 1.4079, + "step": 34436 + }, + { + "epoch": 2.71, + "learning_rate": 6.880185787042674e-06, + "loss": 1.4545, + "step": 34437 + }, + { + "epoch": 2.71, + "learning_rate": 6.876485947561555e-06, + "loss": 1.4438, + "step": 34438 + }, + { + "epoch": 2.71, + "learning_rate": 6.872787079810099e-06, + "loss": 1.433, + "step": 34439 + }, + { + "epoch": 2.71, + "learning_rate": 6.8690891838134365e-06, + "loss": 1.3952, + "step": 34440 + }, + { + "epoch": 2.71, + "learning_rate": 6.865392259596647e-06, + "loss": 1.4215, + "step": 34441 + }, + { + "epoch": 2.71, + "learning_rate": 6.861696307184878e-06, + "loss": 1.4065, + "step": 34442 + }, + { + "epoch": 2.71, + "learning_rate": 6.858001326603191e-06, + "loss": 1.4092, + "step": 34443 + }, + { + "epoch": 2.71, + "learning_rate": 6.854307317876684e-06, + "loss": 1.4319, + "step": 34444 + }, + { + "epoch": 2.71, + "learning_rate": 6.850614281030453e-06, + "loss": 1.4358, + "step": 34445 + }, + { + "epoch": 2.71, + "learning_rate": 6.8469222160895455e-06, + "loss": 1.5018, + "step": 34446 + }, + { + "epoch": 2.71, + "learning_rate": 6.84323112307904e-06, + "loss": 1.4493, + "step": 34447 + }, + { + "epoch": 2.71, + "learning_rate": 6.839541002023985e-06, + "loss": 1.4906, + "step": 34448 + }, + { + "epoch": 2.71, + "learning_rate": 6.835851852949459e-06, + "loss": 1.4467, + "step": 34449 + }, + { + "epoch": 2.71, + "learning_rate": 6.8321636758804925e-06, + "loss": 1.4993, + "step": 34450 + }, + { + "epoch": 2.71, + "learning_rate": 6.8284764708421146e-06, + "loss": 1.4103, + "step": 34451 + }, + { + "epoch": 2.71, + "learning_rate": 6.824790237859374e-06, + "loss": 1.5089, + "step": 34452 + }, + { + "epoch": 2.71, + "learning_rate": 6.821104976957314e-06, + "loss": 1.4423, + "step": 34453 + }, + { + "epoch": 2.71, + "learning_rate": 6.817420688160918e-06, + "loss": 1.462, + "step": 34454 + }, + { + "epoch": 2.71, + "learning_rate": 6.813737371495231e-06, + "loss": 1.47, + "step": 34455 + }, + { + "epoch": 2.71, + "learning_rate": 6.810055026985267e-06, + "loss": 1.4149, + "step": 34456 + }, + { + "epoch": 2.71, + "learning_rate": 6.806373654655972e-06, + "loss": 1.4315, + "step": 34457 + }, + { + "epoch": 2.71, + "learning_rate": 6.802693254532393e-06, + "loss": 1.4478, + "step": 34458 + }, + { + "epoch": 2.71, + "learning_rate": 6.79901382663951e-06, + "loss": 1.3967, + "step": 34459 + }, + { + "epoch": 2.71, + "learning_rate": 6.795335371002303e-06, + "loss": 1.4379, + "step": 34460 + }, + { + "epoch": 2.71, + "learning_rate": 6.791657887645735e-06, + "loss": 1.3921, + "step": 34461 + }, + { + "epoch": 2.71, + "learning_rate": 6.787981376594787e-06, + "loss": 1.3803, + "step": 34462 + }, + { + "epoch": 2.71, + "learning_rate": 6.784305837874421e-06, + "loss": 1.4733, + "step": 34463 + }, + { + "epoch": 2.71, + "learning_rate": 6.780631271509585e-06, + "loss": 1.4698, + "step": 34464 + }, + { + "epoch": 2.71, + "learning_rate": 6.776957677525208e-06, + "loss": 1.407, + "step": 34465 + }, + { + "epoch": 2.71, + "learning_rate": 6.77328505594627e-06, + "loss": 1.4815, + "step": 34466 + }, + { + "epoch": 2.71, + "learning_rate": 6.769613406797686e-06, + "loss": 1.4782, + "step": 34467 + }, + { + "epoch": 2.71, + "learning_rate": 6.765942730104368e-06, + "loss": 1.442, + "step": 34468 + }, + { + "epoch": 2.71, + "learning_rate": 6.76227302589128e-06, + "loss": 1.4621, + "step": 34469 + }, + { + "epoch": 2.71, + "learning_rate": 6.758604294183301e-06, + "loss": 1.4372, + "step": 34470 + }, + { + "epoch": 2.71, + "learning_rate": 6.754936535005328e-06, + "loss": 1.4523, + "step": 34471 + }, + { + "epoch": 2.71, + "learning_rate": 6.751269748382326e-06, + "loss": 1.4718, + "step": 34472 + }, + { + "epoch": 2.71, + "learning_rate": 6.747603934339141e-06, + "loss": 1.4275, + "step": 34473 + }, + { + "epoch": 2.71, + "learning_rate": 6.743939092900652e-06, + "loss": 1.4685, + "step": 34474 + }, + { + "epoch": 2.71, + "learning_rate": 6.740275224091773e-06, + "loss": 1.4692, + "step": 34475 + }, + { + "epoch": 2.71, + "learning_rate": 6.7366123279373685e-06, + "loss": 1.4013, + "step": 34476 + }, + { + "epoch": 2.71, + "learning_rate": 6.732950404462317e-06, + "loss": 1.4614, + "step": 34477 + }, + { + "epoch": 2.71, + "learning_rate": 6.72928945369145e-06, + "loss": 1.4777, + "step": 34478 + }, + { + "epoch": 2.71, + "learning_rate": 6.725629475649663e-06, + "loss": 1.4759, + "step": 34479 + }, + { + "epoch": 2.71, + "learning_rate": 6.721970470361787e-06, + "loss": 1.4394, + "step": 34480 + }, + { + "epoch": 2.71, + "learning_rate": 6.718312437852669e-06, + "loss": 1.4292, + "step": 34481 + }, + { + "epoch": 2.71, + "learning_rate": 6.714655378147121e-06, + "loss": 1.443, + "step": 34482 + }, + { + "epoch": 2.71, + "learning_rate": 6.7109992912700085e-06, + "loss": 1.429, + "step": 34483 + }, + { + "epoch": 2.71, + "learning_rate": 6.707344177246126e-06, + "loss": 1.4948, + "step": 34484 + }, + { + "epoch": 2.71, + "learning_rate": 6.70369003610029e-06, + "loss": 1.5056, + "step": 34485 + }, + { + "epoch": 2.71, + "learning_rate": 6.700036867857345e-06, + "loss": 1.4856, + "step": 34486 + }, + { + "epoch": 2.71, + "learning_rate": 6.696384672542071e-06, + "loss": 1.4083, + "step": 34487 + }, + { + "epoch": 2.71, + "learning_rate": 6.6927334501792325e-06, + "loss": 1.4669, + "step": 34488 + }, + { + "epoch": 2.71, + "learning_rate": 6.68908320079366e-06, + "loss": 1.4412, + "step": 34489 + }, + { + "epoch": 2.71, + "learning_rate": 6.68543392441015e-06, + "loss": 1.4544, + "step": 34490 + }, + { + "epoch": 2.71, + "learning_rate": 6.681785621053448e-06, + "loss": 1.4418, + "step": 34491 + }, + { + "epoch": 2.71, + "learning_rate": 6.678138290748319e-06, + "loss": 1.5232, + "step": 34492 + }, + { + "epoch": 2.71, + "learning_rate": 6.67449193351956e-06, + "loss": 1.449, + "step": 34493 + }, + { + "epoch": 2.71, + "learning_rate": 6.670846549391901e-06, + "loss": 1.4011, + "step": 34494 + }, + { + "epoch": 2.71, + "learning_rate": 6.667202138390071e-06, + "loss": 1.4391, + "step": 34495 + }, + { + "epoch": 2.71, + "learning_rate": 6.663558700538885e-06, + "loss": 1.4542, + "step": 34496 + }, + { + "epoch": 2.71, + "learning_rate": 6.6599162358630055e-06, + "loss": 1.4304, + "step": 34497 + }, + { + "epoch": 2.71, + "learning_rate": 6.6562747443871965e-06, + "loss": 1.4697, + "step": 34498 + }, + { + "epoch": 2.71, + "learning_rate": 6.652634226136188e-06, + "loss": 1.4422, + "step": 34499 + }, + { + "epoch": 2.71, + "learning_rate": 6.648994681134695e-06, + "loss": 1.479, + "step": 34500 + }, + { + "epoch": 2.71, + "learning_rate": 6.6453561094074125e-06, + "loss": 1.4352, + "step": 34501 + }, + { + "epoch": 2.71, + "learning_rate": 6.641718510979039e-06, + "loss": 1.4644, + "step": 34502 + }, + { + "epoch": 2.71, + "learning_rate": 6.638081885874303e-06, + "loss": 1.4196, + "step": 34503 + }, + { + "epoch": 2.71, + "learning_rate": 6.634446234117868e-06, + "loss": 1.473, + "step": 34504 + }, + { + "epoch": 2.71, + "learning_rate": 6.630811555734416e-06, + "loss": 1.4579, + "step": 34505 + }, + { + "epoch": 2.71, + "learning_rate": 6.627177850748644e-06, + "loss": 1.4674, + "step": 34506 + }, + { + "epoch": 2.72, + "learning_rate": 6.623545119185214e-06, + "loss": 1.5135, + "step": 34507 + }, + { + "epoch": 2.72, + "learning_rate": 6.6199133610688075e-06, + "loss": 1.4784, + "step": 34508 + }, + { + "epoch": 2.72, + "learning_rate": 6.6162825764240365e-06, + "loss": 1.4553, + "step": 34509 + }, + { + "epoch": 2.72, + "learning_rate": 6.612652765275617e-06, + "loss": 1.4182, + "step": 34510 + }, + { + "epoch": 2.72, + "learning_rate": 6.6090239276481435e-06, + "loss": 1.4985, + "step": 34511 + }, + { + "epoch": 2.72, + "learning_rate": 6.605396063566248e-06, + "loss": 1.3949, + "step": 34512 + }, + { + "epoch": 2.72, + "learning_rate": 6.601769173054611e-06, + "loss": 1.4572, + "step": 34513 + }, + { + "epoch": 2.72, + "learning_rate": 6.598143256137811e-06, + "loss": 1.4106, + "step": 34514 + }, + { + "epoch": 2.72, + "learning_rate": 6.59451831284048e-06, + "loss": 1.4571, + "step": 34515 + }, + { + "epoch": 2.72, + "learning_rate": 6.590894343187247e-06, + "loss": 1.4878, + "step": 34516 + }, + { + "epoch": 2.72, + "learning_rate": 6.587271347202694e-06, + "loss": 1.4518, + "step": 34517 + }, + { + "epoch": 2.72, + "learning_rate": 6.5836493249114334e-06, + "loss": 1.4516, + "step": 34518 + }, + { + "epoch": 2.72, + "learning_rate": 6.580028276338028e-06, + "loss": 1.4121, + "step": 34519 + }, + { + "epoch": 2.72, + "learning_rate": 6.576408201507111e-06, + "loss": 1.4563, + "step": 34520 + }, + { + "epoch": 2.72, + "learning_rate": 6.572789100443193e-06, + "loss": 1.4205, + "step": 34521 + }, + { + "epoch": 2.72, + "learning_rate": 6.56917097317094e-06, + "loss": 1.4766, + "step": 34522 + }, + { + "epoch": 2.72, + "learning_rate": 6.565553819714814e-06, + "loss": 1.4556, + "step": 34523 + }, + { + "epoch": 2.72, + "learning_rate": 6.561937640099463e-06, + "loss": 1.4466, + "step": 34524 + }, + { + "epoch": 2.72, + "learning_rate": 6.5583224343494005e-06, + "loss": 1.389, + "step": 34525 + }, + { + "epoch": 2.72, + "learning_rate": 6.5547082024891395e-06, + "loss": 1.4704, + "step": 34526 + }, + { + "epoch": 2.72, + "learning_rate": 6.551094944543278e-06, + "loss": 1.4355, + "step": 34527 + }, + { + "epoch": 2.72, + "learning_rate": 6.547482660536313e-06, + "loss": 1.491, + "step": 34528 + }, + { + "epoch": 2.72, + "learning_rate": 6.543871350492758e-06, + "loss": 1.4542, + "step": 34529 + }, + { + "epoch": 2.72, + "learning_rate": 6.540261014437176e-06, + "loss": 1.4234, + "step": 34530 + }, + { + "epoch": 2.72, + "learning_rate": 6.536651652394065e-06, + "loss": 1.4619, + "step": 34531 + }, + { + "epoch": 2.72, + "learning_rate": 6.533043264387888e-06, + "loss": 1.448, + "step": 34532 + }, + { + "epoch": 2.72, + "learning_rate": 6.529435850443193e-06, + "loss": 1.4035, + "step": 34533 + }, + { + "epoch": 2.72, + "learning_rate": 6.52582941058446e-06, + "loss": 1.4432, + "step": 34534 + }, + { + "epoch": 2.72, + "learning_rate": 6.522223944836152e-06, + "loss": 1.4531, + "step": 34535 + }, + { + "epoch": 2.72, + "learning_rate": 6.518619453222751e-06, + "loss": 1.423, + "step": 34536 + }, + { + "epoch": 2.72, + "learning_rate": 6.515015935768769e-06, + "loss": 1.4347, + "step": 34537 + }, + { + "epoch": 2.72, + "learning_rate": 6.5114133924986546e-06, + "loss": 1.4056, + "step": 34538 + }, + { + "epoch": 2.72, + "learning_rate": 6.507811823436854e-06, + "loss": 1.4293, + "step": 34539 + }, + { + "epoch": 2.72, + "learning_rate": 6.504211228607814e-06, + "loss": 1.439, + "step": 34540 + }, + { + "epoch": 2.72, + "learning_rate": 6.5006116080359996e-06, + "loss": 1.4474, + "step": 34541 + }, + { + "epoch": 2.72, + "learning_rate": 6.497012961745856e-06, + "loss": 1.4485, + "step": 34542 + }, + { + "epoch": 2.72, + "learning_rate": 6.493415289761783e-06, + "loss": 1.3797, + "step": 34543 + }, + { + "epoch": 2.72, + "learning_rate": 6.489818592108242e-06, + "loss": 1.4351, + "step": 34544 + }, + { + "epoch": 2.72, + "learning_rate": 6.4862228688096316e-06, + "loss": 1.4193, + "step": 34545 + }, + { + "epoch": 2.72, + "learning_rate": 6.482628119890348e-06, + "loss": 1.4613, + "step": 34546 + }, + { + "epoch": 2.72, + "learning_rate": 6.479034345374856e-06, + "loss": 1.4267, + "step": 34547 + }, + { + "epoch": 2.72, + "learning_rate": 6.475441545287502e-06, + "loss": 1.4954, + "step": 34548 + }, + { + "epoch": 2.72, + "learning_rate": 6.4718497196527e-06, + "loss": 1.4752, + "step": 34549 + }, + { + "epoch": 2.72, + "learning_rate": 6.46825886849483e-06, + "loss": 1.4502, + "step": 34550 + }, + { + "epoch": 2.72, + "learning_rate": 6.46466899183829e-06, + "loss": 1.4597, + "step": 34551 + }, + { + "epoch": 2.72, + "learning_rate": 6.46108008970741e-06, + "loss": 1.4514, + "step": 34552 + }, + { + "epoch": 2.72, + "learning_rate": 6.457492162126587e-06, + "loss": 1.4957, + "step": 34553 + }, + { + "epoch": 2.72, + "learning_rate": 6.453905209120186e-06, + "loss": 1.4369, + "step": 34554 + }, + { + "epoch": 2.72, + "learning_rate": 6.450319230712569e-06, + "loss": 1.3752, + "step": 34555 + }, + { + "epoch": 2.72, + "learning_rate": 6.446734226928052e-06, + "loss": 1.4057, + "step": 34556 + }, + { + "epoch": 2.72, + "learning_rate": 6.4431501977909975e-06, + "loss": 1.376, + "step": 34557 + }, + { + "epoch": 2.72, + "learning_rate": 6.439567143325736e-06, + "loss": 1.4295, + "step": 34558 + }, + { + "epoch": 2.72, + "learning_rate": 6.435985063556598e-06, + "loss": 1.4269, + "step": 34559 + }, + { + "epoch": 2.72, + "learning_rate": 6.432403958507865e-06, + "loss": 1.4214, + "step": 34560 + }, + { + "epoch": 2.72, + "learning_rate": 6.428823828203899e-06, + "loss": 1.4885, + "step": 34561 + }, + { + "epoch": 2.72, + "learning_rate": 6.4252446726689995e-06, + "loss": 1.4656, + "step": 34562 + }, + { + "epoch": 2.72, + "learning_rate": 6.421666491927446e-06, + "loss": 1.4528, + "step": 34563 + }, + { + "epoch": 2.72, + "learning_rate": 6.418089286003552e-06, + "loss": 1.4326, + "step": 34564 + }, + { + "epoch": 2.72, + "learning_rate": 6.414513054921583e-06, + "loss": 1.4636, + "step": 34565 + }, + { + "epoch": 2.72, + "learning_rate": 6.410937798705834e-06, + "loss": 1.4155, + "step": 34566 + }, + { + "epoch": 2.72, + "learning_rate": 6.407363517380587e-06, + "loss": 1.4366, + "step": 34567 + }, + { + "epoch": 2.72, + "learning_rate": 6.403790210970089e-06, + "loss": 1.4454, + "step": 34568 + }, + { + "epoch": 2.72, + "learning_rate": 6.400217879498637e-06, + "loss": 1.4951, + "step": 34569 + }, + { + "epoch": 2.72, + "learning_rate": 6.396646522990429e-06, + "loss": 1.448, + "step": 34570 + }, + { + "epoch": 2.72, + "learning_rate": 6.393076141469778e-06, + "loss": 1.4209, + "step": 34571 + }, + { + "epoch": 2.72, + "learning_rate": 6.389506734960881e-06, + "loss": 1.4974, + "step": 34572 + }, + { + "epoch": 2.72, + "learning_rate": 6.385938303487953e-06, + "loss": 1.5042, + "step": 34573 + }, + { + "epoch": 2.72, + "learning_rate": 6.382370847075291e-06, + "loss": 1.427, + "step": 34574 + }, + { + "epoch": 2.72, + "learning_rate": 6.378804365747059e-06, + "loss": 1.4467, + "step": 34575 + }, + { + "epoch": 2.72, + "learning_rate": 6.375238859527504e-06, + "loss": 1.3962, + "step": 34576 + }, + { + "epoch": 2.72, + "learning_rate": 6.37167432844079e-06, + "loss": 1.4995, + "step": 34577 + }, + { + "epoch": 2.72, + "learning_rate": 6.368110772511165e-06, + "loss": 1.4292, + "step": 34578 + }, + { + "epoch": 2.72, + "learning_rate": 6.364548191762808e-06, + "loss": 1.4152, + "step": 34579 + }, + { + "epoch": 2.72, + "learning_rate": 6.360986586219885e-06, + "loss": 1.4164, + "step": 34580 + }, + { + "epoch": 2.72, + "learning_rate": 6.357425955906609e-06, + "loss": 1.4374, + "step": 34581 + }, + { + "epoch": 2.72, + "learning_rate": 6.3538663008471435e-06, + "loss": 1.3796, + "step": 34582 + }, + { + "epoch": 2.72, + "learning_rate": 6.350307621065653e-06, + "loss": 1.4724, + "step": 34583 + }, + { + "epoch": 2.72, + "learning_rate": 6.346749916586286e-06, + "loss": 1.4946, + "step": 34584 + }, + { + "epoch": 2.72, + "learning_rate": 6.3431931874332375e-06, + "loss": 1.4671, + "step": 34585 + }, + { + "epoch": 2.72, + "learning_rate": 6.339637433630624e-06, + "loss": 1.4402, + "step": 34586 + }, + { + "epoch": 2.72, + "learning_rate": 6.3360826552025735e-06, + "loss": 1.4166, + "step": 34587 + }, + { + "epoch": 2.72, + "learning_rate": 6.332528852173269e-06, + "loss": 1.4206, + "step": 34588 + }, + { + "epoch": 2.72, + "learning_rate": 6.328976024566807e-06, + "loss": 1.5192, + "step": 34589 + }, + { + "epoch": 2.72, + "learning_rate": 6.3254241724073005e-06, + "loss": 1.4109, + "step": 34590 + }, + { + "epoch": 2.72, + "learning_rate": 6.321873295718899e-06, + "loss": 1.4015, + "step": 34591 + }, + { + "epoch": 2.72, + "learning_rate": 6.3183233945256814e-06, + "loss": 1.465, + "step": 34592 + }, + { + "epoch": 2.72, + "learning_rate": 6.314774468851763e-06, + "loss": 1.4949, + "step": 34593 + }, + { + "epoch": 2.72, + "learning_rate": 6.3112265187212076e-06, + "loss": 1.3748, + "step": 34594 + }, + { + "epoch": 2.72, + "learning_rate": 6.307679544158145e-06, + "loss": 1.4338, + "step": 34595 + }, + { + "epoch": 2.72, + "learning_rate": 6.304133545186657e-06, + "loss": 1.4453, + "step": 34596 + }, + { + "epoch": 2.72, + "learning_rate": 6.300588521830774e-06, + "loss": 1.4318, + "step": 34597 + }, + { + "epoch": 2.72, + "learning_rate": 6.297044474114627e-06, + "loss": 1.4123, + "step": 34598 + }, + { + "epoch": 2.72, + "learning_rate": 6.293501402062212e-06, + "loss": 1.4461, + "step": 34599 + }, + { + "epoch": 2.72, + "learning_rate": 6.289959305697645e-06, + "loss": 1.4518, + "step": 34600 + }, + { + "epoch": 2.72, + "learning_rate": 6.286418185044922e-06, + "loss": 1.4492, + "step": 34601 + }, + { + "epoch": 2.72, + "learning_rate": 6.282878040128142e-06, + "loss": 1.4231, + "step": 34602 + }, + { + "epoch": 2.72, + "learning_rate": 6.279338870971301e-06, + "loss": 1.4173, + "step": 34603 + }, + { + "epoch": 2.72, + "learning_rate": 6.27580067759843e-06, + "loss": 1.4719, + "step": 34604 + }, + { + "epoch": 2.72, + "learning_rate": 6.272263460033577e-06, + "loss": 1.4081, + "step": 34605 + }, + { + "epoch": 2.72, + "learning_rate": 6.268727218300723e-06, + "loss": 1.4715, + "step": 34606 + }, + { + "epoch": 2.72, + "learning_rate": 6.265191952423898e-06, + "loss": 1.4307, + "step": 34607 + }, + { + "epoch": 2.72, + "learning_rate": 6.2616576624271e-06, + "loss": 1.376, + "step": 34608 + }, + { + "epoch": 2.72, + "learning_rate": 6.258124348334326e-06, + "loss": 1.5085, + "step": 34609 + }, + { + "epoch": 2.72, + "learning_rate": 6.254592010169557e-06, + "loss": 1.4376, + "step": 34610 + }, + { + "epoch": 2.72, + "learning_rate": 6.251060647956807e-06, + "loss": 1.448, + "step": 34611 + }, + { + "epoch": 2.72, + "learning_rate": 6.247530261720007e-06, + "loss": 1.4033, + "step": 34612 + }, + { + "epoch": 2.72, + "learning_rate": 6.244000851483155e-06, + "loss": 1.4589, + "step": 34613 + }, + { + "epoch": 2.72, + "learning_rate": 6.2404724172701984e-06, + "loss": 1.4309, + "step": 34614 + }, + { + "epoch": 2.72, + "learning_rate": 6.236944959105083e-06, + "loss": 1.4618, + "step": 34615 + }, + { + "epoch": 2.72, + "learning_rate": 6.233418477011809e-06, + "loss": 1.4296, + "step": 34616 + }, + { + "epoch": 2.72, + "learning_rate": 6.229892971014289e-06, + "loss": 1.4429, + "step": 34617 + }, + { + "epoch": 2.72, + "learning_rate": 6.22636844113642e-06, + "loss": 1.404, + "step": 34618 + }, + { + "epoch": 2.72, + "learning_rate": 6.222844887402201e-06, + "loss": 1.413, + "step": 34619 + }, + { + "epoch": 2.72, + "learning_rate": 6.219322309835528e-06, + "loss": 1.3976, + "step": 34620 + }, + { + "epoch": 2.72, + "learning_rate": 6.215800708460283e-06, + "loss": 1.3982, + "step": 34621 + }, + { + "epoch": 2.72, + "learning_rate": 6.21228008330043e-06, + "loss": 1.4972, + "step": 34622 + }, + { + "epoch": 2.72, + "learning_rate": 6.208760434379833e-06, + "loss": 1.4363, + "step": 34623 + }, + { + "epoch": 2.72, + "learning_rate": 6.20524176172239e-06, + "loss": 1.4251, + "step": 34624 + }, + { + "epoch": 2.72, + "learning_rate": 6.201724065352032e-06, + "loss": 1.4581, + "step": 34625 + }, + { + "epoch": 2.72, + "learning_rate": 6.198207345292605e-06, + "loss": 1.5041, + "step": 34626 + }, + { + "epoch": 2.72, + "learning_rate": 6.194691601567975e-06, + "loss": 1.4212, + "step": 34627 + }, + { + "epoch": 2.72, + "learning_rate": 6.191176834202038e-06, + "loss": 1.5071, + "step": 34628 + }, + { + "epoch": 2.72, + "learning_rate": 6.187663043218677e-06, + "loss": 1.3721, + "step": 34629 + }, + { + "epoch": 2.72, + "learning_rate": 6.184150228641704e-06, + "loss": 1.4427, + "step": 34630 + }, + { + "epoch": 2.72, + "learning_rate": 6.180638390494952e-06, + "loss": 1.4722, + "step": 34631 + }, + { + "epoch": 2.72, + "learning_rate": 6.177127528802334e-06, + "loss": 1.4459, + "step": 34632 + }, + { + "epoch": 2.72, + "learning_rate": 6.173617643587647e-06, + "loss": 1.4705, + "step": 34633 + }, + { + "epoch": 2.73, + "learning_rate": 6.17010873487474e-06, + "loss": 1.4464, + "step": 34634 + }, + { + "epoch": 2.73, + "learning_rate": 6.166600802687394e-06, + "loss": 1.4347, + "step": 34635 + }, + { + "epoch": 2.73, + "learning_rate": 6.1630938470494715e-06, + "loss": 1.4261, + "step": 34636 + }, + { + "epoch": 2.73, + "learning_rate": 6.159587867984772e-06, + "loss": 1.4194, + "step": 34637 + }, + { + "epoch": 2.73, + "learning_rate": 6.156082865517076e-06, + "loss": 1.417, + "step": 34638 + }, + { + "epoch": 2.73, + "learning_rate": 6.152578839670213e-06, + "loss": 1.3872, + "step": 34639 + }, + { + "epoch": 2.73, + "learning_rate": 6.149075790467967e-06, + "loss": 1.4896, + "step": 34640 + }, + { + "epoch": 2.73, + "learning_rate": 6.145573717934083e-06, + "loss": 1.4487, + "step": 34641 + }, + { + "epoch": 2.73, + "learning_rate": 6.142072622092392e-06, + "loss": 1.4166, + "step": 34642 + }, + { + "epoch": 2.73, + "learning_rate": 6.138572502966643e-06, + "loss": 1.4973, + "step": 34643 + }, + { + "epoch": 2.73, + "learning_rate": 6.135073360580567e-06, + "loss": 1.4507, + "step": 34644 + }, + { + "epoch": 2.73, + "learning_rate": 6.131575194957978e-06, + "loss": 1.4464, + "step": 34645 + }, + { + "epoch": 2.73, + "learning_rate": 6.128078006122588e-06, + "loss": 1.4802, + "step": 34646 + }, + { + "epoch": 2.73, + "learning_rate": 6.124581794098166e-06, + "loss": 1.4351, + "step": 34647 + }, + { + "epoch": 2.73, + "learning_rate": 6.121086558908406e-06, + "loss": 1.4304, + "step": 34648 + }, + { + "epoch": 2.73, + "learning_rate": 6.1175923005771065e-06, + "loss": 1.4809, + "step": 34649 + }, + { + "epoch": 2.73, + "learning_rate": 6.114099019127949e-06, + "loss": 1.4723, + "step": 34650 + }, + { + "epoch": 2.73, + "learning_rate": 6.110606714584648e-06, + "loss": 1.4188, + "step": 34651 + }, + { + "epoch": 2.73, + "learning_rate": 6.1071153869709175e-06, + "loss": 1.428, + "step": 34652 + }, + { + "epoch": 2.73, + "learning_rate": 6.103625036310472e-06, + "loss": 1.4695, + "step": 34653 + }, + { + "epoch": 2.73, + "learning_rate": 6.10013566262701e-06, + "loss": 1.5068, + "step": 34654 + }, + { + "epoch": 2.73, + "learning_rate": 6.09664726594421e-06, + "loss": 1.4356, + "step": 34655 + }, + { + "epoch": 2.73, + "learning_rate": 6.093159846285756e-06, + "loss": 1.4831, + "step": 34656 + }, + { + "epoch": 2.73, + "learning_rate": 6.08967340367536e-06, + "loss": 1.413, + "step": 34657 + }, + { + "epoch": 2.73, + "learning_rate": 6.086187938136622e-06, + "loss": 1.4548, + "step": 34658 + }, + { + "epoch": 2.73, + "learning_rate": 6.082703449693288e-06, + "loss": 1.4662, + "step": 34659 + }, + { + "epoch": 2.73, + "learning_rate": 6.079219938368957e-06, + "loss": 1.4181, + "step": 34660 + }, + { + "epoch": 2.73, + "learning_rate": 6.0757374041872915e-06, + "loss": 1.4275, + "step": 34661 + }, + { + "epoch": 2.73, + "learning_rate": 6.072255847171959e-06, + "loss": 1.4123, + "step": 34662 + }, + { + "epoch": 2.73, + "learning_rate": 6.068775267346588e-06, + "loss": 1.4265, + "step": 34663 + }, + { + "epoch": 2.73, + "learning_rate": 6.065295664734809e-06, + "loss": 1.4594, + "step": 34664 + }, + { + "epoch": 2.73, + "learning_rate": 6.061817039360223e-06, + "loss": 1.4461, + "step": 34665 + }, + { + "epoch": 2.73, + "learning_rate": 6.058339391246475e-06, + "loss": 1.4537, + "step": 34666 + }, + { + "epoch": 2.73, + "learning_rate": 6.05486272041718e-06, + "loss": 1.4141, + "step": 34667 + }, + { + "epoch": 2.73, + "learning_rate": 6.051387026895921e-06, + "loss": 1.4584, + "step": 34668 + }, + { + "epoch": 2.73, + "learning_rate": 6.0479123107063096e-06, + "loss": 1.4529, + "step": 34669 + }, + { + "epoch": 2.73, + "learning_rate": 6.044438571871945e-06, + "loss": 1.5105, + "step": 34670 + }, + { + "epoch": 2.73, + "learning_rate": 6.040965810416393e-06, + "loss": 1.4357, + "step": 34671 + }, + { + "epoch": 2.73, + "learning_rate": 6.037494026363232e-06, + "loss": 1.409, + "step": 34672 + }, + { + "epoch": 2.73, + "learning_rate": 6.034023219736045e-06, + "loss": 1.4056, + "step": 34673 + }, + { + "epoch": 2.73, + "learning_rate": 6.0305533905584124e-06, + "loss": 1.4688, + "step": 34674 + }, + { + "epoch": 2.73, + "learning_rate": 6.027084538853833e-06, + "loss": 1.4914, + "step": 34675 + }, + { + "epoch": 2.73, + "learning_rate": 6.023616664645936e-06, + "loss": 1.4147, + "step": 34676 + }, + { + "epoch": 2.73, + "learning_rate": 6.020149767958221e-06, + "loss": 1.4615, + "step": 34677 + }, + { + "epoch": 2.73, + "learning_rate": 6.016683848814219e-06, + "loss": 1.4636, + "step": 34678 + }, + { + "epoch": 2.73, + "learning_rate": 6.013218907237477e-06, + "loss": 1.4264, + "step": 34679 + }, + { + "epoch": 2.73, + "learning_rate": 6.009754943251527e-06, + "loss": 1.524, + "step": 34680 + }, + { + "epoch": 2.73, + "learning_rate": 6.006291956879899e-06, + "loss": 1.413, + "step": 34681 + }, + { + "epoch": 2.73, + "learning_rate": 6.00282994814606e-06, + "loss": 1.4792, + "step": 34682 + }, + { + "epoch": 2.73, + "learning_rate": 5.999368917073555e-06, + "loss": 1.4809, + "step": 34683 + }, + { + "epoch": 2.73, + "learning_rate": 5.995908863685866e-06, + "loss": 1.4773, + "step": 34684 + }, + { + "epoch": 2.73, + "learning_rate": 5.992449788006476e-06, + "loss": 1.4357, + "step": 34685 + }, + { + "epoch": 2.73, + "learning_rate": 5.988991690058914e-06, + "loss": 1.491, + "step": 34686 + }, + { + "epoch": 2.73, + "learning_rate": 5.985534569866612e-06, + "loss": 1.4455, + "step": 34687 + }, + { + "epoch": 2.73, + "learning_rate": 5.982078427453052e-06, + "loss": 1.3941, + "step": 34688 + }, + { + "epoch": 2.73, + "learning_rate": 5.978623262841697e-06, + "loss": 1.4772, + "step": 34689 + }, + { + "epoch": 2.73, + "learning_rate": 5.9751690760560135e-06, + "loss": 1.4068, + "step": 34690 + }, + { + "epoch": 2.73, + "learning_rate": 5.971715867119465e-06, + "loss": 1.4668, + "step": 34691 + }, + { + "epoch": 2.73, + "learning_rate": 5.9682636360554645e-06, + "loss": 1.4342, + "step": 34692 + }, + { + "epoch": 2.73, + "learning_rate": 5.964812382887496e-06, + "loss": 1.4365, + "step": 34693 + }, + { + "epoch": 2.73, + "learning_rate": 5.96136210763894e-06, + "loss": 1.4237, + "step": 34694 + }, + { + "epoch": 2.73, + "learning_rate": 5.957912810333276e-06, + "loss": 1.4434, + "step": 34695 + }, + { + "epoch": 2.73, + "learning_rate": 5.954464490993871e-06, + "loss": 1.4444, + "step": 34696 + }, + { + "epoch": 2.73, + "learning_rate": 5.951017149644172e-06, + "loss": 1.4151, + "step": 34697 + }, + { + "epoch": 2.73, + "learning_rate": 5.9475707863075764e-06, + "loss": 1.4465, + "step": 34698 + }, + { + "epoch": 2.73, + "learning_rate": 5.9441254010074654e-06, + "loss": 1.4463, + "step": 34699 + }, + { + "epoch": 2.73, + "learning_rate": 5.940680993767272e-06, + "loss": 1.4541, + "step": 34700 + }, + { + "epoch": 2.73, + "learning_rate": 5.937237564610342e-06, + "loss": 1.4691, + "step": 34701 + }, + { + "epoch": 2.73, + "learning_rate": 5.933795113560058e-06, + "loss": 1.4606, + "step": 34702 + }, + { + "epoch": 2.73, + "learning_rate": 5.930353640639818e-06, + "loss": 1.4659, + "step": 34703 + }, + { + "epoch": 2.73, + "learning_rate": 5.926913145872969e-06, + "loss": 1.4433, + "step": 34704 + }, + { + "epoch": 2.73, + "learning_rate": 5.923473629282877e-06, + "loss": 1.4543, + "step": 34705 + }, + { + "epoch": 2.73, + "learning_rate": 5.920035090892872e-06, + "loss": 1.4313, + "step": 34706 + }, + { + "epoch": 2.73, + "learning_rate": 5.916597530726352e-06, + "loss": 1.4593, + "step": 34707 + }, + { + "epoch": 2.73, + "learning_rate": 5.9131609488066005e-06, + "loss": 1.4669, + "step": 34708 + }, + { + "epoch": 2.73, + "learning_rate": 5.909725345156946e-06, + "loss": 1.3997, + "step": 34709 + }, + { + "epoch": 2.73, + "learning_rate": 5.906290719800788e-06, + "loss": 1.4443, + "step": 34710 + }, + { + "epoch": 2.73, + "learning_rate": 5.902857072761374e-06, + "loss": 1.4755, + "step": 34711 + }, + { + "epoch": 2.73, + "learning_rate": 5.8994244040620695e-06, + "loss": 1.429, + "step": 34712 + }, + { + "epoch": 2.73, + "learning_rate": 5.8959927137261055e-06, + "loss": 1.4384, + "step": 34713 + }, + { + "epoch": 2.73, + "learning_rate": 5.892562001776863e-06, + "loss": 1.4157, + "step": 34714 + }, + { + "epoch": 2.73, + "learning_rate": 5.889132268237606e-06, + "loss": 1.4963, + "step": 34715 + }, + { + "epoch": 2.73, + "learning_rate": 5.885703513131585e-06, + "loss": 1.457, + "step": 34716 + }, + { + "epoch": 2.73, + "learning_rate": 5.882275736482128e-06, + "loss": 1.432, + "step": 34717 + }, + { + "epoch": 2.73, + "learning_rate": 5.878848938312486e-06, + "loss": 1.4148, + "step": 34718 + }, + { + "epoch": 2.73, + "learning_rate": 5.875423118645906e-06, + "loss": 1.4379, + "step": 34719 + }, + { + "epoch": 2.73, + "learning_rate": 5.871998277505685e-06, + "loss": 1.4991, + "step": 34720 + }, + { + "epoch": 2.73, + "learning_rate": 5.868574414915072e-06, + "loss": 1.4457, + "step": 34721 + }, + { + "epoch": 2.73, + "learning_rate": 5.865151530897283e-06, + "loss": 1.4592, + "step": 34722 + }, + { + "epoch": 2.73, + "learning_rate": 5.8617296254755805e-06, + "loss": 1.4435, + "step": 34723 + }, + { + "epoch": 2.73, + "learning_rate": 5.8583086986731975e-06, + "loss": 1.4764, + "step": 34724 + }, + { + "epoch": 2.73, + "learning_rate": 5.854888750513331e-06, + "loss": 1.4419, + "step": 34725 + }, + { + "epoch": 2.73, + "learning_rate": 5.85146978101923e-06, + "loss": 1.4552, + "step": 34726 + }, + { + "epoch": 2.73, + "learning_rate": 5.8480517902141255e-06, + "loss": 1.5081, + "step": 34727 + }, + { + "epoch": 2.73, + "learning_rate": 5.844634778121182e-06, + "loss": 1.4227, + "step": 34728 + }, + { + "epoch": 2.73, + "learning_rate": 5.841218744763632e-06, + "loss": 1.4012, + "step": 34729 + }, + { + "epoch": 2.73, + "learning_rate": 5.8378036901646385e-06, + "loss": 1.4672, + "step": 34730 + }, + { + "epoch": 2.73, + "learning_rate": 5.8343896143474015e-06, + "loss": 1.4308, + "step": 34731 + }, + { + "epoch": 2.73, + "learning_rate": 5.8309765173351176e-06, + "loss": 1.4567, + "step": 34732 + }, + { + "epoch": 2.73, + "learning_rate": 5.827564399150919e-06, + "loss": 1.4159, + "step": 34733 + }, + { + "epoch": 2.73, + "learning_rate": 5.82415325981802e-06, + "loss": 1.4251, + "step": 34734 + }, + { + "epoch": 2.73, + "learning_rate": 5.820743099359554e-06, + "loss": 1.4696, + "step": 34735 + }, + { + "epoch": 2.73, + "learning_rate": 5.817333917798667e-06, + "loss": 1.4247, + "step": 34736 + }, + { + "epoch": 2.73, + "learning_rate": 5.813925715158524e-06, + "loss": 1.4106, + "step": 34737 + }, + { + "epoch": 2.73, + "learning_rate": 5.810518491462257e-06, + "loss": 1.4879, + "step": 34738 + }, + { + "epoch": 2.73, + "learning_rate": 5.807112246732998e-06, + "loss": 1.4542, + "step": 34739 + }, + { + "epoch": 2.73, + "learning_rate": 5.8037069809938775e-06, + "loss": 1.4501, + "step": 34740 + }, + { + "epoch": 2.73, + "learning_rate": 5.8003026942679945e-06, + "loss": 1.4346, + "step": 34741 + }, + { + "epoch": 2.73, + "learning_rate": 5.796899386578496e-06, + "loss": 1.4339, + "step": 34742 + }, + { + "epoch": 2.73, + "learning_rate": 5.7934970579484655e-06, + "loss": 1.4394, + "step": 34743 + }, + { + "epoch": 2.73, + "learning_rate": 5.790095708401016e-06, + "loss": 1.4495, + "step": 34744 + }, + { + "epoch": 2.73, + "learning_rate": 5.7866953379592465e-06, + "loss": 1.421, + "step": 34745 + }, + { + "epoch": 2.73, + "learning_rate": 5.783295946646221e-06, + "loss": 1.4389, + "step": 34746 + }, + { + "epoch": 2.73, + "learning_rate": 5.779897534485023e-06, + "loss": 1.4304, + "step": 34747 + }, + { + "epoch": 2.73, + "learning_rate": 5.776500101498749e-06, + "loss": 1.4462, + "step": 34748 + }, + { + "epoch": 2.73, + "learning_rate": 5.773103647710447e-06, + "loss": 1.3992, + "step": 34749 + }, + { + "epoch": 2.73, + "learning_rate": 5.769708173143167e-06, + "loss": 1.402, + "step": 34750 + }, + { + "epoch": 2.73, + "learning_rate": 5.7663136778199894e-06, + "loss": 1.4633, + "step": 34751 + }, + { + "epoch": 2.73, + "learning_rate": 5.762920161763945e-06, + "loss": 1.4519, + "step": 34752 + }, + { + "epoch": 2.73, + "learning_rate": 5.759527624998067e-06, + "loss": 1.5026, + "step": 34753 + }, + { + "epoch": 2.73, + "learning_rate": 5.756136067545402e-06, + "loss": 1.4644, + "step": 34754 + }, + { + "epoch": 2.73, + "learning_rate": 5.752745489428983e-06, + "loss": 1.4358, + "step": 34755 + }, + { + "epoch": 2.73, + "learning_rate": 5.749355890671791e-06, + "loss": 1.4519, + "step": 34756 + }, + { + "epoch": 2.73, + "learning_rate": 5.745967271296892e-06, + "loss": 1.4347, + "step": 34757 + }, + { + "epoch": 2.73, + "learning_rate": 5.742579631327266e-06, + "loss": 1.4307, + "step": 34758 + }, + { + "epoch": 2.73, + "learning_rate": 5.739192970785928e-06, + "loss": 1.4571, + "step": 34759 + }, + { + "epoch": 2.73, + "learning_rate": 5.735807289695826e-06, + "loss": 1.4613, + "step": 34760 + }, + { + "epoch": 2.74, + "learning_rate": 5.7324225880800105e-06, + "loss": 1.3896, + "step": 34761 + }, + { + "epoch": 2.74, + "learning_rate": 5.729038865961444e-06, + "loss": 1.4813, + "step": 34762 + }, + { + "epoch": 2.74, + "learning_rate": 5.725656123363043e-06, + "loss": 1.4754, + "step": 34763 + }, + { + "epoch": 2.74, + "learning_rate": 5.7222743603078545e-06, + "loss": 1.4646, + "step": 34764 + }, + { + "epoch": 2.74, + "learning_rate": 5.7188935768188115e-06, + "loss": 1.4941, + "step": 34765 + }, + { + "epoch": 2.74, + "learning_rate": 5.7155137729188445e-06, + "loss": 1.4469, + "step": 34766 + }, + { + "epoch": 2.74, + "learning_rate": 5.712134948630903e-06, + "loss": 1.4651, + "step": 34767 + }, + { + "epoch": 2.74, + "learning_rate": 5.7087571039779675e-06, + "loss": 1.4727, + "step": 34768 + }, + { + "epoch": 2.74, + "learning_rate": 5.705380238982937e-06, + "loss": 1.4164, + "step": 34769 + }, + { + "epoch": 2.74, + "learning_rate": 5.702004353668726e-06, + "loss": 1.448, + "step": 34770 + }, + { + "epoch": 2.74, + "learning_rate": 5.6986294480583005e-06, + "loss": 1.4283, + "step": 34771 + }, + { + "epoch": 2.74, + "learning_rate": 5.695255522174524e-06, + "loss": 1.4493, + "step": 34772 + }, + { + "epoch": 2.74, + "learning_rate": 5.691882576040347e-06, + "loss": 1.4129, + "step": 34773 + }, + { + "epoch": 2.74, + "learning_rate": 5.6885106096786315e-06, + "loss": 1.4091, + "step": 34774 + }, + { + "epoch": 2.74, + "learning_rate": 5.685139623112312e-06, + "loss": 1.4519, + "step": 34775 + }, + { + "epoch": 2.74, + "learning_rate": 5.681769616364268e-06, + "loss": 1.4464, + "step": 34776 + }, + { + "epoch": 2.74, + "learning_rate": 5.678400589457333e-06, + "loss": 1.4532, + "step": 34777 + }, + { + "epoch": 2.74, + "learning_rate": 5.6750325424144375e-06, + "loss": 1.4354, + "step": 34778 + }, + { + "epoch": 2.74, + "learning_rate": 5.67166547525843e-06, + "loss": 1.4808, + "step": 34779 + }, + { + "epoch": 2.74, + "learning_rate": 5.668299388012143e-06, + "loss": 1.4958, + "step": 34780 + }, + { + "epoch": 2.74, + "learning_rate": 5.664934280698474e-06, + "loss": 1.3468, + "step": 34781 + }, + { + "epoch": 2.74, + "learning_rate": 5.661570153340239e-06, + "loss": 1.5227, + "step": 34782 + }, + { + "epoch": 2.74, + "learning_rate": 5.658207005960303e-06, + "loss": 1.4577, + "step": 34783 + }, + { + "epoch": 2.74, + "learning_rate": 5.6548448385814795e-06, + "loss": 1.4201, + "step": 34784 + }, + { + "epoch": 2.74, + "learning_rate": 5.651483651226602e-06, + "loss": 1.4441, + "step": 34785 + }, + { + "epoch": 2.74, + "learning_rate": 5.648123443918501e-06, + "loss": 1.4428, + "step": 34786 + }, + { + "epoch": 2.74, + "learning_rate": 5.644764216679959e-06, + "loss": 1.4092, + "step": 34787 + }, + { + "epoch": 2.74, + "learning_rate": 5.641405969533808e-06, + "loss": 1.3982, + "step": 34788 + }, + { + "epoch": 2.74, + "learning_rate": 5.638048702502878e-06, + "loss": 1.4666, + "step": 34789 + }, + { + "epoch": 2.74, + "learning_rate": 5.63469241560992e-06, + "loss": 1.4631, + "step": 34790 + }, + { + "epoch": 2.74, + "learning_rate": 5.631337108877715e-06, + "loss": 1.4875, + "step": 34791 + }, + { + "epoch": 2.74, + "learning_rate": 5.627982782329077e-06, + "loss": 1.4776, + "step": 34792 + }, + { + "epoch": 2.74, + "learning_rate": 5.624629435986772e-06, + "loss": 1.3966, + "step": 34793 + }, + { + "epoch": 2.74, + "learning_rate": 5.621277069873531e-06, + "loss": 1.4083, + "step": 34794 + }, + { + "epoch": 2.74, + "learning_rate": 5.61792568401217e-06, + "loss": 1.4382, + "step": 34795 + }, + { + "epoch": 2.74, + "learning_rate": 5.6145752784254205e-06, + "loss": 1.4499, + "step": 34796 + }, + { + "epoch": 2.74, + "learning_rate": 5.611225853135997e-06, + "loss": 1.4093, + "step": 34797 + }, + { + "epoch": 2.74, + "learning_rate": 5.6078774081667e-06, + "loss": 1.5057, + "step": 34798 + }, + { + "epoch": 2.74, + "learning_rate": 5.604529943540226e-06, + "loss": 1.4566, + "step": 34799 + }, + { + "epoch": 2.74, + "learning_rate": 5.601183459279307e-06, + "loss": 1.4316, + "step": 34800 + }, + { + "epoch": 2.74, + "learning_rate": 5.5978379554066585e-06, + "loss": 1.4668, + "step": 34801 + }, + { + "epoch": 2.74, + "learning_rate": 5.594493431945013e-06, + "loss": 1.4145, + "step": 34802 + }, + { + "epoch": 2.74, + "learning_rate": 5.5911498889170684e-06, + "loss": 1.4624, + "step": 34803 + }, + { + "epoch": 2.74, + "learning_rate": 5.587807326345506e-06, + "loss": 1.4611, + "step": 34804 + }, + { + "epoch": 2.74, + "learning_rate": 5.584465744253042e-06, + "loss": 1.4106, + "step": 34805 + }, + { + "epoch": 2.74, + "learning_rate": 5.581125142662374e-06, + "loss": 1.4765, + "step": 34806 + }, + { + "epoch": 2.74, + "learning_rate": 5.577785521596184e-06, + "loss": 1.4254, + "step": 34807 + }, + { + "epoch": 2.74, + "learning_rate": 5.574446881077105e-06, + "loss": 1.4649, + "step": 34808 + }, + { + "epoch": 2.74, + "learning_rate": 5.5711092211278344e-06, + "loss": 1.4482, + "step": 34809 + }, + { + "epoch": 2.74, + "learning_rate": 5.567772541771038e-06, + "loss": 1.3694, + "step": 34810 + }, + { + "epoch": 2.74, + "learning_rate": 5.564436843029363e-06, + "loss": 1.4689, + "step": 34811 + }, + { + "epoch": 2.74, + "learning_rate": 5.5611021249254424e-06, + "loss": 1.5131, + "step": 34812 + }, + { + "epoch": 2.74, + "learning_rate": 5.557768387481959e-06, + "loss": 1.4212, + "step": 34813 + }, + { + "epoch": 2.74, + "learning_rate": 5.554435630721477e-06, + "loss": 1.4685, + "step": 34814 + }, + { + "epoch": 2.74, + "learning_rate": 5.5511038546666944e-06, + "loss": 1.4932, + "step": 34815 + }, + { + "epoch": 2.74, + "learning_rate": 5.54777305934021e-06, + "loss": 1.4464, + "step": 34816 + }, + { + "epoch": 2.74, + "learning_rate": 5.544443244764624e-06, + "loss": 1.4362, + "step": 34817 + }, + { + "epoch": 2.74, + "learning_rate": 5.541114410962532e-06, + "loss": 1.397, + "step": 34818 + }, + { + "epoch": 2.74, + "learning_rate": 5.537786557956553e-06, + "loss": 1.4679, + "step": 34819 + }, + { + "epoch": 2.74, + "learning_rate": 5.534459685769299e-06, + "loss": 1.4773, + "step": 34820 + }, + { + "epoch": 2.74, + "learning_rate": 5.531133794423337e-06, + "loss": 1.4196, + "step": 34821 + }, + { + "epoch": 2.74, + "learning_rate": 5.527808883941248e-06, + "loss": 1.4762, + "step": 34822 + }, + { + "epoch": 2.74, + "learning_rate": 5.5244849543456314e-06, + "loss": 1.4208, + "step": 34823 + }, + { + "epoch": 2.74, + "learning_rate": 5.521162005659019e-06, + "loss": 1.4657, + "step": 34824 + }, + { + "epoch": 2.74, + "learning_rate": 5.517840037903976e-06, + "loss": 1.4029, + "step": 34825 + }, + { + "epoch": 2.74, + "learning_rate": 5.514519051103083e-06, + "loss": 1.4072, + "step": 34826 + }, + { + "epoch": 2.74, + "learning_rate": 5.511199045278874e-06, + "loss": 1.4236, + "step": 34827 + }, + { + "epoch": 2.74, + "learning_rate": 5.507880020453864e-06, + "loss": 1.4357, + "step": 34828 + }, + { + "epoch": 2.74, + "learning_rate": 5.504561976650635e-06, + "loss": 1.4772, + "step": 34829 + }, + { + "epoch": 2.74, + "learning_rate": 5.501244913891684e-06, + "loss": 1.4668, + "step": 34830 + }, + { + "epoch": 2.74, + "learning_rate": 5.497928832199528e-06, + "loss": 1.4294, + "step": 34831 + }, + { + "epoch": 2.74, + "learning_rate": 5.494613731596714e-06, + "loss": 1.4217, + "step": 34832 + }, + { + "epoch": 2.74, + "learning_rate": 5.491299612105726e-06, + "loss": 1.499, + "step": 34833 + }, + { + "epoch": 2.74, + "learning_rate": 5.487986473749045e-06, + "loss": 1.4605, + "step": 34834 + }, + { + "epoch": 2.74, + "learning_rate": 5.484674316549187e-06, + "loss": 1.4791, + "step": 34835 + }, + { + "epoch": 2.74, + "learning_rate": 5.48136314052865e-06, + "loss": 1.4768, + "step": 34836 + }, + { + "epoch": 2.74, + "learning_rate": 5.478052945709915e-06, + "loss": 1.4306, + "step": 34837 + }, + { + "epoch": 2.74, + "learning_rate": 5.474743732115433e-06, + "loss": 1.4141, + "step": 34838 + }, + { + "epoch": 2.74, + "learning_rate": 5.4714354997677015e-06, + "loss": 1.4827, + "step": 34839 + }, + { + "epoch": 2.74, + "learning_rate": 5.468128248689169e-06, + "loss": 1.4549, + "step": 34840 + }, + { + "epoch": 2.74, + "learning_rate": 5.464821978902268e-06, + "loss": 1.53, + "step": 34841 + }, + { + "epoch": 2.74, + "learning_rate": 5.461516690429463e-06, + "loss": 1.4069, + "step": 34842 + }, + { + "epoch": 2.74, + "learning_rate": 5.45821238329322e-06, + "loss": 1.4868, + "step": 34843 + }, + { + "epoch": 2.74, + "learning_rate": 5.454909057515938e-06, + "loss": 1.4606, + "step": 34844 + }, + { + "epoch": 2.74, + "learning_rate": 5.451606713120033e-06, + "loss": 1.4468, + "step": 34845 + }, + { + "epoch": 2.74, + "learning_rate": 5.448305350127985e-06, + "loss": 1.4511, + "step": 34846 + }, + { + "epoch": 2.74, + "learning_rate": 5.445004968562161e-06, + "loss": 1.4547, + "step": 34847 + }, + { + "epoch": 2.74, + "learning_rate": 5.441705568444976e-06, + "loss": 1.4895, + "step": 34848 + }, + { + "epoch": 2.74, + "learning_rate": 5.438407149798846e-06, + "loss": 1.4391, + "step": 34849 + }, + { + "epoch": 2.74, + "learning_rate": 5.435109712646152e-06, + "loss": 1.4631, + "step": 34850 + }, + { + "epoch": 2.74, + "learning_rate": 5.431813257009276e-06, + "loss": 1.443, + "step": 34851 + }, + { + "epoch": 2.74, + "learning_rate": 5.428517782910602e-06, + "loss": 1.4593, + "step": 34852 + }, + { + "epoch": 2.74, + "learning_rate": 5.4252232903725265e-06, + "loss": 1.4219, + "step": 34853 + }, + { + "epoch": 2.74, + "learning_rate": 5.4219297794174e-06, + "loss": 1.4237, + "step": 34854 + }, + { + "epoch": 2.74, + "learning_rate": 5.418637250067587e-06, + "loss": 1.4354, + "step": 34855 + }, + { + "epoch": 2.74, + "learning_rate": 5.415345702345436e-06, + "loss": 1.4987, + "step": 34856 + }, + { + "epoch": 2.74, + "learning_rate": 5.412055136273313e-06, + "loss": 1.4171, + "step": 34857 + }, + { + "epoch": 2.74, + "learning_rate": 5.408765551873534e-06, + "loss": 1.4567, + "step": 34858 + }, + { + "epoch": 2.74, + "learning_rate": 5.405476949168447e-06, + "loss": 1.4582, + "step": 34859 + }, + { + "epoch": 2.74, + "learning_rate": 5.402189328180384e-06, + "loss": 1.4475, + "step": 34860 + }, + { + "epoch": 2.74, + "learning_rate": 5.3989026889316444e-06, + "loss": 1.4296, + "step": 34861 + }, + { + "epoch": 2.74, + "learning_rate": 5.39561703144456e-06, + "loss": 1.4946, + "step": 34862 + }, + { + "epoch": 2.74, + "learning_rate": 5.392332355741447e-06, + "loss": 1.4535, + "step": 34863 + }, + { + "epoch": 2.74, + "learning_rate": 5.389048661844603e-06, + "loss": 1.4576, + "step": 34864 + }, + { + "epoch": 2.74, + "learning_rate": 5.385765949776294e-06, + "loss": 1.4212, + "step": 34865 + }, + { + "epoch": 2.74, + "learning_rate": 5.382484219558819e-06, + "loss": 1.462, + "step": 34866 + }, + { + "epoch": 2.74, + "learning_rate": 5.379203471214511e-06, + "loss": 1.4893, + "step": 34867 + }, + { + "epoch": 2.74, + "learning_rate": 5.375923704765583e-06, + "loss": 1.4573, + "step": 34868 + }, + { + "epoch": 2.74, + "learning_rate": 5.372644920234303e-06, + "loss": 1.4168, + "step": 34869 + }, + { + "epoch": 2.74, + "learning_rate": 5.369367117642987e-06, + "loss": 1.4126, + "step": 34870 + }, + { + "epoch": 2.74, + "learning_rate": 5.366090297013847e-06, + "loss": 1.4308, + "step": 34871 + }, + { + "epoch": 2.74, + "learning_rate": 5.3628144583691194e-06, + "loss": 1.51, + "step": 34872 + }, + { + "epoch": 2.74, + "learning_rate": 5.3595396017310835e-06, + "loss": 1.4978, + "step": 34873 + }, + { + "epoch": 2.74, + "learning_rate": 5.356265727121939e-06, + "loss": 1.4141, + "step": 34874 + }, + { + "epoch": 2.74, + "learning_rate": 5.352992834563935e-06, + "loss": 1.4328, + "step": 34875 + }, + { + "epoch": 2.74, + "learning_rate": 5.349720924079287e-06, + "loss": 1.479, + "step": 34876 + }, + { + "epoch": 2.74, + "learning_rate": 5.346449995690227e-06, + "loss": 1.4441, + "step": 34877 + }, + { + "epoch": 2.74, + "learning_rate": 5.343180049418921e-06, + "loss": 1.428, + "step": 34878 + }, + { + "epoch": 2.74, + "learning_rate": 5.339911085287601e-06, + "loss": 1.4387, + "step": 34879 + }, + { + "epoch": 2.74, + "learning_rate": 5.33664310331845e-06, + "loss": 1.3907, + "step": 34880 + }, + { + "epoch": 2.74, + "learning_rate": 5.333376103533682e-06, + "loss": 1.5017, + "step": 34881 + }, + { + "epoch": 2.74, + "learning_rate": 5.33011008595543e-06, + "loss": 1.422, + "step": 34882 + }, + { + "epoch": 2.74, + "learning_rate": 5.326845050605894e-06, + "loss": 1.4208, + "step": 34883 + }, + { + "epoch": 2.74, + "learning_rate": 5.323580997507254e-06, + "loss": 1.4244, + "step": 34884 + }, + { + "epoch": 2.74, + "learning_rate": 5.3203179266816774e-06, + "loss": 1.426, + "step": 34885 + }, + { + "epoch": 2.74, + "learning_rate": 5.317055838151263e-06, + "loss": 1.4364, + "step": 34886 + }, + { + "epoch": 2.74, + "learning_rate": 5.313794731938226e-06, + "loss": 1.4413, + "step": 34887 + }, + { + "epoch": 2.75, + "learning_rate": 5.3105346080646815e-06, + "loss": 1.4424, + "step": 34888 + }, + { + "epoch": 2.75, + "learning_rate": 5.307275466552729e-06, + "loss": 1.3684, + "step": 34889 + }, + { + "epoch": 2.75, + "learning_rate": 5.304017307424552e-06, + "loss": 1.3863, + "step": 34890 + }, + { + "epoch": 2.75, + "learning_rate": 5.300760130702264e-06, + "loss": 1.4282, + "step": 34891 + }, + { + "epoch": 2.75, + "learning_rate": 5.297503936407932e-06, + "loss": 1.4289, + "step": 34892 + }, + { + "epoch": 2.75, + "learning_rate": 5.294248724563704e-06, + "loss": 1.4357, + "step": 34893 + }, + { + "epoch": 2.75, + "learning_rate": 5.290994495191681e-06, + "loss": 1.4456, + "step": 34894 + }, + { + "epoch": 2.75, + "learning_rate": 5.2877412483139425e-06, + "loss": 1.4801, + "step": 34895 + }, + { + "epoch": 2.75, + "learning_rate": 5.284488983952573e-06, + "loss": 1.4056, + "step": 34896 + }, + { + "epoch": 2.75, + "learning_rate": 5.281237702129687e-06, + "loss": 1.4391, + "step": 34897 + }, + { + "epoch": 2.75, + "learning_rate": 5.277987402867301e-06, + "loss": 1.4854, + "step": 34898 + }, + { + "epoch": 2.75, + "learning_rate": 5.274738086187547e-06, + "loss": 1.4115, + "step": 34899 + }, + { + "epoch": 2.75, + "learning_rate": 5.271489752112424e-06, + "loss": 1.4364, + "step": 34900 + }, + { + "epoch": 2.75, + "learning_rate": 5.268242400664047e-06, + "loss": 1.4662, + "step": 34901 + }, + { + "epoch": 2.75, + "learning_rate": 5.264996031864433e-06, + "loss": 1.3979, + "step": 34902 + }, + { + "epoch": 2.75, + "learning_rate": 5.261750645735596e-06, + "loss": 1.4424, + "step": 34903 + }, + { + "epoch": 2.75, + "learning_rate": 5.25850624229962e-06, + "loss": 1.4104, + "step": 34904 + }, + { + "epoch": 2.75, + "learning_rate": 5.255262821578521e-06, + "loss": 1.4358, + "step": 34905 + }, + { + "epoch": 2.75, + "learning_rate": 5.25202038359428e-06, + "loss": 1.4187, + "step": 34906 + }, + { + "epoch": 2.75, + "learning_rate": 5.24877892836898e-06, + "loss": 1.4196, + "step": 34907 + }, + { + "epoch": 2.75, + "learning_rate": 5.24553845592457e-06, + "loss": 1.3993, + "step": 34908 + }, + { + "epoch": 2.75, + "learning_rate": 5.242298966283065e-06, + "loss": 1.4153, + "step": 34909 + }, + { + "epoch": 2.75, + "learning_rate": 5.239060459466482e-06, + "loss": 1.4481, + "step": 34910 + }, + { + "epoch": 2.75, + "learning_rate": 5.235822935496786e-06, + "loss": 1.4117, + "step": 34911 + }, + { + "epoch": 2.75, + "learning_rate": 5.232586394395977e-06, + "loss": 1.463, + "step": 34912 + }, + { + "epoch": 2.75, + "learning_rate": 5.229350836185986e-06, + "loss": 1.4742, + "step": 34913 + }, + { + "epoch": 2.75, + "learning_rate": 5.22611626088883e-06, + "loss": 1.4211, + "step": 34914 + }, + { + "epoch": 2.75, + "learning_rate": 5.222882668526457e-06, + "loss": 1.431, + "step": 34915 + }, + { + "epoch": 2.75, + "learning_rate": 5.219650059120817e-06, + "loss": 1.4606, + "step": 34916 + }, + { + "epoch": 2.75, + "learning_rate": 5.216418432693842e-06, + "loss": 1.4266, + "step": 34917 + }, + { + "epoch": 2.75, + "learning_rate": 5.213187789267498e-06, + "loss": 1.4623, + "step": 34918 + }, + { + "epoch": 2.75, + "learning_rate": 5.209958128863717e-06, + "loss": 1.3893, + "step": 34919 + }, + { + "epoch": 2.75, + "learning_rate": 5.206729451504399e-06, + "loss": 1.4387, + "step": 34920 + }, + { + "epoch": 2.75, + "learning_rate": 5.203501757211492e-06, + "loss": 1.4419, + "step": 34921 + }, + { + "epoch": 2.75, + "learning_rate": 5.200275046006913e-06, + "loss": 1.4679, + "step": 34922 + }, + { + "epoch": 2.75, + "learning_rate": 5.197049317912544e-06, + "loss": 1.4526, + "step": 34923 + }, + { + "epoch": 2.75, + "learning_rate": 5.193824572950317e-06, + "loss": 1.4531, + "step": 34924 + }, + { + "epoch": 2.75, + "learning_rate": 5.190600811142099e-06, + "loss": 1.4287, + "step": 34925 + }, + { + "epoch": 2.75, + "learning_rate": 5.187378032509787e-06, + "loss": 1.4201, + "step": 34926 + }, + { + "epoch": 2.75, + "learning_rate": 5.1841562370752655e-06, + "loss": 1.4664, + "step": 34927 + }, + { + "epoch": 2.75, + "learning_rate": 5.1809354248604326e-06, + "loss": 1.4379, + "step": 34928 + }, + { + "epoch": 2.75, + "learning_rate": 5.177715595887089e-06, + "loss": 1.4655, + "step": 34929 + }, + { + "epoch": 2.75, + "learning_rate": 5.174496750177148e-06, + "loss": 1.4871, + "step": 34930 + }, + { + "epoch": 2.75, + "learning_rate": 5.171278887752461e-06, + "loss": 1.4357, + "step": 34931 + }, + { + "epoch": 2.75, + "learning_rate": 5.1680620086348766e-06, + "loss": 1.3697, + "step": 34932 + }, + { + "epoch": 2.75, + "learning_rate": 5.16484611284621e-06, + "loss": 1.493, + "step": 34933 + }, + { + "epoch": 2.75, + "learning_rate": 5.161631200408328e-06, + "loss": 1.4477, + "step": 34934 + }, + { + "epoch": 2.75, + "learning_rate": 5.15841727134303e-06, + "loss": 1.4422, + "step": 34935 + }, + { + "epoch": 2.75, + "learning_rate": 5.1552043256721635e-06, + "loss": 1.4278, + "step": 34936 + }, + { + "epoch": 2.75, + "learning_rate": 5.151992363417495e-06, + "loss": 1.517, + "step": 34937 + }, + { + "epoch": 2.75, + "learning_rate": 5.148781384600892e-06, + "loss": 1.4254, + "step": 34938 + }, + { + "epoch": 2.75, + "learning_rate": 5.145571389244135e-06, + "loss": 1.459, + "step": 34939 + }, + { + "epoch": 2.75, + "learning_rate": 5.142362377368992e-06, + "loss": 1.4698, + "step": 34940 + }, + { + "epoch": 2.75, + "learning_rate": 5.139154348997276e-06, + "loss": 1.4389, + "step": 34941 + }, + { + "epoch": 2.75, + "learning_rate": 5.135947304150756e-06, + "loss": 1.4791, + "step": 34942 + }, + { + "epoch": 2.75, + "learning_rate": 5.1327412428512125e-06, + "loss": 1.4416, + "step": 34943 + }, + { + "epoch": 2.75, + "learning_rate": 5.129536165120413e-06, + "loss": 1.4153, + "step": 34944 + }, + { + "epoch": 2.75, + "learning_rate": 5.126332070980104e-06, + "loss": 1.4871, + "step": 34945 + }, + { + "epoch": 2.75, + "learning_rate": 5.123128960452089e-06, + "loss": 1.4345, + "step": 34946 + }, + { + "epoch": 2.75, + "learning_rate": 5.1199268335580305e-06, + "loss": 1.4412, + "step": 34947 + }, + { + "epoch": 2.75, + "learning_rate": 5.116725690319762e-06, + "loss": 1.4751, + "step": 34948 + }, + { + "epoch": 2.75, + "learning_rate": 5.1135255307589495e-06, + "loss": 1.3945, + "step": 34949 + }, + { + "epoch": 2.75, + "learning_rate": 5.110326354897343e-06, + "loss": 1.4443, + "step": 34950 + }, + { + "epoch": 2.75, + "learning_rate": 5.107128162756674e-06, + "loss": 1.4051, + "step": 34951 + }, + { + "epoch": 2.75, + "learning_rate": 5.103930954358643e-06, + "loss": 1.4833, + "step": 34952 + }, + { + "epoch": 2.75, + "learning_rate": 5.100734729724965e-06, + "loss": 1.388, + "step": 34953 + }, + { + "epoch": 2.75, + "learning_rate": 5.097539488877323e-06, + "loss": 1.4639, + "step": 34954 + }, + { + "epoch": 2.75, + "learning_rate": 5.094345231837433e-06, + "loss": 1.4264, + "step": 34955 + }, + { + "epoch": 2.75, + "learning_rate": 5.091151958626976e-06, + "loss": 1.4926, + "step": 34956 + }, + { + "epoch": 2.75, + "learning_rate": 5.087959669267605e-06, + "loss": 1.3806, + "step": 34957 + }, + { + "epoch": 2.75, + "learning_rate": 5.08476836378105e-06, + "loss": 1.4331, + "step": 34958 + }, + { + "epoch": 2.75, + "learning_rate": 5.081578042188944e-06, + "loss": 1.4647, + "step": 34959 + }, + { + "epoch": 2.75, + "learning_rate": 5.078388704512937e-06, + "loss": 1.3969, + "step": 34960 + }, + { + "epoch": 2.75, + "learning_rate": 5.075200350774678e-06, + "loss": 1.4883, + "step": 34961 + }, + { + "epoch": 2.75, + "learning_rate": 5.072012980995865e-06, + "loss": 1.4357, + "step": 34962 + }, + { + "epoch": 2.75, + "learning_rate": 5.0688265951981e-06, + "loss": 1.4924, + "step": 34963 + }, + { + "epoch": 2.75, + "learning_rate": 5.065641193403014e-06, + "loss": 1.4575, + "step": 34964 + }, + { + "epoch": 2.75, + "learning_rate": 5.0624567756322566e-06, + "loss": 1.458, + "step": 34965 + }, + { + "epoch": 2.75, + "learning_rate": 5.059273341907427e-06, + "loss": 1.4502, + "step": 34966 + }, + { + "epoch": 2.75, + "learning_rate": 5.056090892250142e-06, + "loss": 1.4397, + "step": 34967 + }, + { + "epoch": 2.75, + "learning_rate": 5.052909426682017e-06, + "loss": 1.3788, + "step": 34968 + }, + { + "epoch": 2.75, + "learning_rate": 5.049728945224651e-06, + "loss": 1.4377, + "step": 34969 + }, + { + "epoch": 2.75, + "learning_rate": 5.046549447899645e-06, + "loss": 1.4248, + "step": 34970 + }, + { + "epoch": 2.75, + "learning_rate": 5.043370934728547e-06, + "loss": 1.473, + "step": 34971 + }, + { + "epoch": 2.75, + "learning_rate": 5.0401934057329894e-06, + "loss": 1.4095, + "step": 34972 + }, + { + "epoch": 2.75, + "learning_rate": 5.037016860934523e-06, + "loss": 1.4463, + "step": 34973 + }, + { + "epoch": 2.75, + "learning_rate": 5.033841300354713e-06, + "loss": 1.4691, + "step": 34974 + }, + { + "epoch": 2.75, + "learning_rate": 5.0306667240151254e-06, + "loss": 1.4583, + "step": 34975 + }, + { + "epoch": 2.75, + "learning_rate": 5.027493131937277e-06, + "loss": 1.4089, + "step": 34976 + }, + { + "epoch": 2.75, + "learning_rate": 5.024320524142783e-06, + "loss": 1.402, + "step": 34977 + }, + { + "epoch": 2.75, + "learning_rate": 5.021148900653127e-06, + "loss": 1.4364, + "step": 34978 + }, + { + "epoch": 2.75, + "learning_rate": 5.0179782614898915e-06, + "loss": 1.3802, + "step": 34979 + }, + { + "epoch": 2.75, + "learning_rate": 5.014808606674558e-06, + "loss": 1.4355, + "step": 34980 + }, + { + "epoch": 2.75, + "learning_rate": 5.011639936228662e-06, + "loss": 1.4801, + "step": 34981 + }, + { + "epoch": 2.75, + "learning_rate": 5.0084722501737336e-06, + "loss": 1.4501, + "step": 34982 + }, + { + "epoch": 2.75, + "learning_rate": 5.005305548531258e-06, + "loss": 1.4759, + "step": 34983 + }, + { + "epoch": 2.75, + "learning_rate": 5.002139831322732e-06, + "loss": 1.4356, + "step": 34984 + }, + { + "epoch": 2.75, + "learning_rate": 4.9989750985696745e-06, + "loss": 1.4908, + "step": 34985 + }, + { + "epoch": 2.75, + "learning_rate": 4.995811350293566e-06, + "loss": 1.4146, + "step": 34986 + }, + { + "epoch": 2.75, + "learning_rate": 4.992648586515858e-06, + "loss": 1.4271, + "step": 34987 + }, + { + "epoch": 2.75, + "learning_rate": 4.989486807258047e-06, + "loss": 1.4495, + "step": 34988 + }, + { + "epoch": 2.75, + "learning_rate": 4.986326012541619e-06, + "loss": 1.4764, + "step": 34989 + }, + { + "epoch": 2.75, + "learning_rate": 4.983166202387989e-06, + "loss": 1.4544, + "step": 34990 + }, + { + "epoch": 2.75, + "learning_rate": 4.98000737681864e-06, + "loss": 1.4828, + "step": 34991 + }, + { + "epoch": 2.75, + "learning_rate": 4.9768495358550045e-06, + "loss": 1.484, + "step": 34992 + }, + { + "epoch": 2.75, + "learning_rate": 4.973692679518531e-06, + "loss": 1.4629, + "step": 34993 + }, + { + "epoch": 2.75, + "learning_rate": 4.970536807830672e-06, + "loss": 1.4906, + "step": 34994 + }, + { + "epoch": 2.75, + "learning_rate": 4.9673819208128074e-06, + "loss": 1.4332, + "step": 34995 + }, + { + "epoch": 2.75, + "learning_rate": 4.964228018486405e-06, + "loss": 1.4624, + "step": 34996 + }, + { + "epoch": 2.75, + "learning_rate": 4.961075100872863e-06, + "loss": 1.4591, + "step": 34997 + }, + { + "epoch": 2.75, + "learning_rate": 4.95792316799355e-06, + "loss": 1.4727, + "step": 34998 + }, + { + "epoch": 2.75, + "learning_rate": 4.954772219869929e-06, + "loss": 1.4573, + "step": 34999 + }, + { + "epoch": 2.75, + "learning_rate": 4.9516222565233524e-06, + "loss": 1.464, + "step": 35000 + }, + { + "epoch": 2.75, + "learning_rate": 4.948473277975201e-06, + "loss": 1.4448, + "step": 35001 + }, + { + "epoch": 2.75, + "learning_rate": 4.945325284246893e-06, + "loss": 1.4957, + "step": 35002 + }, + { + "epoch": 2.75, + "learning_rate": 4.942178275359776e-06, + "loss": 1.4507, + "step": 35003 + }, + { + "epoch": 2.75, + "learning_rate": 4.939032251335201e-06, + "loss": 1.4536, + "step": 35004 + }, + { + "epoch": 2.75, + "learning_rate": 4.93588721219455e-06, + "loss": 1.4368, + "step": 35005 + }, + { + "epoch": 2.75, + "learning_rate": 4.93274315795919e-06, + "loss": 1.4719, + "step": 35006 + }, + { + "epoch": 2.75, + "learning_rate": 4.929600088650437e-06, + "loss": 1.4995, + "step": 35007 + }, + { + "epoch": 2.75, + "learning_rate": 4.926458004289624e-06, + "loss": 1.4657, + "step": 35008 + }, + { + "epoch": 2.75, + "learning_rate": 4.923316904898134e-06, + "loss": 1.4102, + "step": 35009 + }, + { + "epoch": 2.75, + "learning_rate": 4.920176790497249e-06, + "loss": 1.4652, + "step": 35010 + }, + { + "epoch": 2.75, + "learning_rate": 4.917037661108303e-06, + "loss": 1.4345, + "step": 35011 + }, + { + "epoch": 2.75, + "learning_rate": 4.913899516752612e-06, + "loss": 1.4197, + "step": 35012 + }, + { + "epoch": 2.75, + "learning_rate": 4.9107623574514755e-06, + "loss": 1.4759, + "step": 35013 + }, + { + "epoch": 2.75, + "learning_rate": 4.907626183226193e-06, + "loss": 1.456, + "step": 35014 + }, + { + "epoch": 2.76, + "learning_rate": 4.904490994098048e-06, + "loss": 1.4515, + "step": 35015 + }, + { + "epoch": 2.76, + "learning_rate": 4.901356790088373e-06, + "loss": 1.4879, + "step": 35016 + }, + { + "epoch": 2.76, + "learning_rate": 4.898223571218385e-06, + "loss": 1.506, + "step": 35017 + }, + { + "epoch": 2.76, + "learning_rate": 4.895091337509383e-06, + "loss": 1.4294, + "step": 35018 + }, + { + "epoch": 2.76, + "learning_rate": 4.891960088982666e-06, + "loss": 1.4331, + "step": 35019 + }, + { + "epoch": 2.76, + "learning_rate": 4.888829825659435e-06, + "loss": 1.4016, + "step": 35020 + }, + { + "epoch": 2.76, + "learning_rate": 4.885700547560972e-06, + "loss": 1.4037, + "step": 35021 + }, + { + "epoch": 2.76, + "learning_rate": 4.882572254708528e-06, + "loss": 1.4014, + "step": 35022 + }, + { + "epoch": 2.76, + "learning_rate": 4.879444947123351e-06, + "loss": 1.4214, + "step": 35023 + }, + { + "epoch": 2.76, + "learning_rate": 4.876318624826625e-06, + "loss": 1.4799, + "step": 35024 + }, + { + "epoch": 2.76, + "learning_rate": 4.873193287839616e-06, + "loss": 1.4605, + "step": 35025 + }, + { + "epoch": 2.76, + "learning_rate": 4.870068936183557e-06, + "loss": 1.4593, + "step": 35026 + }, + { + "epoch": 2.76, + "learning_rate": 4.866945569879632e-06, + "loss": 1.4454, + "step": 35027 + }, + { + "epoch": 2.76, + "learning_rate": 4.863823188949073e-06, + "loss": 1.4454, + "step": 35028 + }, + { + "epoch": 2.76, + "learning_rate": 4.86070179341303e-06, + "loss": 1.4513, + "step": 35029 + }, + { + "epoch": 2.76, + "learning_rate": 4.857581383292752e-06, + "loss": 1.5065, + "step": 35030 + }, + { + "epoch": 2.76, + "learning_rate": 4.85446195860939e-06, + "loss": 1.4448, + "step": 35031 + }, + { + "epoch": 2.76, + "learning_rate": 4.8513435193841265e-06, + "loss": 1.4156, + "step": 35032 + }, + { + "epoch": 2.76, + "learning_rate": 4.848226065638144e-06, + "loss": 1.4363, + "step": 35033 + }, + { + "epoch": 2.76, + "learning_rate": 4.8451095973926264e-06, + "loss": 1.4308, + "step": 35034 + }, + { + "epoch": 2.76, + "learning_rate": 4.841994114668673e-06, + "loss": 1.4464, + "step": 35035 + }, + { + "epoch": 2.76, + "learning_rate": 4.838879617487501e-06, + "loss": 1.4103, + "step": 35036 + }, + { + "epoch": 2.76, + "learning_rate": 4.835766105870242e-06, + "loss": 1.4273, + "step": 35037 + }, + { + "epoch": 2.76, + "learning_rate": 4.832653579837997e-06, + "loss": 1.4555, + "step": 35038 + }, + { + "epoch": 2.76, + "learning_rate": 4.829542039411915e-06, + "loss": 1.4021, + "step": 35039 + }, + { + "epoch": 2.76, + "learning_rate": 4.826431484613147e-06, + "loss": 1.4491, + "step": 35040 + }, + { + "epoch": 2.76, + "learning_rate": 4.823321915462808e-06, + "loss": 1.4618, + "step": 35041 + }, + { + "epoch": 2.76, + "learning_rate": 4.820213331981982e-06, + "loss": 1.4623, + "step": 35042 + }, + { + "epoch": 2.76, + "learning_rate": 4.8171057341918e-06, + "loss": 1.3892, + "step": 35043 + }, + { + "epoch": 2.76, + "learning_rate": 4.813999122113349e-06, + "loss": 1.4924, + "step": 35044 + }, + { + "epoch": 2.76, + "learning_rate": 4.810893495767709e-06, + "loss": 1.4131, + "step": 35045 + }, + { + "epoch": 2.76, + "learning_rate": 4.807788855176015e-06, + "loss": 1.4506, + "step": 35046 + }, + { + "epoch": 2.76, + "learning_rate": 4.804685200359281e-06, + "loss": 1.4123, + "step": 35047 + }, + { + "epoch": 2.76, + "learning_rate": 4.801582531338627e-06, + "loss": 1.4399, + "step": 35048 + }, + { + "epoch": 2.76, + "learning_rate": 4.798480848135083e-06, + "loss": 1.3856, + "step": 35049 + }, + { + "epoch": 2.76, + "learning_rate": 4.7953801507697345e-06, + "loss": 1.4363, + "step": 35050 + }, + { + "epoch": 2.76, + "learning_rate": 4.792280439263629e-06, + "loss": 1.4439, + "step": 35051 + }, + { + "epoch": 2.76, + "learning_rate": 4.789181713637802e-06, + "loss": 1.462, + "step": 35052 + }, + { + "epoch": 2.76, + "learning_rate": 4.786083973913301e-06, + "loss": 1.3979, + "step": 35053 + }, + { + "epoch": 2.76, + "learning_rate": 4.7829872201111455e-06, + "loss": 1.4136, + "step": 35054 + }, + { + "epoch": 2.76, + "learning_rate": 4.7798914522523655e-06, + "loss": 1.3698, + "step": 35055 + }, + { + "epoch": 2.76, + "learning_rate": 4.7767966703579796e-06, + "loss": 1.4085, + "step": 35056 + }, + { + "epoch": 2.76, + "learning_rate": 4.77370287444902e-06, + "loss": 1.4949, + "step": 35057 + }, + { + "epoch": 2.76, + "learning_rate": 4.770610064546488e-06, + "loss": 1.4243, + "step": 35058 + }, + { + "epoch": 2.76, + "learning_rate": 4.767518240671331e-06, + "loss": 1.4586, + "step": 35059 + }, + { + "epoch": 2.76, + "learning_rate": 4.764427402844617e-06, + "loss": 1.3752, + "step": 35060 + }, + { + "epoch": 2.76, + "learning_rate": 4.76133755108728e-06, + "loss": 1.4561, + "step": 35061 + }, + { + "epoch": 2.76, + "learning_rate": 4.758248685420285e-06, + "loss": 1.4496, + "step": 35062 + }, + { + "epoch": 2.76, + "learning_rate": 4.755160805864666e-06, + "loss": 1.4359, + "step": 35063 + }, + { + "epoch": 2.76, + "learning_rate": 4.75207391244134e-06, + "loss": 1.4188, + "step": 35064 + }, + { + "epoch": 2.76, + "learning_rate": 4.748988005171289e-06, + "loss": 1.4639, + "step": 35065 + }, + { + "epoch": 2.76, + "learning_rate": 4.745903084075431e-06, + "loss": 1.4312, + "step": 35066 + }, + { + "epoch": 2.76, + "learning_rate": 4.7428191491747484e-06, + "loss": 1.4261, + "step": 35067 + }, + { + "epoch": 2.76, + "learning_rate": 4.739736200490174e-06, + "loss": 1.4644, + "step": 35068 + }, + { + "epoch": 2.76, + "learning_rate": 4.7366542380426084e-06, + "loss": 1.4927, + "step": 35069 + }, + { + "epoch": 2.76, + "learning_rate": 4.733573261853002e-06, + "loss": 1.4402, + "step": 35070 + }, + { + "epoch": 2.76, + "learning_rate": 4.7304932719422705e-06, + "loss": 1.3981, + "step": 35071 + }, + { + "epoch": 2.76, + "learning_rate": 4.727414268331331e-06, + "loss": 1.4064, + "step": 35072 + }, + { + "epoch": 2.76, + "learning_rate": 4.72433625104105e-06, + "loss": 1.4092, + "step": 35073 + }, + { + "epoch": 2.76, + "learning_rate": 4.721259220092393e-06, + "loss": 1.4602, + "step": 35074 + }, + { + "epoch": 2.76, + "learning_rate": 4.718183175506213e-06, + "loss": 1.4315, + "step": 35075 + }, + { + "epoch": 2.76, + "learning_rate": 4.715108117303373e-06, + "loss": 1.42, + "step": 35076 + }, + { + "epoch": 2.76, + "learning_rate": 4.712034045504792e-06, + "loss": 1.4471, + "step": 35077 + }, + { + "epoch": 2.76, + "learning_rate": 4.70896096013132e-06, + "loss": 1.4481, + "step": 35078 + }, + { + "epoch": 2.76, + "learning_rate": 4.705888861203805e-06, + "loss": 1.4099, + "step": 35079 + }, + { + "epoch": 2.76, + "learning_rate": 4.702817748743148e-06, + "loss": 1.4489, + "step": 35080 + }, + { + "epoch": 2.76, + "learning_rate": 4.699747622770184e-06, + "loss": 1.4969, + "step": 35081 + }, + { + "epoch": 2.76, + "learning_rate": 4.696678483305744e-06, + "loss": 1.4803, + "step": 35082 + }, + { + "epoch": 2.76, + "learning_rate": 4.693610330370645e-06, + "loss": 1.4614, + "step": 35083 + }, + { + "epoch": 2.76, + "learning_rate": 4.690543163985771e-06, + "loss": 1.476, + "step": 35084 + }, + { + "epoch": 2.76, + "learning_rate": 4.687476984171923e-06, + "loss": 1.4294, + "step": 35085 + }, + { + "epoch": 2.76, + "learning_rate": 4.6844117909498824e-06, + "loss": 1.4672, + "step": 35086 + }, + { + "epoch": 2.76, + "learning_rate": 4.681347584340517e-06, + "loss": 1.4778, + "step": 35087 + }, + { + "epoch": 2.76, + "learning_rate": 4.678284364364626e-06, + "loss": 1.4248, + "step": 35088 + }, + { + "epoch": 2.76, + "learning_rate": 4.675222131042977e-06, + "loss": 1.3874, + "step": 35089 + }, + { + "epoch": 2.76, + "learning_rate": 4.672160884396353e-06, + "loss": 1.4223, + "step": 35090 + }, + { + "epoch": 2.76, + "learning_rate": 4.669100624445587e-06, + "loss": 1.4324, + "step": 35091 + }, + { + "epoch": 2.76, + "learning_rate": 4.666041351211414e-06, + "loss": 1.4208, + "step": 35092 + }, + { + "epoch": 2.76, + "learning_rate": 4.662983064714615e-06, + "loss": 1.4666, + "step": 35093 + }, + { + "epoch": 2.76, + "learning_rate": 4.659925764975958e-06, + "loss": 1.416, + "step": 35094 + }, + { + "epoch": 2.76, + "learning_rate": 4.65686945201621e-06, + "loss": 1.4267, + "step": 35095 + }, + { + "epoch": 2.76, + "learning_rate": 4.6538141258561035e-06, + "loss": 1.4632, + "step": 35096 + }, + { + "epoch": 2.76, + "learning_rate": 4.6507597865163894e-06, + "loss": 1.5155, + "step": 35097 + }, + { + "epoch": 2.76, + "learning_rate": 4.647706434017817e-06, + "loss": 1.4903, + "step": 35098 + }, + { + "epoch": 2.76, + "learning_rate": 4.644654068381087e-06, + "loss": 1.4696, + "step": 35099 + }, + { + "epoch": 2.76, + "learning_rate": 4.641602689626967e-06, + "loss": 1.4391, + "step": 35100 + }, + { + "epoch": 2.76, + "learning_rate": 4.638552297776138e-06, + "loss": 1.4072, + "step": 35101 + }, + { + "epoch": 2.76, + "learning_rate": 4.635502892849302e-06, + "loss": 1.4402, + "step": 35102 + }, + { + "epoch": 2.76, + "learning_rate": 4.632454474867192e-06, + "loss": 1.4596, + "step": 35103 + }, + { + "epoch": 2.76, + "learning_rate": 4.629407043850508e-06, + "loss": 1.4686, + "step": 35104 + }, + { + "epoch": 2.76, + "learning_rate": 4.626360599819934e-06, + "loss": 1.49, + "step": 35105 + }, + { + "epoch": 2.76, + "learning_rate": 4.623315142796136e-06, + "loss": 1.4739, + "step": 35106 + }, + { + "epoch": 2.76, + "learning_rate": 4.620270672799797e-06, + "loss": 1.4302, + "step": 35107 + }, + { + "epoch": 2.76, + "learning_rate": 4.6172271898516026e-06, + "loss": 1.4283, + "step": 35108 + }, + { + "epoch": 2.76, + "learning_rate": 4.614184693972201e-06, + "loss": 1.4658, + "step": 35109 + }, + { + "epoch": 2.76, + "learning_rate": 4.611143185182259e-06, + "loss": 1.4765, + "step": 35110 + }, + { + "epoch": 2.76, + "learning_rate": 4.608102663502428e-06, + "loss": 1.4416, + "step": 35111 + }, + { + "epoch": 2.76, + "learning_rate": 4.60506312895334e-06, + "loss": 1.4199, + "step": 35112 + }, + { + "epoch": 2.76, + "learning_rate": 4.60202458155563e-06, + "loss": 1.4327, + "step": 35113 + }, + { + "epoch": 2.76, + "learning_rate": 4.598987021329947e-06, + "loss": 1.4719, + "step": 35114 + }, + { + "epoch": 2.76, + "learning_rate": 4.595950448296892e-06, + "loss": 1.4706, + "step": 35115 + }, + { + "epoch": 2.76, + "learning_rate": 4.5929148624770985e-06, + "loss": 1.4523, + "step": 35116 + }, + { + "epoch": 2.76, + "learning_rate": 4.589880263891166e-06, + "loss": 1.4241, + "step": 35117 + }, + { + "epoch": 2.76, + "learning_rate": 4.586846652559711e-06, + "loss": 1.4578, + "step": 35118 + }, + { + "epoch": 2.76, + "learning_rate": 4.5838140285033185e-06, + "loss": 1.4388, + "step": 35119 + }, + { + "epoch": 2.76, + "learning_rate": 4.580782391742571e-06, + "loss": 1.4147, + "step": 35120 + }, + { + "epoch": 2.76, + "learning_rate": 4.577751742298086e-06, + "loss": 1.4014, + "step": 35121 + }, + { + "epoch": 2.76, + "learning_rate": 4.574722080190396e-06, + "loss": 1.4347, + "step": 35122 + }, + { + "epoch": 2.76, + "learning_rate": 4.5716934054401025e-06, + "loss": 1.4247, + "step": 35123 + }, + { + "epoch": 2.76, + "learning_rate": 4.5686657180677545e-06, + "loss": 1.451, + "step": 35124 + }, + { + "epoch": 2.76, + "learning_rate": 4.565639018093903e-06, + "loss": 1.3938, + "step": 35125 + }, + { + "epoch": 2.76, + "learning_rate": 4.562613305539115e-06, + "loss": 1.4639, + "step": 35126 + }, + { + "epoch": 2.76, + "learning_rate": 4.559588580423923e-06, + "loss": 1.4901, + "step": 35127 + }, + { + "epoch": 2.76, + "learning_rate": 4.556564842768862e-06, + "loss": 1.4157, + "step": 35128 + }, + { + "epoch": 2.76, + "learning_rate": 4.553542092594464e-06, + "loss": 1.4231, + "step": 35129 + }, + { + "epoch": 2.76, + "learning_rate": 4.550520329921231e-06, + "loss": 1.4005, + "step": 35130 + }, + { + "epoch": 2.76, + "learning_rate": 4.547499554769729e-06, + "loss": 1.4106, + "step": 35131 + }, + { + "epoch": 2.76, + "learning_rate": 4.544479767160425e-06, + "loss": 1.4889, + "step": 35132 + }, + { + "epoch": 2.76, + "learning_rate": 4.541460967113836e-06, + "loss": 1.4651, + "step": 35133 + }, + { + "epoch": 2.76, + "learning_rate": 4.538443154650445e-06, + "loss": 1.4403, + "step": 35134 + }, + { + "epoch": 2.76, + "learning_rate": 4.53542632979077e-06, + "loss": 1.4588, + "step": 35135 + }, + { + "epoch": 2.76, + "learning_rate": 4.532410492555277e-06, + "loss": 1.4161, + "step": 35136 + }, + { + "epoch": 2.76, + "learning_rate": 4.529395642964418e-06, + "loss": 1.4273, + "step": 35137 + }, + { + "epoch": 2.76, + "learning_rate": 4.526381781038707e-06, + "loss": 1.4638, + "step": 35138 + }, + { + "epoch": 2.76, + "learning_rate": 4.52336890679858e-06, + "loss": 1.4432, + "step": 35139 + }, + { + "epoch": 2.76, + "learning_rate": 4.520357020264486e-06, + "loss": 1.4147, + "step": 35140 + }, + { + "epoch": 2.76, + "learning_rate": 4.517346121456894e-06, + "loss": 1.4028, + "step": 35141 + }, + { + "epoch": 2.77, + "learning_rate": 4.514336210396252e-06, + "loss": 1.4689, + "step": 35142 + }, + { + "epoch": 2.77, + "learning_rate": 4.511327287102978e-06, + "loss": 1.4253, + "step": 35143 + }, + { + "epoch": 2.77, + "learning_rate": 4.5083193515974895e-06, + "loss": 1.4373, + "step": 35144 + }, + { + "epoch": 2.77, + "learning_rate": 4.505312403900235e-06, + "loss": 1.447, + "step": 35145 + }, + { + "epoch": 2.77, + "learning_rate": 4.502306444031617e-06, + "loss": 1.4317, + "step": 35146 + }, + { + "epoch": 2.77, + "learning_rate": 4.499301472012018e-06, + "loss": 1.3922, + "step": 35147 + }, + { + "epoch": 2.77, + "learning_rate": 4.4962974878619055e-06, + "loss": 1.4731, + "step": 35148 + }, + { + "epoch": 2.77, + "learning_rate": 4.493294491601612e-06, + "loss": 1.4594, + "step": 35149 + }, + { + "epoch": 2.77, + "learning_rate": 4.490292483251573e-06, + "loss": 1.3961, + "step": 35150 + }, + { + "epoch": 2.77, + "learning_rate": 4.487291462832121e-06, + "loss": 1.437, + "step": 35151 + }, + { + "epoch": 2.77, + "learning_rate": 4.48429143036369e-06, + "loss": 1.4451, + "step": 35152 + }, + { + "epoch": 2.77, + "learning_rate": 4.481292385866614e-06, + "loss": 1.4503, + "step": 35153 + }, + { + "epoch": 2.77, + "learning_rate": 4.478294329361243e-06, + "loss": 1.4412, + "step": 35154 + }, + { + "epoch": 2.77, + "learning_rate": 4.4752972608679606e-06, + "loss": 1.4706, + "step": 35155 + }, + { + "epoch": 2.77, + "learning_rate": 4.472301180407101e-06, + "loss": 1.4395, + "step": 35156 + }, + { + "epoch": 2.77, + "learning_rate": 4.469306087998997e-06, + "loss": 1.4771, + "step": 35157 + }, + { + "epoch": 2.77, + "learning_rate": 4.466311983664001e-06, + "loss": 1.4231, + "step": 35158 + }, + { + "epoch": 2.77, + "learning_rate": 4.463318867422444e-06, + "loss": 1.5165, + "step": 35159 + }, + { + "epoch": 2.77, + "learning_rate": 4.4603267392946455e-06, + "loss": 1.4307, + "step": 35160 + }, + { + "epoch": 2.77, + "learning_rate": 4.457335599300871e-06, + "loss": 1.4555, + "step": 35161 + }, + { + "epoch": 2.77, + "learning_rate": 4.454345447461505e-06, + "loss": 1.4331, + "step": 35162 + }, + { + "epoch": 2.77, + "learning_rate": 4.451356283796814e-06, + "loss": 1.4756, + "step": 35163 + }, + { + "epoch": 2.77, + "learning_rate": 4.448368108327083e-06, + "loss": 1.4215, + "step": 35164 + }, + { + "epoch": 2.77, + "learning_rate": 4.4453809210725945e-06, + "loss": 1.4393, + "step": 35165 + }, + { + "epoch": 2.77, + "learning_rate": 4.442394722053666e-06, + "loss": 1.4305, + "step": 35166 + }, + { + "epoch": 2.77, + "learning_rate": 4.439409511290565e-06, + "loss": 1.4451, + "step": 35167 + }, + { + "epoch": 2.77, + "learning_rate": 4.436425288803525e-06, + "loss": 1.4537, + "step": 35168 + }, + { + "epoch": 2.77, + "learning_rate": 4.433442054612829e-06, + "loss": 1.3891, + "step": 35169 + }, + { + "epoch": 2.77, + "learning_rate": 4.430459808738746e-06, + "loss": 1.4806, + "step": 35170 + }, + { + "epoch": 2.77, + "learning_rate": 4.427478551201491e-06, + "loss": 1.4261, + "step": 35171 + }, + { + "epoch": 2.77, + "learning_rate": 4.4244982820213495e-06, + "loss": 1.4613, + "step": 35172 + }, + { + "epoch": 2.77, + "learning_rate": 4.421519001218521e-06, + "loss": 1.4794, + "step": 35173 + }, + { + "epoch": 2.77, + "learning_rate": 4.418540708813223e-06, + "loss": 1.4131, + "step": 35174 + }, + { + "epoch": 2.77, + "learning_rate": 4.415563404825706e-06, + "loss": 1.3854, + "step": 35175 + }, + { + "epoch": 2.77, + "learning_rate": 4.412587089276171e-06, + "loss": 1.4473, + "step": 35176 + }, + { + "epoch": 2.77, + "learning_rate": 4.409611762184834e-06, + "loss": 1.4137, + "step": 35177 + }, + { + "epoch": 2.77, + "learning_rate": 4.40663742357188e-06, + "loss": 1.469, + "step": 35178 + }, + { + "epoch": 2.77, + "learning_rate": 4.403664073457524e-06, + "loss": 1.4058, + "step": 35179 + }, + { + "epoch": 2.77, + "learning_rate": 4.400691711861954e-06, + "loss": 1.4721, + "step": 35180 + }, + { + "epoch": 2.77, + "learning_rate": 4.3977203388053e-06, + "loss": 1.4746, + "step": 35181 + }, + { + "epoch": 2.77, + "learning_rate": 4.394749954307797e-06, + "loss": 1.4668, + "step": 35182 + }, + { + "epoch": 2.77, + "learning_rate": 4.391780558389596e-06, + "loss": 1.4026, + "step": 35183 + }, + { + "epoch": 2.77, + "learning_rate": 4.3888121510708475e-06, + "loss": 1.5041, + "step": 35184 + }, + { + "epoch": 2.77, + "learning_rate": 4.385844732371685e-06, + "loss": 1.4289, + "step": 35185 + }, + { + "epoch": 2.77, + "learning_rate": 4.382878302312309e-06, + "loss": 1.4476, + "step": 35186 + }, + { + "epoch": 2.77, + "learning_rate": 4.379912860912838e-06, + "loss": 1.4494, + "step": 35187 + }, + { + "epoch": 2.77, + "learning_rate": 4.376948408193371e-06, + "loss": 1.4311, + "step": 35188 + }, + { + "epoch": 2.77, + "learning_rate": 4.373984944174091e-06, + "loss": 1.4693, + "step": 35189 + }, + { + "epoch": 2.77, + "learning_rate": 4.371022468875085e-06, + "loss": 1.3864, + "step": 35190 + }, + { + "epoch": 2.77, + "learning_rate": 4.368060982316451e-06, + "loss": 1.4643, + "step": 35191 + }, + { + "epoch": 2.77, + "learning_rate": 4.3651004845183244e-06, + "loss": 1.4575, + "step": 35192 + }, + { + "epoch": 2.77, + "learning_rate": 4.362140975500822e-06, + "loss": 1.3845, + "step": 35193 + }, + { + "epoch": 2.77, + "learning_rate": 4.359182455283994e-06, + "loss": 1.4897, + "step": 35194 + }, + { + "epoch": 2.77, + "learning_rate": 4.356224923887941e-06, + "loss": 1.4027, + "step": 35195 + }, + { + "epoch": 2.77, + "learning_rate": 4.3532683813327305e-06, + "loss": 1.506, + "step": 35196 + }, + { + "epoch": 2.77, + "learning_rate": 4.3503128276384804e-06, + "loss": 1.4674, + "step": 35197 + }, + { + "epoch": 2.77, + "learning_rate": 4.347358262825223e-06, + "loss": 1.4486, + "step": 35198 + }, + { + "epoch": 2.77, + "learning_rate": 4.3444046869130275e-06, + "loss": 1.4728, + "step": 35199 + }, + { + "epoch": 2.77, + "learning_rate": 4.3414520999219435e-06, + "loss": 1.4037, + "step": 35200 + }, + { + "epoch": 2.77, + "learning_rate": 4.338500501872022e-06, + "loss": 1.3636, + "step": 35201 + }, + { + "epoch": 2.77, + "learning_rate": 4.335549892783297e-06, + "loss": 1.4461, + "step": 35202 + }, + { + "epoch": 2.77, + "learning_rate": 4.332600272675801e-06, + "loss": 1.4669, + "step": 35203 + }, + { + "epoch": 2.77, + "learning_rate": 4.32965164156957e-06, + "loss": 1.4734, + "step": 35204 + }, + { + "epoch": 2.77, + "learning_rate": 4.326703999484604e-06, + "loss": 1.4295, + "step": 35205 + }, + { + "epoch": 2.77, + "learning_rate": 4.3237573464409536e-06, + "loss": 1.4229, + "step": 35206 + }, + { + "epoch": 2.77, + "learning_rate": 4.320811682458586e-06, + "loss": 1.4859, + "step": 35207 + }, + { + "epoch": 2.77, + "learning_rate": 4.317867007557502e-06, + "loss": 1.4641, + "step": 35208 + }, + { + "epoch": 2.77, + "learning_rate": 4.314923321757719e-06, + "loss": 1.4502, + "step": 35209 + }, + { + "epoch": 2.77, + "learning_rate": 4.31198062507922e-06, + "loss": 1.4262, + "step": 35210 + }, + { + "epoch": 2.77, + "learning_rate": 4.30903891754194e-06, + "loss": 1.4308, + "step": 35211 + }, + { + "epoch": 2.77, + "learning_rate": 4.3060981991659135e-06, + "loss": 1.4327, + "step": 35212 + }, + { + "epoch": 2.77, + "learning_rate": 4.303158469971074e-06, + "loss": 1.4354, + "step": 35213 + }, + { + "epoch": 2.77, + "learning_rate": 4.3002197299774055e-06, + "loss": 1.4522, + "step": 35214 + }, + { + "epoch": 2.77, + "learning_rate": 4.297281979204809e-06, + "loss": 1.4596, + "step": 35215 + }, + { + "epoch": 2.77, + "learning_rate": 4.294345217673284e-06, + "loss": 1.4272, + "step": 35216 + }, + { + "epoch": 2.77, + "learning_rate": 4.291409445402749e-06, + "loss": 1.4739, + "step": 35217 + }, + { + "epoch": 2.77, + "learning_rate": 4.288474662413138e-06, + "loss": 1.4205, + "step": 35218 + }, + { + "epoch": 2.77, + "learning_rate": 4.285540868724352e-06, + "loss": 1.4266, + "step": 35219 + }, + { + "epoch": 2.77, + "learning_rate": 4.282608064356341e-06, + "loss": 1.514, + "step": 35220 + }, + { + "epoch": 2.77, + "learning_rate": 4.279676249329023e-06, + "loss": 1.4319, + "step": 35221 + }, + { + "epoch": 2.77, + "learning_rate": 4.276745423662265e-06, + "loss": 1.4459, + "step": 35222 + }, + { + "epoch": 2.77, + "learning_rate": 4.273815587376001e-06, + "loss": 1.4331, + "step": 35223 + }, + { + "epoch": 2.77, + "learning_rate": 4.270886740490115e-06, + "loss": 1.4522, + "step": 35224 + }, + { + "epoch": 2.77, + "learning_rate": 4.267958883024475e-06, + "loss": 1.4326, + "step": 35225 + }, + { + "epoch": 2.77, + "learning_rate": 4.265032014998998e-06, + "loss": 1.4736, + "step": 35226 + }, + { + "epoch": 2.77, + "learning_rate": 4.262106136433519e-06, + "loss": 1.4757, + "step": 35227 + }, + { + "epoch": 2.77, + "learning_rate": 4.259181247347887e-06, + "loss": 1.4309, + "step": 35228 + }, + { + "epoch": 2.77, + "learning_rate": 4.256257347762004e-06, + "loss": 1.4826, + "step": 35229 + }, + { + "epoch": 2.77, + "learning_rate": 4.253334437695721e-06, + "loss": 1.4155, + "step": 35230 + }, + { + "epoch": 2.77, + "learning_rate": 4.2504125171688556e-06, + "loss": 1.4297, + "step": 35231 + }, + { + "epoch": 2.77, + "learning_rate": 4.247491586201257e-06, + "loss": 1.4243, + "step": 35232 + }, + { + "epoch": 2.77, + "learning_rate": 4.244571644812761e-06, + "loss": 1.4873, + "step": 35233 + }, + { + "epoch": 2.77, + "learning_rate": 4.241652693023201e-06, + "loss": 1.4362, + "step": 35234 + }, + { + "epoch": 2.77, + "learning_rate": 4.238734730852361e-06, + "loss": 1.4569, + "step": 35235 + }, + { + "epoch": 2.77, + "learning_rate": 4.2358177583200755e-06, + "loss": 1.4099, + "step": 35236 + }, + { + "epoch": 2.77, + "learning_rate": 4.232901775446163e-06, + "loss": 1.4314, + "step": 35237 + }, + { + "epoch": 2.77, + "learning_rate": 4.229986782250405e-06, + "loss": 1.5123, + "step": 35238 + }, + { + "epoch": 2.77, + "learning_rate": 4.227072778752588e-06, + "loss": 1.4638, + "step": 35239 + }, + { + "epoch": 2.77, + "learning_rate": 4.224159764972513e-06, + "loss": 1.4933, + "step": 35240 + }, + { + "epoch": 2.77, + "learning_rate": 4.221247740929945e-06, + "loss": 1.411, + "step": 35241 + }, + { + "epoch": 2.77, + "learning_rate": 4.218336706644637e-06, + "loss": 1.4525, + "step": 35242 + }, + { + "epoch": 2.77, + "learning_rate": 4.21542666213639e-06, + "loss": 1.4294, + "step": 35243 + }, + { + "epoch": 2.77, + "learning_rate": 4.212517607424937e-06, + "loss": 1.4184, + "step": 35244 + }, + { + "epoch": 2.77, + "learning_rate": 4.209609542530046e-06, + "loss": 1.4468, + "step": 35245 + }, + { + "epoch": 2.77, + "learning_rate": 4.2067024674714344e-06, + "loss": 1.4709, + "step": 35246 + }, + { + "epoch": 2.77, + "learning_rate": 4.203796382268887e-06, + "loss": 1.4268, + "step": 35247 + }, + { + "epoch": 2.77, + "learning_rate": 4.200891286942088e-06, + "loss": 1.4533, + "step": 35248 + }, + { + "epoch": 2.77, + "learning_rate": 4.1979871815107705e-06, + "loss": 1.4634, + "step": 35249 + }, + { + "epoch": 2.77, + "learning_rate": 4.195084065994686e-06, + "loss": 1.4288, + "step": 35250 + }, + { + "epoch": 2.77, + "learning_rate": 4.192181940413502e-06, + "loss": 1.4233, + "step": 35251 + }, + { + "epoch": 2.77, + "learning_rate": 4.189280804786938e-06, + "loss": 1.4698, + "step": 35252 + }, + { + "epoch": 2.77, + "learning_rate": 4.1863806591346915e-06, + "loss": 1.4468, + "step": 35253 + }, + { + "epoch": 2.77, + "learning_rate": 4.1834815034764655e-06, + "loss": 1.4568, + "step": 35254 + }, + { + "epoch": 2.77, + "learning_rate": 4.180583337831927e-06, + "loss": 1.4442, + "step": 35255 + }, + { + "epoch": 2.77, + "learning_rate": 4.177686162220745e-06, + "loss": 1.4096, + "step": 35256 + }, + { + "epoch": 2.77, + "learning_rate": 4.174789976662618e-06, + "loss": 1.4515, + "step": 35257 + }, + { + "epoch": 2.77, + "learning_rate": 4.171894781177199e-06, + "loss": 1.4657, + "step": 35258 + }, + { + "epoch": 2.77, + "learning_rate": 4.169000575784121e-06, + "loss": 1.382, + "step": 35259 + }, + { + "epoch": 2.77, + "learning_rate": 4.166107360503051e-06, + "loss": 1.4543, + "step": 35260 + }, + { + "epoch": 2.77, + "learning_rate": 4.163215135353643e-06, + "loss": 1.4276, + "step": 35261 + }, + { + "epoch": 2.77, + "learning_rate": 4.160323900355544e-06, + "loss": 1.466, + "step": 35262 + }, + { + "epoch": 2.77, + "learning_rate": 4.157433655528325e-06, + "loss": 1.4403, + "step": 35263 + }, + { + "epoch": 2.77, + "learning_rate": 4.154544400891685e-06, + "loss": 1.4689, + "step": 35264 + }, + { + "epoch": 2.77, + "learning_rate": 4.151656136465193e-06, + "loss": 1.461, + "step": 35265 + }, + { + "epoch": 2.77, + "learning_rate": 4.1487688622684645e-06, + "loss": 1.4356, + "step": 35266 + }, + { + "epoch": 2.77, + "learning_rate": 4.145882578321102e-06, + "loss": 1.4375, + "step": 35267 + }, + { + "epoch": 2.77, + "learning_rate": 4.142997284642724e-06, + "loss": 1.4275, + "step": 35268 + }, + { + "epoch": 2.78, + "learning_rate": 4.140112981252897e-06, + "loss": 1.4017, + "step": 35269 + }, + { + "epoch": 2.78, + "learning_rate": 4.1372296681712044e-06, + "loss": 1.4839, + "step": 35270 + }, + { + "epoch": 2.78, + "learning_rate": 4.134347345417249e-06, + "loss": 1.444, + "step": 35271 + }, + { + "epoch": 2.78, + "learning_rate": 4.131466013010565e-06, + "loss": 1.5185, + "step": 35272 + }, + { + "epoch": 2.78, + "learning_rate": 4.128585670970719e-06, + "loss": 1.4192, + "step": 35273 + }, + { + "epoch": 2.78, + "learning_rate": 4.125706319317296e-06, + "loss": 1.4414, + "step": 35274 + }, + { + "epoch": 2.78, + "learning_rate": 4.122827958069813e-06, + "loss": 1.4458, + "step": 35275 + }, + { + "epoch": 2.78, + "learning_rate": 4.119950587247839e-06, + "loss": 1.4336, + "step": 35276 + }, + { + "epoch": 2.78, + "learning_rate": 4.117074206870874e-06, + "loss": 1.4559, + "step": 35277 + }, + { + "epoch": 2.78, + "learning_rate": 4.114198816958503e-06, + "loss": 1.4833, + "step": 35278 + }, + { + "epoch": 2.78, + "learning_rate": 4.1113244175302095e-06, + "loss": 1.4507, + "step": 35279 + }, + { + "epoch": 2.78, + "learning_rate": 4.1084510086054954e-06, + "loss": 1.3741, + "step": 35280 + }, + { + "epoch": 2.78, + "learning_rate": 4.105578590203895e-06, + "loss": 1.4592, + "step": 35281 + }, + { + "epoch": 2.78, + "learning_rate": 4.102707162344926e-06, + "loss": 1.4258, + "step": 35282 + }, + { + "epoch": 2.78, + "learning_rate": 4.099836725048039e-06, + "loss": 1.4286, + "step": 35283 + }, + { + "epoch": 2.78, + "learning_rate": 4.096967278332753e-06, + "loss": 1.4437, + "step": 35284 + }, + { + "epoch": 2.78, + "learning_rate": 4.09409882221855e-06, + "loss": 1.4644, + "step": 35285 + }, + { + "epoch": 2.78, + "learning_rate": 4.091231356724884e-06, + "loss": 1.4196, + "step": 35286 + }, + { + "epoch": 2.78, + "learning_rate": 4.0883648818712535e-06, + "loss": 1.4674, + "step": 35287 + }, + { + "epoch": 2.78, + "learning_rate": 4.085499397677095e-06, + "loss": 1.4844, + "step": 35288 + }, + { + "epoch": 2.78, + "learning_rate": 4.082634904161891e-06, + "loss": 1.4409, + "step": 35289 + }, + { + "epoch": 2.78, + "learning_rate": 4.079771401345044e-06, + "loss": 1.4794, + "step": 35290 + }, + { + "epoch": 2.78, + "learning_rate": 4.076908889246022e-06, + "loss": 1.431, + "step": 35291 + }, + { + "epoch": 2.78, + "learning_rate": 4.074047367884292e-06, + "loss": 1.488, + "step": 35292 + }, + { + "epoch": 2.78, + "learning_rate": 4.0711868372792385e-06, + "loss": 1.4693, + "step": 35293 + }, + { + "epoch": 2.78, + "learning_rate": 4.06832729745028e-06, + "loss": 1.4093, + "step": 35294 + }, + { + "epoch": 2.78, + "learning_rate": 4.065468748416867e-06, + "loss": 1.4553, + "step": 35295 + }, + { + "epoch": 2.78, + "learning_rate": 4.062611190198384e-06, + "loss": 1.4587, + "step": 35296 + }, + { + "epoch": 2.78, + "learning_rate": 4.059754622814232e-06, + "loss": 1.3302, + "step": 35297 + }, + { + "epoch": 2.78, + "learning_rate": 4.056899046283812e-06, + "loss": 1.4627, + "step": 35298 + }, + { + "epoch": 2.78, + "learning_rate": 4.05404446062651e-06, + "loss": 1.4454, + "step": 35299 + }, + { + "epoch": 2.78, + "learning_rate": 4.051190865861709e-06, + "loss": 1.4605, + "step": 35300 + }, + { + "epoch": 2.78, + "learning_rate": 4.048338262008777e-06, + "loss": 1.4146, + "step": 35301 + }, + { + "epoch": 2.78, + "learning_rate": 4.0454866490870985e-06, + "loss": 1.422, + "step": 35302 + }, + { + "epoch": 2.78, + "learning_rate": 4.042636027115992e-06, + "loss": 1.4842, + "step": 35303 + }, + { + "epoch": 2.78, + "learning_rate": 4.039786396114858e-06, + "loss": 1.4749, + "step": 35304 + }, + { + "epoch": 2.78, + "learning_rate": 4.036937756103031e-06, + "loss": 1.4306, + "step": 35305 + }, + { + "epoch": 2.78, + "learning_rate": 4.034090107099846e-06, + "loss": 1.4484, + "step": 35306 + }, + { + "epoch": 2.78, + "learning_rate": 4.031243449124621e-06, + "loss": 1.4923, + "step": 35307 + }, + { + "epoch": 2.78, + "learning_rate": 4.028397782196724e-06, + "loss": 1.4409, + "step": 35308 + }, + { + "epoch": 2.78, + "learning_rate": 4.025553106335439e-06, + "loss": 1.3835, + "step": 35309 + }, + { + "epoch": 2.78, + "learning_rate": 4.0227094215600995e-06, + "loss": 1.4481, + "step": 35310 + }, + { + "epoch": 2.78, + "learning_rate": 4.019866727890008e-06, + "loss": 1.4478, + "step": 35311 + }, + { + "epoch": 2.78, + "learning_rate": 4.0170250253444666e-06, + "loss": 1.4629, + "step": 35312 + }, + { + "epoch": 2.78, + "learning_rate": 4.0141843139427585e-06, + "loss": 1.4391, + "step": 35313 + }, + { + "epoch": 2.78, + "learning_rate": 4.0113445937041685e-06, + "loss": 1.4384, + "step": 35314 + }, + { + "epoch": 2.78, + "learning_rate": 4.008505864647999e-06, + "loss": 1.4805, + "step": 35315 + }, + { + "epoch": 2.78, + "learning_rate": 4.005668126793515e-06, + "loss": 1.452, + "step": 35316 + }, + { + "epoch": 2.78, + "learning_rate": 4.0028313801599545e-06, + "loss": 1.4622, + "step": 35317 + }, + { + "epoch": 2.78, + "learning_rate": 3.9999956247666165e-06, + "loss": 1.4371, + "step": 35318 + }, + { + "epoch": 2.78, + "learning_rate": 3.9971608606327365e-06, + "loss": 1.3884, + "step": 35319 + }, + { + "epoch": 2.78, + "learning_rate": 3.994327087777566e-06, + "loss": 1.4693, + "step": 35320 + }, + { + "epoch": 2.78, + "learning_rate": 3.991494306220339e-06, + "loss": 1.4531, + "step": 35321 + }, + { + "epoch": 2.78, + "learning_rate": 3.988662515980273e-06, + "loss": 1.3954, + "step": 35322 + }, + { + "epoch": 2.78, + "learning_rate": 3.985831717076638e-06, + "loss": 1.3814, + "step": 35323 + }, + { + "epoch": 2.78, + "learning_rate": 3.983001909528616e-06, + "loss": 1.4154, + "step": 35324 + }, + { + "epoch": 2.78, + "learning_rate": 3.980173093355443e-06, + "loss": 1.4453, + "step": 35325 + }, + { + "epoch": 2.78, + "learning_rate": 3.977345268576321e-06, + "loss": 1.4274, + "step": 35326 + }, + { + "epoch": 2.78, + "learning_rate": 3.974518435210416e-06, + "loss": 1.4703, + "step": 35327 + }, + { + "epoch": 2.78, + "learning_rate": 3.971692593276965e-06, + "loss": 1.4521, + "step": 35328 + }, + { + "epoch": 2.78, + "learning_rate": 3.968867742795151e-06, + "loss": 1.4033, + "step": 35329 + }, + { + "epoch": 2.78, + "learning_rate": 3.966043883784125e-06, + "loss": 1.4444, + "step": 35330 + }, + { + "epoch": 2.78, + "learning_rate": 3.9632210162630575e-06, + "loss": 1.5305, + "step": 35331 + }, + { + "epoch": 2.78, + "learning_rate": 3.960399140251147e-06, + "loss": 1.436, + "step": 35332 + }, + { + "epoch": 2.78, + "learning_rate": 3.957578255767529e-06, + "loss": 1.4533, + "step": 35333 + }, + { + "epoch": 2.78, + "learning_rate": 3.954758362831356e-06, + "loss": 1.4468, + "step": 35334 + }, + { + "epoch": 2.78, + "learning_rate": 3.951939461461778e-06, + "loss": 1.4637, + "step": 35335 + }, + { + "epoch": 2.78, + "learning_rate": 3.949121551677964e-06, + "loss": 1.4667, + "step": 35336 + }, + { + "epoch": 2.78, + "learning_rate": 3.946304633498981e-06, + "loss": 1.3603, + "step": 35337 + }, + { + "epoch": 2.78, + "learning_rate": 3.943488706943998e-06, + "loss": 1.4235, + "step": 35338 + }, + { + "epoch": 2.78, + "learning_rate": 3.940673772032133e-06, + "loss": 1.458, + "step": 35339 + }, + { + "epoch": 2.78, + "learning_rate": 3.937859828782486e-06, + "loss": 1.4726, + "step": 35340 + }, + { + "epoch": 2.78, + "learning_rate": 3.935046877214177e-06, + "loss": 1.4611, + "step": 35341 + }, + { + "epoch": 2.78, + "learning_rate": 3.932234917346289e-06, + "loss": 1.4795, + "step": 35342 + }, + { + "epoch": 2.78, + "learning_rate": 3.929423949197924e-06, + "loss": 1.4456, + "step": 35343 + }, + { + "epoch": 2.78, + "learning_rate": 3.926613972788151e-06, + "loss": 1.4485, + "step": 35344 + }, + { + "epoch": 2.78, + "learning_rate": 3.92380498813607e-06, + "loss": 1.4668, + "step": 35345 + }, + { + "epoch": 2.78, + "learning_rate": 3.920996995260733e-06, + "loss": 1.4359, + "step": 35346 + }, + { + "epoch": 2.78, + "learning_rate": 3.918189994181225e-06, + "loss": 1.4831, + "step": 35347 + }, + { + "epoch": 2.78, + "learning_rate": 3.915383984916581e-06, + "loss": 1.4411, + "step": 35348 + }, + { + "epoch": 2.78, + "learning_rate": 3.912578967485868e-06, + "loss": 1.4106, + "step": 35349 + }, + { + "epoch": 2.78, + "learning_rate": 3.9097749419081225e-06, + "loss": 1.4501, + "step": 35350 + }, + { + "epoch": 2.78, + "learning_rate": 3.9069719082023775e-06, + "loss": 1.4337, + "step": 35351 + }, + { + "epoch": 2.78, + "learning_rate": 3.904169866387702e-06, + "loss": 1.3529, + "step": 35352 + }, + { + "epoch": 2.78, + "learning_rate": 3.901368816483081e-06, + "loss": 1.4215, + "step": 35353 + }, + { + "epoch": 2.78, + "learning_rate": 3.898568758507514e-06, + "loss": 1.4204, + "step": 35354 + }, + { + "epoch": 2.78, + "learning_rate": 3.895769692480055e-06, + "loss": 1.4569, + "step": 35355 + }, + { + "epoch": 2.78, + "learning_rate": 3.892971618419705e-06, + "loss": 1.4193, + "step": 35356 + }, + { + "epoch": 2.78, + "learning_rate": 3.890174536345431e-06, + "loss": 1.4501, + "step": 35357 + }, + { + "epoch": 2.78, + "learning_rate": 3.8873784462762515e-06, + "loss": 1.4317, + "step": 35358 + }, + { + "epoch": 2.78, + "learning_rate": 3.884583348231135e-06, + "loss": 1.4536, + "step": 35359 + }, + { + "epoch": 2.78, + "learning_rate": 3.881789242229083e-06, + "loss": 1.398, + "step": 35360 + }, + { + "epoch": 2.78, + "learning_rate": 3.8789961282890305e-06, + "loss": 1.4447, + "step": 35361 + }, + { + "epoch": 2.78, + "learning_rate": 3.876204006429961e-06, + "loss": 1.4218, + "step": 35362 + }, + { + "epoch": 2.78, + "learning_rate": 3.873412876670829e-06, + "loss": 1.4988, + "step": 35363 + }, + { + "epoch": 2.78, + "learning_rate": 3.870622739030582e-06, + "loss": 1.3944, + "step": 35364 + }, + { + "epoch": 2.78, + "learning_rate": 3.867833593528175e-06, + "loss": 1.4752, + "step": 35365 + }, + { + "epoch": 2.78, + "learning_rate": 3.865045440182541e-06, + "loss": 1.4212, + "step": 35366 + }, + { + "epoch": 2.78, + "learning_rate": 3.862258279012598e-06, + "loss": 1.4688, + "step": 35367 + }, + { + "epoch": 2.78, + "learning_rate": 3.859472110037248e-06, + "loss": 1.4593, + "step": 35368 + }, + { + "epoch": 2.78, + "learning_rate": 3.85668693327546e-06, + "loss": 1.4367, + "step": 35369 + }, + { + "epoch": 2.78, + "learning_rate": 3.853902748746118e-06, + "loss": 1.4922, + "step": 35370 + }, + { + "epoch": 2.78, + "learning_rate": 3.851119556468124e-06, + "loss": 1.4057, + "step": 35371 + }, + { + "epoch": 2.78, + "learning_rate": 3.848337356460379e-06, + "loss": 1.447, + "step": 35372 + }, + { + "epoch": 2.78, + "learning_rate": 3.845556148741769e-06, + "loss": 1.4835, + "step": 35373 + }, + { + "epoch": 2.78, + "learning_rate": 3.842775933331177e-06, + "loss": 1.4592, + "step": 35374 + }, + { + "epoch": 2.78, + "learning_rate": 3.839996710247472e-06, + "loss": 1.3919, + "step": 35375 + }, + { + "epoch": 2.78, + "learning_rate": 3.837218479509557e-06, + "loss": 1.4306, + "step": 35376 + }, + { + "epoch": 2.78, + "learning_rate": 3.834441241136249e-06, + "loss": 1.427, + "step": 35377 + }, + { + "epoch": 2.78, + "learning_rate": 3.831664995146416e-06, + "loss": 1.4808, + "step": 35378 + }, + { + "epoch": 2.78, + "learning_rate": 3.828889741558943e-06, + "loss": 1.4155, + "step": 35379 + }, + { + "epoch": 2.78, + "learning_rate": 3.826115480392633e-06, + "loss": 1.4656, + "step": 35380 + }, + { + "epoch": 2.78, + "learning_rate": 3.8233422116663195e-06, + "loss": 1.4294, + "step": 35381 + }, + { + "epoch": 2.78, + "learning_rate": 3.820569935398854e-06, + "loss": 1.4498, + "step": 35382 + }, + { + "epoch": 2.78, + "learning_rate": 3.817798651609055e-06, + "loss": 1.415, + "step": 35383 + }, + { + "epoch": 2.78, + "learning_rate": 3.815028360315742e-06, + "loss": 1.4537, + "step": 35384 + }, + { + "epoch": 2.78, + "learning_rate": 3.8122590615376812e-06, + "loss": 1.4619, + "step": 35385 + }, + { + "epoch": 2.78, + "learning_rate": 3.8094907552937258e-06, + "loss": 1.4378, + "step": 35386 + }, + { + "epoch": 2.78, + "learning_rate": 3.806723441602677e-06, + "loss": 1.4295, + "step": 35387 + }, + { + "epoch": 2.78, + "learning_rate": 3.8039571204832863e-06, + "loss": 1.4377, + "step": 35388 + }, + { + "epoch": 2.78, + "learning_rate": 3.801191791954322e-06, + "loss": 1.4095, + "step": 35389 + }, + { + "epoch": 2.78, + "learning_rate": 3.7984274560346195e-06, + "loss": 1.4402, + "step": 35390 + }, + { + "epoch": 2.78, + "learning_rate": 3.7956641127429133e-06, + "loss": 1.4837, + "step": 35391 + }, + { + "epoch": 2.78, + "learning_rate": 3.7929017620979386e-06, + "loss": 1.4806, + "step": 35392 + }, + { + "epoch": 2.78, + "learning_rate": 3.790140404118497e-06, + "loss": 1.452, + "step": 35393 + }, + { + "epoch": 2.78, + "learning_rate": 3.7873800388233234e-06, + "loss": 1.4479, + "step": 35394 + }, + { + "epoch": 2.78, + "learning_rate": 3.7846206662311197e-06, + "loss": 1.4576, + "step": 35395 + }, + { + "epoch": 2.79, + "learning_rate": 3.7818622863606873e-06, + "loss": 1.4284, + "step": 35396 + }, + { + "epoch": 2.79, + "learning_rate": 3.7791048992307115e-06, + "loss": 1.3846, + "step": 35397 + }, + { + "epoch": 2.79, + "learning_rate": 3.7763485048599107e-06, + "loss": 1.5076, + "step": 35398 + }, + { + "epoch": 2.79, + "learning_rate": 3.7735931032670198e-06, + "loss": 1.4451, + "step": 35399 + }, + { + "epoch": 2.79, + "learning_rate": 3.77083869447074e-06, + "loss": 1.399, + "step": 35400 + }, + { + "epoch": 2.79, + "learning_rate": 3.7680852784897576e-06, + "loss": 1.4201, + "step": 35401 + }, + { + "epoch": 2.79, + "learning_rate": 3.7653328553427896e-06, + "loss": 1.4616, + "step": 35402 + }, + { + "epoch": 2.79, + "learning_rate": 3.7625814250485054e-06, + "loss": 1.4512, + "step": 35403 + }, + { + "epoch": 2.79, + "learning_rate": 3.759830987625606e-06, + "loss": 1.5024, + "step": 35404 + }, + { + "epoch": 2.79, + "learning_rate": 3.757081543092744e-06, + "loss": 1.495, + "step": 35405 + }, + { + "epoch": 2.79, + "learning_rate": 3.7543330914685863e-06, + "loss": 1.4088, + "step": 35406 + }, + { + "epoch": 2.79, + "learning_rate": 3.7515856327718196e-06, + "loss": 1.4468, + "step": 35407 + }, + { + "epoch": 2.79, + "learning_rate": 3.7488391670210783e-06, + "loss": 1.4425, + "step": 35408 + }, + { + "epoch": 2.79, + "learning_rate": 3.7460936942349972e-06, + "loss": 1.4294, + "step": 35409 + }, + { + "epoch": 2.79, + "learning_rate": 3.7433492144322284e-06, + "loss": 1.4543, + "step": 35410 + }, + { + "epoch": 2.79, + "learning_rate": 3.740605727631424e-06, + "loss": 1.4631, + "step": 35411 + }, + { + "epoch": 2.79, + "learning_rate": 3.737863233851185e-06, + "loss": 1.4503, + "step": 35412 + }, + { + "epoch": 2.79, + "learning_rate": 3.735121733110147e-06, + "loss": 1.4378, + "step": 35413 + }, + { + "epoch": 2.79, + "learning_rate": 3.7323812254269114e-06, + "loss": 1.3899, + "step": 35414 + }, + { + "epoch": 2.79, + "learning_rate": 3.7296417108200805e-06, + "loss": 1.4473, + "step": 35415 + }, + { + "epoch": 2.79, + "learning_rate": 3.726903189308256e-06, + "loss": 1.4132, + "step": 35416 + }, + { + "epoch": 2.79, + "learning_rate": 3.7241656609100723e-06, + "loss": 1.4576, + "step": 35417 + }, + { + "epoch": 2.79, + "learning_rate": 3.7214291256440654e-06, + "loss": 1.4936, + "step": 35418 + }, + { + "epoch": 2.79, + "learning_rate": 3.7186935835288202e-06, + "loss": 1.4425, + "step": 35419 + }, + { + "epoch": 2.79, + "learning_rate": 3.715959034582938e-06, + "loss": 1.4067, + "step": 35420 + }, + { + "epoch": 2.79, + "learning_rate": 3.7132254788249717e-06, + "loss": 1.4426, + "step": 35421 + }, + { + "epoch": 2.79, + "learning_rate": 3.7104929162734553e-06, + "loss": 1.3846, + "step": 35422 + }, + { + "epoch": 2.79, + "learning_rate": 3.707761346946975e-06, + "loss": 1.4264, + "step": 35423 + }, + { + "epoch": 2.79, + "learning_rate": 3.7050307708640648e-06, + "loss": 1.4555, + "step": 35424 + }, + { + "epoch": 2.79, + "learning_rate": 3.7023011880432772e-06, + "loss": 1.4204, + "step": 35425 + }, + { + "epoch": 2.79, + "learning_rate": 3.699572598503098e-06, + "loss": 1.453, + "step": 35426 + }, + { + "epoch": 2.79, + "learning_rate": 3.696845002262111e-06, + "loss": 1.4485, + "step": 35427 + }, + { + "epoch": 2.79, + "learning_rate": 3.6941183993388024e-06, + "loss": 1.4647, + "step": 35428 + }, + { + "epoch": 2.79, + "learning_rate": 3.6913927897516904e-06, + "loss": 1.4167, + "step": 35429 + }, + { + "epoch": 2.79, + "learning_rate": 3.688668173519277e-06, + "loss": 1.4243, + "step": 35430 + }, + { + "epoch": 2.79, + "learning_rate": 3.6859445506600803e-06, + "loss": 1.4485, + "step": 35431 + }, + { + "epoch": 2.79, + "learning_rate": 3.683221921192553e-06, + "loss": 1.4742, + "step": 35432 + }, + { + "epoch": 2.79, + "learning_rate": 3.680500285135213e-06, + "loss": 1.3931, + "step": 35433 + }, + { + "epoch": 2.79, + "learning_rate": 3.6777796425065454e-06, + "loss": 1.4493, + "step": 35434 + }, + { + "epoch": 2.79, + "learning_rate": 3.6750599933250025e-06, + "loss": 1.4198, + "step": 35435 + }, + { + "epoch": 2.79, + "learning_rate": 3.672341337609036e-06, + "loss": 1.4799, + "step": 35436 + }, + { + "epoch": 2.79, + "learning_rate": 3.6696236753771478e-06, + "loss": 1.4829, + "step": 35437 + }, + { + "epoch": 2.79, + "learning_rate": 3.666907006647757e-06, + "loss": 1.4959, + "step": 35438 + }, + { + "epoch": 2.79, + "learning_rate": 3.664191331439298e-06, + "loss": 1.4664, + "step": 35439 + }, + { + "epoch": 2.79, + "learning_rate": 3.6614766497702396e-06, + "loss": 1.4402, + "step": 35440 + }, + { + "epoch": 2.79, + "learning_rate": 3.6587629616589842e-06, + "loss": 1.4098, + "step": 35441 + }, + { + "epoch": 2.79, + "learning_rate": 3.6560502671239833e-06, + "loss": 1.4622, + "step": 35442 + }, + { + "epoch": 2.79, + "learning_rate": 3.653338566183639e-06, + "loss": 1.4612, + "step": 35443 + }, + { + "epoch": 2.79, + "learning_rate": 3.6506278588563697e-06, + "loss": 1.4858, + "step": 35444 + }, + { + "epoch": 2.79, + "learning_rate": 3.647918145160578e-06, + "loss": 1.4623, + "step": 35445 + }, + { + "epoch": 2.79, + "learning_rate": 3.645209425114631e-06, + "loss": 1.4113, + "step": 35446 + }, + { + "epoch": 2.79, + "learning_rate": 3.642501698736966e-06, + "loss": 1.4673, + "step": 35447 + }, + { + "epoch": 2.79, + "learning_rate": 3.6397949660459503e-06, + "loss": 1.3848, + "step": 35448 + }, + { + "epoch": 2.79, + "learning_rate": 3.637089227059953e-06, + "loss": 1.4274, + "step": 35449 + }, + { + "epoch": 2.79, + "learning_rate": 3.6343844817973424e-06, + "loss": 1.4311, + "step": 35450 + }, + { + "epoch": 2.79, + "learning_rate": 3.631680730276504e-06, + "loss": 1.491, + "step": 35451 + }, + { + "epoch": 2.79, + "learning_rate": 3.6289779725157897e-06, + "loss": 1.4357, + "step": 35452 + }, + { + "epoch": 2.79, + "learning_rate": 3.6262762085335185e-06, + "loss": 1.4191, + "step": 35453 + }, + { + "epoch": 2.79, + "learning_rate": 3.6235754383480585e-06, + "loss": 1.4054, + "step": 35454 + }, + { + "epoch": 2.79, + "learning_rate": 3.6208756619777624e-06, + "loss": 1.4516, + "step": 35455 + }, + { + "epoch": 2.79, + "learning_rate": 3.618176879440915e-06, + "loss": 1.4047, + "step": 35456 + }, + { + "epoch": 2.79, + "learning_rate": 3.6154790907559016e-06, + "loss": 1.4276, + "step": 35457 + }, + { + "epoch": 2.79, + "learning_rate": 3.6127822959409746e-06, + "loss": 1.4718, + "step": 35458 + }, + { + "epoch": 2.79, + "learning_rate": 3.6100864950145027e-06, + "loss": 1.4214, + "step": 35459 + }, + { + "epoch": 2.79, + "learning_rate": 3.6073916879947208e-06, + "loss": 1.4807, + "step": 35460 + }, + { + "epoch": 2.79, + "learning_rate": 3.604697874899981e-06, + "loss": 1.4816, + "step": 35461 + }, + { + "epoch": 2.79, + "learning_rate": 3.602005055748569e-06, + "loss": 1.4393, + "step": 35462 + }, + { + "epoch": 2.79, + "learning_rate": 3.5993132305587202e-06, + "loss": 1.424, + "step": 35463 + }, + { + "epoch": 2.79, + "learning_rate": 3.596622399348753e-06, + "loss": 1.4717, + "step": 35464 + }, + { + "epoch": 2.79, + "learning_rate": 3.593932562136953e-06, + "loss": 1.483, + "step": 35465 + }, + { + "epoch": 2.79, + "learning_rate": 3.591243718941539e-06, + "loss": 1.447, + "step": 35466 + }, + { + "epoch": 2.79, + "learning_rate": 3.5885558697807795e-06, + "loss": 1.4389, + "step": 35467 + }, + { + "epoch": 2.79, + "learning_rate": 3.585869014672943e-06, + "loss": 1.4093, + "step": 35468 + }, + { + "epoch": 2.79, + "learning_rate": 3.5831831536362654e-06, + "loss": 1.4178, + "step": 35469 + }, + { + "epoch": 2.79, + "learning_rate": 3.580498286688949e-06, + "loss": 1.4337, + "step": 35470 + }, + { + "epoch": 2.79, + "learning_rate": 3.5778144138492614e-06, + "loss": 1.453, + "step": 35471 + }, + { + "epoch": 2.79, + "learning_rate": 3.575131535135423e-06, + "loss": 1.4568, + "step": 35472 + }, + { + "epoch": 2.79, + "learning_rate": 3.5724496505656175e-06, + "loss": 1.4691, + "step": 35473 + }, + { + "epoch": 2.79, + "learning_rate": 3.5697687601580816e-06, + "loss": 1.4596, + "step": 35474 + }, + { + "epoch": 2.79, + "learning_rate": 3.5670888639310167e-06, + "loss": 1.447, + "step": 35475 + }, + { + "epoch": 2.79, + "learning_rate": 3.564409961902592e-06, + "loss": 1.4439, + "step": 35476 + }, + { + "epoch": 2.79, + "learning_rate": 3.5617320540910266e-06, + "loss": 1.4527, + "step": 35477 + }, + { + "epoch": 2.79, + "learning_rate": 3.5590551405144885e-06, + "loss": 1.4279, + "step": 35478 + }, + { + "epoch": 2.79, + "learning_rate": 3.556379221191147e-06, + "loss": 1.4577, + "step": 35479 + }, + { + "epoch": 2.79, + "learning_rate": 3.5537042961391703e-06, + "loss": 1.4514, + "step": 35480 + }, + { + "epoch": 2.79, + "learning_rate": 3.5510303653767445e-06, + "loss": 1.4293, + "step": 35481 + }, + { + "epoch": 2.79, + "learning_rate": 3.548357428922005e-06, + "loss": 1.3958, + "step": 35482 + }, + { + "epoch": 2.79, + "learning_rate": 3.5456854867930874e-06, + "loss": 1.4455, + "step": 35483 + }, + { + "epoch": 2.79, + "learning_rate": 3.543014539008143e-06, + "loss": 1.5019, + "step": 35484 + }, + { + "epoch": 2.79, + "learning_rate": 3.5403445855853252e-06, + "loss": 1.4469, + "step": 35485 + }, + { + "epoch": 2.79, + "learning_rate": 3.5376756265427354e-06, + "loss": 1.4395, + "step": 35486 + }, + { + "epoch": 2.79, + "learning_rate": 3.5350076618984925e-06, + "loss": 1.4067, + "step": 35487 + }, + { + "epoch": 2.79, + "learning_rate": 3.532340691670732e-06, + "loss": 1.4167, + "step": 35488 + }, + { + "epoch": 2.79, + "learning_rate": 3.5296747158775563e-06, + "loss": 1.4505, + "step": 35489 + }, + { + "epoch": 2.79, + "learning_rate": 3.527009734537051e-06, + "loss": 1.4427, + "step": 35490 + }, + { + "epoch": 2.79, + "learning_rate": 3.5243457476673174e-06, + "loss": 1.4468, + "step": 35491 + }, + { + "epoch": 2.79, + "learning_rate": 3.5216827552864592e-06, + "loss": 1.436, + "step": 35492 + }, + { + "epoch": 2.79, + "learning_rate": 3.5190207574125274e-06, + "loss": 1.392, + "step": 35493 + }, + { + "epoch": 2.79, + "learning_rate": 3.5163597540636078e-06, + "loss": 1.4102, + "step": 35494 + }, + { + "epoch": 2.79, + "learning_rate": 3.5136997452577696e-06, + "loss": 1.4672, + "step": 35495 + }, + { + "epoch": 2.79, + "learning_rate": 3.5110407310130816e-06, + "loss": 1.4687, + "step": 35496 + }, + { + "epoch": 2.79, + "learning_rate": 3.5083827113475793e-06, + "loss": 1.4028, + "step": 35497 + }, + { + "epoch": 2.79, + "learning_rate": 3.5057256862793315e-06, + "loss": 1.3887, + "step": 35498 + }, + { + "epoch": 2.79, + "learning_rate": 3.503069655826357e-06, + "loss": 1.4524, + "step": 35499 + }, + { + "epoch": 2.79, + "learning_rate": 3.5004146200066916e-06, + "loss": 1.4184, + "step": 35500 + }, + { + "epoch": 2.79, + "learning_rate": 3.4977605788383713e-06, + "loss": 1.3881, + "step": 35501 + }, + { + "epoch": 2.79, + "learning_rate": 3.4951075323393972e-06, + "loss": 1.4031, + "step": 35502 + }, + { + "epoch": 2.79, + "learning_rate": 3.4924554805278225e-06, + "loss": 1.4654, + "step": 35503 + }, + { + "epoch": 2.79, + "learning_rate": 3.4898044234215993e-06, + "loss": 1.4497, + "step": 35504 + }, + { + "epoch": 2.79, + "learning_rate": 3.487154361038763e-06, + "loss": 1.506, + "step": 35505 + }, + { + "epoch": 2.79, + "learning_rate": 3.4845052933972994e-06, + "loss": 1.4859, + "step": 35506 + }, + { + "epoch": 2.79, + "learning_rate": 3.481857220515177e-06, + "loss": 1.447, + "step": 35507 + }, + { + "epoch": 2.79, + "learning_rate": 3.479210142410399e-06, + "loss": 1.4727, + "step": 35508 + }, + { + "epoch": 2.79, + "learning_rate": 3.4765640591009338e-06, + "loss": 1.407, + "step": 35509 + }, + { + "epoch": 2.79, + "learning_rate": 3.4739189706047166e-06, + "loss": 1.3684, + "step": 35510 + }, + { + "epoch": 2.79, + "learning_rate": 3.4712748769397335e-06, + "loss": 1.46, + "step": 35511 + }, + { + "epoch": 2.79, + "learning_rate": 3.4686317781239535e-06, + "loss": 1.4737, + "step": 35512 + }, + { + "epoch": 2.79, + "learning_rate": 3.4659896741752955e-06, + "loss": 1.4056, + "step": 35513 + }, + { + "epoch": 2.79, + "learning_rate": 3.4633485651116955e-06, + "loss": 1.4674, + "step": 35514 + }, + { + "epoch": 2.79, + "learning_rate": 3.460708450951105e-06, + "loss": 1.4681, + "step": 35515 + }, + { + "epoch": 2.79, + "learning_rate": 3.458069331711427e-06, + "loss": 1.4654, + "step": 35516 + }, + { + "epoch": 2.79, + "learning_rate": 3.4554312074105804e-06, + "loss": 1.4281, + "step": 35517 + }, + { + "epoch": 2.79, + "learning_rate": 3.4527940780665007e-06, + "loss": 1.4346, + "step": 35518 + }, + { + "epoch": 2.79, + "learning_rate": 3.4501579436970904e-06, + "loss": 1.5012, + "step": 35519 + }, + { + "epoch": 2.79, + "learning_rate": 3.4475228043202184e-06, + "loss": 1.4602, + "step": 35520 + }, + { + "epoch": 2.79, + "learning_rate": 3.4448886599537874e-06, + "loss": 1.4221, + "step": 35521 + }, + { + "epoch": 2.79, + "learning_rate": 3.442255510615699e-06, + "loss": 1.4892, + "step": 35522 + }, + { + "epoch": 2.79, + "learning_rate": 3.439623356323823e-06, + "loss": 1.4641, + "step": 35523 + }, + { + "epoch": 2.8, + "learning_rate": 3.4369921970959945e-06, + "loss": 1.4374, + "step": 35524 + }, + { + "epoch": 2.8, + "learning_rate": 3.434362032950133e-06, + "loss": 1.4771, + "step": 35525 + }, + { + "epoch": 2.8, + "learning_rate": 3.4317328639040743e-06, + "loss": 1.4734, + "step": 35526 + }, + { + "epoch": 2.8, + "learning_rate": 3.4291046899756535e-06, + "loss": 1.4268, + "step": 35527 + }, + { + "epoch": 2.8, + "learning_rate": 3.4264775111827236e-06, + "loss": 1.3813, + "step": 35528 + }, + { + "epoch": 2.8, + "learning_rate": 3.4238513275431367e-06, + "loss": 1.4224, + "step": 35529 + }, + { + "epoch": 2.8, + "learning_rate": 3.4212261390747286e-06, + "loss": 1.4098, + "step": 35530 + }, + { + "epoch": 2.8, + "learning_rate": 3.4186019457952686e-06, + "loss": 1.4177, + "step": 35531 + }, + { + "epoch": 2.8, + "learning_rate": 3.415978747722642e-06, + "loss": 1.4471, + "step": 35532 + }, + { + "epoch": 2.8, + "learning_rate": 3.413356544874618e-06, + "loss": 1.4356, + "step": 35533 + }, + { + "epoch": 2.8, + "learning_rate": 3.4107353372689994e-06, + "loss": 1.4282, + "step": 35534 + }, + { + "epoch": 2.8, + "learning_rate": 3.408115124923605e-06, + "loss": 1.4964, + "step": 35535 + }, + { + "epoch": 2.8, + "learning_rate": 3.4054959078562206e-06, + "loss": 1.368, + "step": 35536 + }, + { + "epoch": 2.8, + "learning_rate": 3.402877686084615e-06, + "loss": 1.4923, + "step": 35537 + }, + { + "epoch": 2.8, + "learning_rate": 3.400260459626558e-06, + "loss": 1.4674, + "step": 35538 + }, + { + "epoch": 2.8, + "learning_rate": 3.3976442284998352e-06, + "loss": 1.4572, + "step": 35539 + }, + { + "epoch": 2.8, + "learning_rate": 3.3950289927222318e-06, + "loss": 1.4164, + "step": 35540 + }, + { + "epoch": 2.8, + "learning_rate": 3.392414752311434e-06, + "loss": 1.4658, + "step": 35541 + }, + { + "epoch": 2.8, + "learning_rate": 3.3898015072852614e-06, + "loss": 1.4854, + "step": 35542 + }, + { + "epoch": 2.8, + "learning_rate": 3.387189257661432e-06, + "loss": 1.4042, + "step": 35543 + }, + { + "epoch": 2.8, + "learning_rate": 3.384578003457683e-06, + "loss": 1.5157, + "step": 35544 + }, + { + "epoch": 2.8, + "learning_rate": 3.3819677446917158e-06, + "loss": 1.44, + "step": 35545 + }, + { + "epoch": 2.8, + "learning_rate": 3.3793584813813e-06, + "loss": 1.4259, + "step": 35546 + }, + { + "epoch": 2.8, + "learning_rate": 3.3767502135441383e-06, + "loss": 1.4246, + "step": 35547 + }, + { + "epoch": 2.8, + "learning_rate": 3.3741429411978993e-06, + "loss": 1.4684, + "step": 35548 + }, + { + "epoch": 2.8, + "learning_rate": 3.3715366643603357e-06, + "loss": 1.4825, + "step": 35549 + }, + { + "epoch": 2.8, + "learning_rate": 3.368931383049117e-06, + "loss": 1.4811, + "step": 35550 + }, + { + "epoch": 2.8, + "learning_rate": 3.3663270972819288e-06, + "loss": 1.4549, + "step": 35551 + }, + { + "epoch": 2.8, + "learning_rate": 3.3637238070764737e-06, + "loss": 1.4062, + "step": 35552 + }, + { + "epoch": 2.8, + "learning_rate": 3.3611215124504043e-06, + "loss": 1.3899, + "step": 35553 + }, + { + "epoch": 2.8, + "learning_rate": 3.358520213421406e-06, + "loss": 1.4569, + "step": 35554 + }, + { + "epoch": 2.8, + "learning_rate": 3.355919910007132e-06, + "loss": 1.477, + "step": 35555 + }, + { + "epoch": 2.8, + "learning_rate": 3.3533206022252347e-06, + "loss": 1.442, + "step": 35556 + }, + { + "epoch": 2.8, + "learning_rate": 3.350722290093366e-06, + "loss": 1.4638, + "step": 35557 + }, + { + "epoch": 2.8, + "learning_rate": 3.348124973629146e-06, + "loss": 1.4855, + "step": 35558 + }, + { + "epoch": 2.8, + "learning_rate": 3.345528652850227e-06, + "loss": 1.425, + "step": 35559 + }, + { + "epoch": 2.8, + "learning_rate": 3.342933327774261e-06, + "loss": 1.5128, + "step": 35560 + }, + { + "epoch": 2.8, + "learning_rate": 3.3403389984188513e-06, + "loss": 1.4442, + "step": 35561 + }, + { + "epoch": 2.8, + "learning_rate": 3.337745664801583e-06, + "loss": 1.388, + "step": 35562 + }, + { + "epoch": 2.8, + "learning_rate": 3.3351533269400932e-06, + "loss": 1.4693, + "step": 35563 + }, + { + "epoch": 2.8, + "learning_rate": 3.3325619848519837e-06, + "loss": 1.4039, + "step": 35564 + }, + { + "epoch": 2.8, + "learning_rate": 3.3299716385548236e-06, + "loss": 1.4623, + "step": 35565 + }, + { + "epoch": 2.8, + "learning_rate": 3.3273822880662327e-06, + "loss": 1.4101, + "step": 35566 + }, + { + "epoch": 2.8, + "learning_rate": 3.32479393340378e-06, + "loss": 1.4102, + "step": 35567 + }, + { + "epoch": 2.8, + "learning_rate": 3.3222065745850178e-06, + "loss": 1.4044, + "step": 35568 + }, + { + "epoch": 2.8, + "learning_rate": 3.3196202116275494e-06, + "loss": 1.419, + "step": 35569 + }, + { + "epoch": 2.8, + "learning_rate": 3.3170348445489103e-06, + "loss": 1.4357, + "step": 35570 + }, + { + "epoch": 2.8, + "learning_rate": 3.3144504733666535e-06, + "loss": 1.427, + "step": 35571 + }, + { + "epoch": 2.8, + "learning_rate": 3.311867098098314e-06, + "loss": 1.4598, + "step": 35572 + }, + { + "epoch": 2.8, + "learning_rate": 3.3092847187614624e-06, + "loss": 1.4593, + "step": 35573 + }, + { + "epoch": 2.8, + "learning_rate": 3.3067033353736173e-06, + "loss": 1.4847, + "step": 35574 + }, + { + "epoch": 2.8, + "learning_rate": 3.304122947952281e-06, + "loss": 1.4485, + "step": 35575 + }, + { + "epoch": 2.8, + "learning_rate": 3.301543556515024e-06, + "loss": 1.4702, + "step": 35576 + }, + { + "epoch": 2.8, + "learning_rate": 3.2989651610793312e-06, + "loss": 1.4532, + "step": 35577 + }, + { + "epoch": 2.8, + "learning_rate": 3.2963877616627223e-06, + "loss": 1.4439, + "step": 35578 + }, + { + "epoch": 2.8, + "learning_rate": 3.29381135828265e-06, + "loss": 1.4389, + "step": 35579 + }, + { + "epoch": 2.8, + "learning_rate": 3.29123595095665e-06, + "loss": 1.4283, + "step": 35580 + }, + { + "epoch": 2.8, + "learning_rate": 3.288661539702209e-06, + "loss": 1.4541, + "step": 35581 + }, + { + "epoch": 2.8, + "learning_rate": 3.2860881245367786e-06, + "loss": 1.4287, + "step": 35582 + }, + { + "epoch": 2.8, + "learning_rate": 3.2835157054778626e-06, + "loss": 1.4198, + "step": 35583 + }, + { + "epoch": 2.8, + "learning_rate": 3.2809442825428966e-06, + "loss": 1.3919, + "step": 35584 + }, + { + "epoch": 2.8, + "learning_rate": 3.27837385574935e-06, + "loss": 1.4265, + "step": 35585 + }, + { + "epoch": 2.8, + "learning_rate": 3.275804425114692e-06, + "loss": 1.4625, + "step": 35586 + }, + { + "epoch": 2.8, + "learning_rate": 3.273235990656359e-06, + "loss": 1.3746, + "step": 35587 + }, + { + "epoch": 2.8, + "learning_rate": 3.270668552391753e-06, + "loss": 1.4535, + "step": 35588 + }, + { + "epoch": 2.8, + "learning_rate": 3.2681021103383443e-06, + "loss": 1.4702, + "step": 35589 + }, + { + "epoch": 2.8, + "learning_rate": 3.2655366645135683e-06, + "loss": 1.4497, + "step": 35590 + }, + { + "epoch": 2.8, + "learning_rate": 3.2629722149348115e-06, + "loss": 1.3907, + "step": 35591 + }, + { + "epoch": 2.8, + "learning_rate": 3.260408761619493e-06, + "loss": 1.4592, + "step": 35592 + }, + { + "epoch": 2.8, + "learning_rate": 3.2578463045850323e-06, + "loss": 1.4195, + "step": 35593 + }, + { + "epoch": 2.8, + "learning_rate": 3.2552848438488157e-06, + "loss": 1.4304, + "step": 35594 + }, + { + "epoch": 2.8, + "learning_rate": 3.2527243794282288e-06, + "loss": 1.4431, + "step": 35595 + }, + { + "epoch": 2.8, + "learning_rate": 3.250164911340658e-06, + "loss": 1.4603, + "step": 35596 + }, + { + "epoch": 2.8, + "learning_rate": 3.2476064396034896e-06, + "loss": 1.4143, + "step": 35597 + }, + { + "epoch": 2.8, + "learning_rate": 3.245048964234093e-06, + "loss": 1.4442, + "step": 35598 + }, + { + "epoch": 2.8, + "learning_rate": 3.2424924852498036e-06, + "loss": 1.4784, + "step": 35599 + }, + { + "epoch": 2.8, + "learning_rate": 3.239937002668025e-06, + "loss": 1.4354, + "step": 35600 + }, + { + "epoch": 2.8, + "learning_rate": 3.237382516506093e-06, + "loss": 1.4101, + "step": 35601 + }, + { + "epoch": 2.8, + "learning_rate": 3.234829026781327e-06, + "loss": 1.4248, + "step": 35602 + }, + { + "epoch": 2.8, + "learning_rate": 3.23227653351108e-06, + "loss": 1.4231, + "step": 35603 + }, + { + "epoch": 2.8, + "learning_rate": 3.229725036712688e-06, + "loss": 1.4337, + "step": 35604 + }, + { + "epoch": 2.8, + "learning_rate": 3.2271745364034708e-06, + "loss": 1.5154, + "step": 35605 + }, + { + "epoch": 2.8, + "learning_rate": 3.2246250326007308e-06, + "loss": 1.4506, + "step": 35606 + }, + { + "epoch": 2.8, + "learning_rate": 3.222076525321804e-06, + "loss": 1.4947, + "step": 35607 + }, + { + "epoch": 2.8, + "learning_rate": 3.219529014583977e-06, + "loss": 1.4476, + "step": 35608 + }, + { + "epoch": 2.8, + "learning_rate": 3.216982500404519e-06, + "loss": 1.4545, + "step": 35609 + }, + { + "epoch": 2.8, + "learning_rate": 3.214436982800783e-06, + "loss": 1.4069, + "step": 35610 + }, + { + "epoch": 2.8, + "learning_rate": 3.2118924617900223e-06, + "loss": 1.4365, + "step": 35611 + }, + { + "epoch": 2.8, + "learning_rate": 3.209348937389489e-06, + "loss": 1.4104, + "step": 35612 + }, + { + "epoch": 2.8, + "learning_rate": 3.206806409616469e-06, + "loss": 1.428, + "step": 35613 + }, + { + "epoch": 2.8, + "learning_rate": 3.204264878488233e-06, + "loss": 1.4228, + "step": 35614 + }, + { + "epoch": 2.8, + "learning_rate": 3.201724344022033e-06, + "loss": 1.4552, + "step": 35615 + }, + { + "epoch": 2.8, + "learning_rate": 3.1991848062351054e-06, + "loss": 1.4273, + "step": 35616 + }, + { + "epoch": 2.8, + "learning_rate": 3.1966462651447033e-06, + "loss": 1.4539, + "step": 35617 + }, + { + "epoch": 2.8, + "learning_rate": 3.1941087207680627e-06, + "loss": 1.457, + "step": 35618 + }, + { + "epoch": 2.8, + "learning_rate": 3.1915721731224033e-06, + "loss": 1.4061, + "step": 35619 + }, + { + "epoch": 2.8, + "learning_rate": 3.189036622224961e-06, + "loss": 1.4182, + "step": 35620 + }, + { + "epoch": 2.8, + "learning_rate": 3.1865020680929388e-06, + "loss": 1.4244, + "step": 35621 + }, + { + "epoch": 2.8, + "learning_rate": 3.1839685107435563e-06, + "loss": 1.459, + "step": 35622 + }, + { + "epoch": 2.8, + "learning_rate": 3.181435950194e-06, + "loss": 1.4321, + "step": 35623 + }, + { + "epoch": 2.8, + "learning_rate": 3.1789043864614726e-06, + "loss": 1.4667, + "step": 35624 + }, + { + "epoch": 2.8, + "learning_rate": 3.176373819563177e-06, + "loss": 1.454, + "step": 35625 + }, + { + "epoch": 2.8, + "learning_rate": 3.1738442495162495e-06, + "loss": 1.4229, + "step": 35626 + }, + { + "epoch": 2.8, + "learning_rate": 3.1713156763379265e-06, + "loss": 1.4645, + "step": 35627 + }, + { + "epoch": 2.8, + "learning_rate": 3.1687881000453274e-06, + "loss": 1.4167, + "step": 35628 + }, + { + "epoch": 2.8, + "learning_rate": 3.166261520655622e-06, + "loss": 1.4863, + "step": 35629 + }, + { + "epoch": 2.8, + "learning_rate": 3.1637359381859797e-06, + "loss": 1.4171, + "step": 35630 + }, + { + "epoch": 2.8, + "learning_rate": 3.1612113526535533e-06, + "loss": 1.4358, + "step": 35631 + }, + { + "epoch": 2.8, + "learning_rate": 3.158687764075446e-06, + "loss": 1.4027, + "step": 35632 + }, + { + "epoch": 2.8, + "learning_rate": 3.1561651724688275e-06, + "loss": 1.4684, + "step": 35633 + }, + { + "epoch": 2.8, + "learning_rate": 3.1536435778508172e-06, + "loss": 1.3878, + "step": 35634 + }, + { + "epoch": 2.8, + "learning_rate": 3.1511229802385187e-06, + "loss": 1.4342, + "step": 35635 + }, + { + "epoch": 2.8, + "learning_rate": 3.1486033796490507e-06, + "loss": 1.4259, + "step": 35636 + }, + { + "epoch": 2.8, + "learning_rate": 3.1460847760995332e-06, + "loss": 1.4397, + "step": 35637 + }, + { + "epoch": 2.8, + "learning_rate": 3.14356716960707e-06, + "loss": 1.462, + "step": 35638 + }, + { + "epoch": 2.8, + "learning_rate": 3.141050560188729e-06, + "loss": 1.4155, + "step": 35639 + }, + { + "epoch": 2.8, + "learning_rate": 3.138534947861615e-06, + "loss": 1.4556, + "step": 35640 + }, + { + "epoch": 2.8, + "learning_rate": 3.1360203326428135e-06, + "loss": 1.4242, + "step": 35641 + }, + { + "epoch": 2.8, + "learning_rate": 3.133506714549394e-06, + "loss": 1.4189, + "step": 35642 + }, + { + "epoch": 2.8, + "learning_rate": 3.1309940935983934e-06, + "loss": 1.4375, + "step": 35643 + }, + { + "epoch": 2.8, + "learning_rate": 3.1284824698069145e-06, + "loss": 1.4714, + "step": 35644 + }, + { + "epoch": 2.8, + "learning_rate": 3.125971843191977e-06, + "loss": 1.4474, + "step": 35645 + }, + { + "epoch": 2.8, + "learning_rate": 3.1234622137706334e-06, + "loss": 1.471, + "step": 35646 + }, + { + "epoch": 2.8, + "learning_rate": 3.1209535815599374e-06, + "loss": 1.4229, + "step": 35647 + }, + { + "epoch": 2.8, + "learning_rate": 3.1184459465769252e-06, + "loss": 1.4617, + "step": 35648 + }, + { + "epoch": 2.8, + "learning_rate": 3.1159393088386e-06, + "loss": 1.4604, + "step": 35649 + }, + { + "epoch": 2.8, + "learning_rate": 3.113433668361964e-06, + "loss": 1.4609, + "step": 35650 + }, + { + "epoch": 2.81, + "learning_rate": 3.1109290251640884e-06, + "loss": 1.4717, + "step": 35651 + }, + { + "epoch": 2.81, + "learning_rate": 3.108425379261925e-06, + "loss": 1.4312, + "step": 35652 + }, + { + "epoch": 2.81, + "learning_rate": 3.1059227306724945e-06, + "loss": 1.3954, + "step": 35653 + }, + { + "epoch": 2.81, + "learning_rate": 3.103421079412782e-06, + "loss": 1.4364, + "step": 35654 + }, + { + "epoch": 2.81, + "learning_rate": 3.1009204254997923e-06, + "loss": 1.4972, + "step": 35655 + }, + { + "epoch": 2.81, + "learning_rate": 3.098420768950477e-06, + "loss": 1.4414, + "step": 35656 + }, + { + "epoch": 2.81, + "learning_rate": 3.0959221097818067e-06, + "loss": 1.4682, + "step": 35657 + }, + { + "epoch": 2.81, + "learning_rate": 3.093424448010784e-06, + "loss": 1.4345, + "step": 35658 + }, + { + "epoch": 2.81, + "learning_rate": 3.0909277836543287e-06, + "loss": 1.3734, + "step": 35659 + }, + { + "epoch": 2.81, + "learning_rate": 3.088432116729378e-06, + "loss": 1.4344, + "step": 35660 + }, + { + "epoch": 2.81, + "learning_rate": 3.085937447252934e-06, + "loss": 1.4683, + "step": 35661 + }, + { + "epoch": 2.81, + "learning_rate": 3.0834437752419004e-06, + "loss": 1.4874, + "step": 35662 + }, + { + "epoch": 2.81, + "learning_rate": 3.0809511007131804e-06, + "loss": 1.4447, + "step": 35663 + }, + { + "epoch": 2.81, + "learning_rate": 3.0784594236837433e-06, + "loss": 1.515, + "step": 35664 + }, + { + "epoch": 2.81, + "learning_rate": 3.075968744170493e-06, + "loss": 1.4554, + "step": 35665 + }, + { + "epoch": 2.81, + "learning_rate": 3.0734790621903316e-06, + "loss": 1.4186, + "step": 35666 + }, + { + "epoch": 2.81, + "learning_rate": 3.070990377760163e-06, + "loss": 1.4049, + "step": 35667 + }, + { + "epoch": 2.81, + "learning_rate": 3.0685026908968734e-06, + "loss": 1.4511, + "step": 35668 + }, + { + "epoch": 2.81, + "learning_rate": 3.0660160016173996e-06, + "loss": 1.455, + "step": 35669 + }, + { + "epoch": 2.81, + "learning_rate": 3.063530309938578e-06, + "loss": 1.4154, + "step": 35670 + }, + { + "epoch": 2.81, + "learning_rate": 3.061045615877278e-06, + "loss": 1.4347, + "step": 35671 + }, + { + "epoch": 2.81, + "learning_rate": 3.0585619194504198e-06, + "loss": 1.4335, + "step": 35672 + }, + { + "epoch": 2.81, + "learning_rate": 3.056079220674823e-06, + "loss": 1.4401, + "step": 35673 + }, + { + "epoch": 2.81, + "learning_rate": 3.0535975195673578e-06, + "loss": 1.4232, + "step": 35674 + }, + { + "epoch": 2.81, + "learning_rate": 3.0511168161448773e-06, + "loss": 1.4437, + "step": 35675 + }, + { + "epoch": 2.81, + "learning_rate": 3.048637110424235e-06, + "loss": 1.4215, + "step": 35676 + }, + { + "epoch": 2.81, + "learning_rate": 3.046158402422233e-06, + "loss": 1.4716, + "step": 35677 + }, + { + "epoch": 2.81, + "learning_rate": 3.0436806921557253e-06, + "loss": 1.4299, + "step": 35678 + }, + { + "epoch": 2.81, + "learning_rate": 3.041203979641532e-06, + "loss": 1.4278, + "step": 35679 + }, + { + "epoch": 2.81, + "learning_rate": 3.0387282648964563e-06, + "loss": 1.5027, + "step": 35680 + }, + { + "epoch": 2.81, + "learning_rate": 3.0362535479373175e-06, + "loss": 1.3878, + "step": 35681 + }, + { + "epoch": 2.81, + "learning_rate": 3.033779828780919e-06, + "loss": 1.444, + "step": 35682 + }, + { + "epoch": 2.81, + "learning_rate": 3.0313071074440474e-06, + "loss": 1.3747, + "step": 35683 + }, + { + "epoch": 2.81, + "learning_rate": 3.02883538394349e-06, + "loss": 1.4741, + "step": 35684 + }, + { + "epoch": 2.81, + "learning_rate": 3.0263646582960654e-06, + "loss": 1.458, + "step": 35685 + }, + { + "epoch": 2.81, + "learning_rate": 3.0238949305184947e-06, + "loss": 1.4509, + "step": 35686 + }, + { + "epoch": 2.81, + "learning_rate": 3.0214262006275635e-06, + "loss": 1.4226, + "step": 35687 + }, + { + "epoch": 2.81, + "learning_rate": 3.018958468640059e-06, + "loss": 1.4658, + "step": 35688 + }, + { + "epoch": 2.81, + "learning_rate": 3.016491734572718e-06, + "loss": 1.4165, + "step": 35689 + }, + { + "epoch": 2.81, + "learning_rate": 3.0140259984422765e-06, + "loss": 1.4648, + "step": 35690 + }, + { + "epoch": 2.81, + "learning_rate": 3.0115612602654713e-06, + "loss": 1.4587, + "step": 35691 + }, + { + "epoch": 2.81, + "learning_rate": 3.009097520059056e-06, + "loss": 1.4193, + "step": 35692 + }, + { + "epoch": 2.81, + "learning_rate": 3.006634777839767e-06, + "loss": 1.4173, + "step": 35693 + }, + { + "epoch": 2.81, + "learning_rate": 3.0041730336242907e-06, + "loss": 1.4751, + "step": 35694 + }, + { + "epoch": 2.81, + "learning_rate": 3.0017122874293807e-06, + "loss": 1.4234, + "step": 35695 + }, + { + "epoch": 2.81, + "learning_rate": 2.9992525392717236e-06, + "loss": 1.4817, + "step": 35696 + }, + { + "epoch": 2.81, + "learning_rate": 2.9967937891679896e-06, + "loss": 1.468, + "step": 35697 + }, + { + "epoch": 2.81, + "learning_rate": 2.994336037134931e-06, + "loss": 1.4497, + "step": 35698 + }, + { + "epoch": 2.81, + "learning_rate": 2.9918792831891857e-06, + "loss": 1.4541, + "step": 35699 + }, + { + "epoch": 2.81, + "learning_rate": 2.9894235273474733e-06, + "loss": 1.4398, + "step": 35700 + }, + { + "epoch": 2.81, + "learning_rate": 2.98696876962643e-06, + "loss": 1.4494, + "step": 35701 + }, + { + "epoch": 2.81, + "learning_rate": 2.9845150100427595e-06, + "loss": 1.4467, + "step": 35702 + }, + { + "epoch": 2.81, + "learning_rate": 2.9820622486130986e-06, + "loss": 1.4552, + "step": 35703 + }, + { + "epoch": 2.81, + "learning_rate": 2.9796104853541005e-06, + "loss": 1.4641, + "step": 35704 + }, + { + "epoch": 2.81, + "learning_rate": 2.977159720282418e-06, + "loss": 1.4978, + "step": 35705 + }, + { + "epoch": 2.81, + "learning_rate": 2.9747099534146888e-06, + "loss": 1.4344, + "step": 35706 + }, + { + "epoch": 2.81, + "learning_rate": 2.9722611847675327e-06, + "loss": 1.4304, + "step": 35707 + }, + { + "epoch": 2.81, + "learning_rate": 2.9698134143575856e-06, + "loss": 1.3818, + "step": 35708 + }, + { + "epoch": 2.81, + "learning_rate": 2.967366642201485e-06, + "loss": 1.4496, + "step": 35709 + }, + { + "epoch": 2.81, + "learning_rate": 2.9649208683158176e-06, + "loss": 1.4816, + "step": 35710 + }, + { + "epoch": 2.81, + "learning_rate": 2.9624760927171863e-06, + "loss": 1.4421, + "step": 35711 + }, + { + "epoch": 2.81, + "learning_rate": 2.9600323154222117e-06, + "loss": 1.4651, + "step": 35712 + }, + { + "epoch": 2.81, + "learning_rate": 2.95758953644748e-06, + "loss": 1.46, + "step": 35713 + }, + { + "epoch": 2.81, + "learning_rate": 2.955147755809545e-06, + "loss": 1.425, + "step": 35714 + }, + { + "epoch": 2.81, + "learning_rate": 2.9527069735250096e-06, + "loss": 1.4258, + "step": 35715 + }, + { + "epoch": 2.81, + "learning_rate": 2.950267189610478e-06, + "loss": 1.4444, + "step": 35716 + }, + { + "epoch": 2.81, + "learning_rate": 2.9478284040824698e-06, + "loss": 1.4184, + "step": 35717 + }, + { + "epoch": 2.81, + "learning_rate": 2.9453906169575547e-06, + "loss": 1.4582, + "step": 35718 + }, + { + "epoch": 2.81, + "learning_rate": 2.942953828252287e-06, + "loss": 1.5014, + "step": 35719 + }, + { + "epoch": 2.81, + "learning_rate": 2.9405180379832195e-06, + "loss": 1.4772, + "step": 35720 + }, + { + "epoch": 2.81, + "learning_rate": 2.9380832461668556e-06, + "loss": 1.4196, + "step": 35721 + }, + { + "epoch": 2.81, + "learning_rate": 2.9356494528197662e-06, + "loss": 1.4301, + "step": 35722 + }, + { + "epoch": 2.81, + "learning_rate": 2.93321665795847e-06, + "loss": 1.4728, + "step": 35723 + }, + { + "epoch": 2.81, + "learning_rate": 2.9307848615994723e-06, + "loss": 1.4364, + "step": 35724 + }, + { + "epoch": 2.81, + "learning_rate": 2.9283540637592584e-06, + "loss": 1.452, + "step": 35725 + }, + { + "epoch": 2.81, + "learning_rate": 2.925924264454399e-06, + "loss": 1.4334, + "step": 35726 + }, + { + "epoch": 2.81, + "learning_rate": 2.9234954637013308e-06, + "loss": 1.4608, + "step": 35727 + }, + { + "epoch": 2.81, + "learning_rate": 2.9210676615165573e-06, + "loss": 1.4682, + "step": 35728 + }, + { + "epoch": 2.81, + "learning_rate": 2.918640857916582e-06, + "loss": 1.4638, + "step": 35729 + }, + { + "epoch": 2.81, + "learning_rate": 2.916215052917875e-06, + "loss": 1.4224, + "step": 35730 + }, + { + "epoch": 2.81, + "learning_rate": 2.9137902465368736e-06, + "loss": 1.3743, + "step": 35731 + }, + { + "epoch": 2.81, + "learning_rate": 2.9113664387900804e-06, + "loss": 1.4028, + "step": 35732 + }, + { + "epoch": 2.81, + "learning_rate": 2.9089436296939495e-06, + "loss": 1.4703, + "step": 35733 + }, + { + "epoch": 2.81, + "learning_rate": 2.9065218192649177e-06, + "loss": 1.4724, + "step": 35734 + }, + { + "epoch": 2.81, + "learning_rate": 2.9041010075194216e-06, + "loss": 1.4706, + "step": 35735 + }, + { + "epoch": 2.81, + "learning_rate": 2.901681194473915e-06, + "loss": 1.4374, + "step": 35736 + }, + { + "epoch": 2.81, + "learning_rate": 2.899262380144818e-06, + "loss": 1.4243, + "step": 35737 + }, + { + "epoch": 2.81, + "learning_rate": 2.8968445645485337e-06, + "loss": 1.4396, + "step": 35738 + }, + { + "epoch": 2.81, + "learning_rate": 2.8944277477015166e-06, + "loss": 1.4796, + "step": 35739 + }, + { + "epoch": 2.81, + "learning_rate": 2.8920119296201526e-06, + "loss": 1.4343, + "step": 35740 + }, + { + "epoch": 2.81, + "learning_rate": 2.889597110320829e-06, + "loss": 1.456, + "step": 35741 + }, + { + "epoch": 2.81, + "learning_rate": 2.8871832898199833e-06, + "loss": 1.4594, + "step": 35742 + }, + { + "epoch": 2.81, + "learning_rate": 2.884770468133968e-06, + "loss": 1.4516, + "step": 35743 + }, + { + "epoch": 2.81, + "learning_rate": 2.88235864527917e-06, + "loss": 1.446, + "step": 35744 + }, + { + "epoch": 2.81, + "learning_rate": 2.8799478212719775e-06, + "loss": 1.4451, + "step": 35745 + }, + { + "epoch": 2.81, + "learning_rate": 2.8775379961287593e-06, + "loss": 1.4458, + "step": 35746 + }, + { + "epoch": 2.81, + "learning_rate": 2.875129169865853e-06, + "loss": 1.5022, + "step": 35747 + }, + { + "epoch": 2.81, + "learning_rate": 2.8727213424996454e-06, + "loss": 1.4472, + "step": 35748 + }, + { + "epoch": 2.81, + "learning_rate": 2.87031451404644e-06, + "loss": 1.4768, + "step": 35749 + }, + { + "epoch": 2.81, + "learning_rate": 2.8679086845226408e-06, + "loss": 1.4345, + "step": 35750 + }, + { + "epoch": 2.81, + "learning_rate": 2.865503853944534e-06, + "loss": 1.4278, + "step": 35751 + }, + { + "epoch": 2.81, + "learning_rate": 2.8631000223284574e-06, + "loss": 1.4369, + "step": 35752 + }, + { + "epoch": 2.81, + "learning_rate": 2.8606971896907307e-06, + "loss": 1.4417, + "step": 35753 + }, + { + "epoch": 2.81, + "learning_rate": 2.858295356047691e-06, + "loss": 1.4711, + "step": 35754 + }, + { + "epoch": 2.81, + "learning_rate": 2.855894521415608e-06, + "loss": 1.4887, + "step": 35755 + }, + { + "epoch": 2.81, + "learning_rate": 2.853494685810803e-06, + "loss": 1.4198, + "step": 35756 + }, + { + "epoch": 2.81, + "learning_rate": 2.8510958492495793e-06, + "loss": 1.4211, + "step": 35757 + }, + { + "epoch": 2.81, + "learning_rate": 2.8486980117481906e-06, + "loss": 1.439, + "step": 35758 + }, + { + "epoch": 2.81, + "learning_rate": 2.846301173322957e-06, + "loss": 1.4217, + "step": 35759 + }, + { + "epoch": 2.81, + "learning_rate": 2.8439053339901317e-06, + "loss": 1.4588, + "step": 35760 + }, + { + "epoch": 2.81, + "learning_rate": 2.8415104937659694e-06, + "loss": 1.4407, + "step": 35761 + }, + { + "epoch": 2.81, + "learning_rate": 2.8391166526667398e-06, + "loss": 1.5068, + "step": 35762 + }, + { + "epoch": 2.81, + "learning_rate": 2.8367238107086964e-06, + "loss": 1.4668, + "step": 35763 + }, + { + "epoch": 2.81, + "learning_rate": 2.83433196790811e-06, + "loss": 1.4301, + "step": 35764 + }, + { + "epoch": 2.81, + "learning_rate": 2.831941124281184e-06, + "loss": 1.4512, + "step": 35765 + }, + { + "epoch": 2.81, + "learning_rate": 2.8295512798441555e-06, + "loss": 1.4769, + "step": 35766 + }, + { + "epoch": 2.81, + "learning_rate": 2.8271624346132617e-06, + "loss": 1.4374, + "step": 35767 + }, + { + "epoch": 2.81, + "learning_rate": 2.824774588604739e-06, + "loss": 1.3901, + "step": 35768 + }, + { + "epoch": 2.81, + "learning_rate": 2.822387741834742e-06, + "loss": 1.4775, + "step": 35769 + }, + { + "epoch": 2.81, + "learning_rate": 2.82000189431954e-06, + "loss": 1.4219, + "step": 35770 + }, + { + "epoch": 2.81, + "learning_rate": 2.8176170460753043e-06, + "loss": 1.4614, + "step": 35771 + }, + { + "epoch": 2.81, + "learning_rate": 2.8152331971182053e-06, + "loss": 1.4604, + "step": 35772 + }, + { + "epoch": 2.81, + "learning_rate": 2.812850347464479e-06, + "loss": 1.4832, + "step": 35773 + }, + { + "epoch": 2.81, + "learning_rate": 2.810468497130264e-06, + "loss": 1.4651, + "step": 35774 + }, + { + "epoch": 2.81, + "learning_rate": 2.808087646131729e-06, + "loss": 1.4437, + "step": 35775 + }, + { + "epoch": 2.81, + "learning_rate": 2.8057077944850625e-06, + "loss": 1.5062, + "step": 35776 + }, + { + "epoch": 2.81, + "learning_rate": 2.8033289422064178e-06, + "loss": 1.4525, + "step": 35777 + }, + { + "epoch": 2.82, + "learning_rate": 2.8009510893119147e-06, + "loss": 1.4407, + "step": 35778 + }, + { + "epoch": 2.82, + "learning_rate": 2.798574235817741e-06, + "loss": 1.4049, + "step": 35779 + }, + { + "epoch": 2.82, + "learning_rate": 2.796198381740017e-06, + "loss": 1.4252, + "step": 35780 + }, + { + "epoch": 2.82, + "learning_rate": 2.7938235270948628e-06, + "loss": 1.4932, + "step": 35781 + }, + { + "epoch": 2.82, + "learning_rate": 2.7914496718984325e-06, + "loss": 1.3952, + "step": 35782 + }, + { + "epoch": 2.82, + "learning_rate": 2.7890768161667963e-06, + "loss": 1.3963, + "step": 35783 + }, + { + "epoch": 2.82, + "learning_rate": 2.7867049599161083e-06, + "loss": 1.4542, + "step": 35784 + }, + { + "epoch": 2.82, + "learning_rate": 2.7843341031624557e-06, + "loss": 1.415, + "step": 35785 + }, + { + "epoch": 2.82, + "learning_rate": 2.781964245921908e-06, + "loss": 1.4934, + "step": 35786 + }, + { + "epoch": 2.82, + "learning_rate": 2.7795953882106036e-06, + "loss": 1.4374, + "step": 35787 + }, + { + "epoch": 2.82, + "learning_rate": 2.7772275300446124e-06, + "loss": 1.4074, + "step": 35788 + }, + { + "epoch": 2.82, + "learning_rate": 2.774860671439988e-06, + "loss": 1.4223, + "step": 35789 + }, + { + "epoch": 2.82, + "learning_rate": 2.7724948124128176e-06, + "loss": 1.4578, + "step": 35790 + }, + { + "epoch": 2.82, + "learning_rate": 2.7701299529791555e-06, + "loss": 1.4752, + "step": 35791 + }, + { + "epoch": 2.82, + "learning_rate": 2.7677660931550715e-06, + "loss": 1.4514, + "step": 35792 + }, + { + "epoch": 2.82, + "learning_rate": 2.7654032329566035e-06, + "loss": 1.4021, + "step": 35793 + }, + { + "epoch": 2.82, + "learning_rate": 2.763041372399788e-06, + "loss": 1.4377, + "step": 35794 + }, + { + "epoch": 2.82, + "learning_rate": 2.7606805115006793e-06, + "loss": 1.4436, + "step": 35795 + }, + { + "epoch": 2.82, + "learning_rate": 2.7583206502752807e-06, + "loss": 1.4738, + "step": 35796 + }, + { + "epoch": 2.82, + "learning_rate": 2.755961788739647e-06, + "loss": 1.4619, + "step": 35797 + }, + { + "epoch": 2.82, + "learning_rate": 2.753603926909781e-06, + "loss": 1.4472, + "step": 35798 + }, + { + "epoch": 2.82, + "learning_rate": 2.7512470648016706e-06, + "loss": 1.4583, + "step": 35799 + }, + { + "epoch": 2.82, + "learning_rate": 2.7488912024313525e-06, + "loss": 1.4174, + "step": 35800 + }, + { + "epoch": 2.82, + "learning_rate": 2.7465363398147975e-06, + "loss": 1.4953, + "step": 35801 + }, + { + "epoch": 2.82, + "learning_rate": 2.7441824769679934e-06, + "loss": 1.4544, + "step": 35802 + }, + { + "epoch": 2.82, + "learning_rate": 2.741829613906926e-06, + "loss": 1.4273, + "step": 35803 + }, + { + "epoch": 2.82, + "learning_rate": 2.7394777506475674e-06, + "loss": 1.4055, + "step": 35804 + }, + { + "epoch": 2.82, + "learning_rate": 2.737126887205904e-06, + "loss": 1.3954, + "step": 35805 + }, + { + "epoch": 2.82, + "learning_rate": 2.734777023597873e-06, + "loss": 1.4289, + "step": 35806 + }, + { + "epoch": 2.82, + "learning_rate": 2.732428159839445e-06, + "loss": 1.4603, + "step": 35807 + }, + { + "epoch": 2.82, + "learning_rate": 2.7300802959465573e-06, + "loss": 1.4302, + "step": 35808 + }, + { + "epoch": 2.82, + "learning_rate": 2.7277334319351472e-06, + "loss": 1.4464, + "step": 35809 + }, + { + "epoch": 2.82, + "learning_rate": 2.7253875678211524e-06, + "loss": 1.4844, + "step": 35810 + }, + { + "epoch": 2.82, + "learning_rate": 2.723042703620526e-06, + "loss": 1.4448, + "step": 35811 + }, + { + "epoch": 2.82, + "learning_rate": 2.7206988393491556e-06, + "loss": 1.4443, + "step": 35812 + }, + { + "epoch": 2.82, + "learning_rate": 2.7183559750229624e-06, + "loss": 1.4192, + "step": 35813 + }, + { + "epoch": 2.82, + "learning_rate": 2.716014110657849e-06, + "loss": 1.4307, + "step": 35814 + }, + { + "epoch": 2.82, + "learning_rate": 2.7136732462697373e-06, + "loss": 1.4802, + "step": 35815 + }, + { + "epoch": 2.82, + "learning_rate": 2.711333381874481e-06, + "loss": 1.4182, + "step": 35816 + }, + { + "epoch": 2.82, + "learning_rate": 2.708994517488017e-06, + "loss": 1.4669, + "step": 35817 + }, + { + "epoch": 2.82, + "learning_rate": 2.7066566531261826e-06, + "loss": 1.4396, + "step": 35818 + }, + { + "epoch": 2.82, + "learning_rate": 2.704319788804882e-06, + "loss": 1.4328, + "step": 35819 + }, + { + "epoch": 2.82, + "learning_rate": 2.7019839245399355e-06, + "loss": 1.423, + "step": 35820 + }, + { + "epoch": 2.82, + "learning_rate": 2.699649060347264e-06, + "loss": 1.4635, + "step": 35821 + }, + { + "epoch": 2.82, + "learning_rate": 2.697315196242672e-06, + "loss": 1.4354, + "step": 35822 + }, + { + "epoch": 2.82, + "learning_rate": 2.6949823322420294e-06, + "loss": 1.4404, + "step": 35823 + }, + { + "epoch": 2.82, + "learning_rate": 2.692650468361157e-06, + "loss": 1.4484, + "step": 35824 + }, + { + "epoch": 2.82, + "learning_rate": 2.6903196046158928e-06, + "loss": 1.4396, + "step": 35825 + }, + { + "epoch": 2.82, + "learning_rate": 2.6879897410220897e-06, + "loss": 1.4022, + "step": 35826 + }, + { + "epoch": 2.82, + "learning_rate": 2.685660877595519e-06, + "loss": 1.437, + "step": 35827 + }, + { + "epoch": 2.82, + "learning_rate": 2.6833330143520183e-06, + "loss": 1.4389, + "step": 35828 + }, + { + "epoch": 2.82, + "learning_rate": 2.6810061513074075e-06, + "loss": 1.4363, + "step": 35829 + }, + { + "epoch": 2.82, + "learning_rate": 2.6786802884774584e-06, + "loss": 1.4343, + "step": 35830 + }, + { + "epoch": 2.82, + "learning_rate": 2.676355425877974e-06, + "loss": 1.4749, + "step": 35831 + }, + { + "epoch": 2.82, + "learning_rate": 2.6740315635247255e-06, + "loss": 1.4379, + "step": 35832 + }, + { + "epoch": 2.82, + "learning_rate": 2.6717087014335003e-06, + "loss": 1.446, + "step": 35833 + }, + { + "epoch": 2.82, + "learning_rate": 2.6693868396200857e-06, + "loss": 1.4906, + "step": 35834 + }, + { + "epoch": 2.82, + "learning_rate": 2.6670659781002356e-06, + "loss": 1.4636, + "step": 35835 + }, + { + "epoch": 2.82, + "learning_rate": 2.664746116889688e-06, + "loss": 1.4384, + "step": 35836 + }, + { + "epoch": 2.82, + "learning_rate": 2.6624272560042126e-06, + "loss": 1.4627, + "step": 35837 + }, + { + "epoch": 2.82, + "learning_rate": 2.6601093954595476e-06, + "loss": 1.4444, + "step": 35838 + }, + { + "epoch": 2.82, + "learning_rate": 2.6577925352714303e-06, + "loss": 1.421, + "step": 35839 + }, + { + "epoch": 2.82, + "learning_rate": 2.6554766754555813e-06, + "loss": 1.3944, + "step": 35840 + }, + { + "epoch": 2.82, + "learning_rate": 2.653161816027738e-06, + "loss": 1.4377, + "step": 35841 + }, + { + "epoch": 2.82, + "learning_rate": 2.650847957003638e-06, + "loss": 1.4325, + "step": 35842 + }, + { + "epoch": 2.82, + "learning_rate": 2.648535098398952e-06, + "loss": 1.4216, + "step": 35843 + }, + { + "epoch": 2.82, + "learning_rate": 2.6462232402293835e-06, + "loss": 1.4625, + "step": 35844 + }, + { + "epoch": 2.82, + "learning_rate": 2.6439123825106546e-06, + "loss": 1.4115, + "step": 35845 + }, + { + "epoch": 2.82, + "learning_rate": 2.6416025252584518e-06, + "loss": 1.4407, + "step": 35846 + }, + { + "epoch": 2.82, + "learning_rate": 2.639293668488429e-06, + "loss": 1.452, + "step": 35847 + }, + { + "epoch": 2.82, + "learning_rate": 2.6369858122162912e-06, + "loss": 1.4252, + "step": 35848 + }, + { + "epoch": 2.82, + "learning_rate": 2.634678956457692e-06, + "loss": 1.4136, + "step": 35849 + }, + { + "epoch": 2.82, + "learning_rate": 2.632373101228302e-06, + "loss": 1.5095, + "step": 35850 + }, + { + "epoch": 2.82, + "learning_rate": 2.630068246543793e-06, + "loss": 1.4292, + "step": 35851 + }, + { + "epoch": 2.82, + "learning_rate": 2.6277643924197845e-06, + "loss": 1.4229, + "step": 35852 + }, + { + "epoch": 2.82, + "learning_rate": 2.6254615388719147e-06, + "loss": 1.4179, + "step": 35853 + }, + { + "epoch": 2.82, + "learning_rate": 2.6231596859158378e-06, + "loss": 1.4983, + "step": 35854 + }, + { + "epoch": 2.82, + "learning_rate": 2.620858833567191e-06, + "loss": 1.4428, + "step": 35855 + }, + { + "epoch": 2.82, + "learning_rate": 2.6185589818415785e-06, + "loss": 1.4596, + "step": 35856 + }, + { + "epoch": 2.82, + "learning_rate": 2.6162601307545885e-06, + "loss": 1.4305, + "step": 35857 + }, + { + "epoch": 2.82, + "learning_rate": 2.6139622803218906e-06, + "loss": 1.4508, + "step": 35858 + }, + { + "epoch": 2.82, + "learning_rate": 2.6116654305590567e-06, + "loss": 1.419, + "step": 35859 + }, + { + "epoch": 2.82, + "learning_rate": 2.609369581481674e-06, + "loss": 1.4244, + "step": 35860 + }, + { + "epoch": 2.82, + "learning_rate": 2.60707473310533e-06, + "loss": 1.3975, + "step": 35861 + }, + { + "epoch": 2.82, + "learning_rate": 2.6047808854456122e-06, + "loss": 1.4292, + "step": 35862 + }, + { + "epoch": 2.82, + "learning_rate": 2.602488038518091e-06, + "loss": 1.4561, + "step": 35863 + }, + { + "epoch": 2.82, + "learning_rate": 2.6001961923383387e-06, + "loss": 1.5049, + "step": 35864 + }, + { + "epoch": 2.82, + "learning_rate": 2.597905346921908e-06, + "loss": 1.4621, + "step": 35865 + }, + { + "epoch": 2.82, + "learning_rate": 2.5956155022843704e-06, + "loss": 1.4605, + "step": 35866 + }, + { + "epoch": 2.82, + "learning_rate": 2.593326658441247e-06, + "loss": 1.4716, + "step": 35867 + }, + { + "epoch": 2.82, + "learning_rate": 2.5910388154080917e-06, + "loss": 1.4791, + "step": 35868 + }, + { + "epoch": 2.82, + "learning_rate": 2.5887519732004426e-06, + "loss": 1.4292, + "step": 35869 + }, + { + "epoch": 2.82, + "learning_rate": 2.5864661318338033e-06, + "loss": 1.4489, + "step": 35870 + }, + { + "epoch": 2.82, + "learning_rate": 2.5841812913237116e-06, + "loss": 1.4837, + "step": 35871 + }, + { + "epoch": 2.82, + "learning_rate": 2.5818974516856884e-06, + "loss": 1.3893, + "step": 35872 + }, + { + "epoch": 2.82, + "learning_rate": 2.5796146129352213e-06, + "loss": 1.4156, + "step": 35873 + }, + { + "epoch": 2.82, + "learning_rate": 2.5773327750878147e-06, + "loss": 1.4513, + "step": 35874 + }, + { + "epoch": 2.82, + "learning_rate": 2.575051938158973e-06, + "loss": 1.4256, + "step": 35875 + }, + { + "epoch": 2.82, + "learning_rate": 2.5727721021641833e-06, + "loss": 1.4218, + "step": 35876 + }, + { + "epoch": 2.82, + "learning_rate": 2.5704932671189006e-06, + "loss": 1.45, + "step": 35877 + }, + { + "epoch": 2.82, + "learning_rate": 2.568215433038612e-06, + "loss": 1.3913, + "step": 35878 + }, + { + "epoch": 2.82, + "learning_rate": 2.5659385999387715e-06, + "loss": 1.4402, + "step": 35879 + }, + { + "epoch": 2.82, + "learning_rate": 2.5636627678348677e-06, + "loss": 1.4463, + "step": 35880 + }, + { + "epoch": 2.82, + "learning_rate": 2.5613879367423206e-06, + "loss": 1.4057, + "step": 35881 + }, + { + "epoch": 2.82, + "learning_rate": 2.5591141066765853e-06, + "loss": 1.42, + "step": 35882 + }, + { + "epoch": 2.82, + "learning_rate": 2.5568412776530988e-06, + "loss": 1.4613, + "step": 35883 + }, + { + "epoch": 2.82, + "learning_rate": 2.554569449687299e-06, + "loss": 1.4777, + "step": 35884 + }, + { + "epoch": 2.82, + "learning_rate": 2.5522986227946075e-06, + "loss": 1.4289, + "step": 35885 + }, + { + "epoch": 2.82, + "learning_rate": 2.5500287969904276e-06, + "loss": 1.4597, + "step": 35886 + }, + { + "epoch": 2.82, + "learning_rate": 2.547759972290181e-06, + "loss": 1.4743, + "step": 35887 + }, + { + "epoch": 2.82, + "learning_rate": 2.5454921487092884e-06, + "loss": 1.4097, + "step": 35888 + }, + { + "epoch": 2.82, + "learning_rate": 2.543225326263121e-06, + "loss": 1.42, + "step": 35889 + }, + { + "epoch": 2.82, + "learning_rate": 2.5409595049670994e-06, + "loss": 1.4327, + "step": 35890 + }, + { + "epoch": 2.82, + "learning_rate": 2.538694684836562e-06, + "loss": 1.4414, + "step": 35891 + }, + { + "epoch": 2.82, + "learning_rate": 2.536430865886929e-06, + "loss": 1.4623, + "step": 35892 + }, + { + "epoch": 2.82, + "learning_rate": 2.534168048133556e-06, + "loss": 1.5071, + "step": 35893 + }, + { + "epoch": 2.82, + "learning_rate": 2.5319062315917793e-06, + "loss": 1.4622, + "step": 35894 + }, + { + "epoch": 2.82, + "learning_rate": 2.5296454162770042e-06, + "loss": 1.4249, + "step": 35895 + }, + { + "epoch": 2.82, + "learning_rate": 2.5273856022045515e-06, + "loss": 1.4253, + "step": 35896 + }, + { + "epoch": 2.82, + "learning_rate": 2.525126789389775e-06, + "loss": 1.4454, + "step": 35897 + }, + { + "epoch": 2.82, + "learning_rate": 2.5228689778479804e-06, + "loss": 1.4433, + "step": 35898 + }, + { + "epoch": 2.82, + "learning_rate": 2.5206121675945378e-06, + "loss": 1.4455, + "step": 35899 + }, + { + "epoch": 2.82, + "learning_rate": 2.518356358644752e-06, + "loss": 1.4578, + "step": 35900 + }, + { + "epoch": 2.82, + "learning_rate": 2.516101551013927e-06, + "loss": 1.449, + "step": 35901 + }, + { + "epoch": 2.82, + "learning_rate": 2.513847744717401e-06, + "loss": 1.4961, + "step": 35902 + }, + { + "epoch": 2.82, + "learning_rate": 2.5115949397704614e-06, + "loss": 1.4693, + "step": 35903 + }, + { + "epoch": 2.82, + "learning_rate": 2.5093431361883797e-06, + "loss": 1.4214, + "step": 35904 + }, + { + "epoch": 2.83, + "learning_rate": 2.5070923339864767e-06, + "loss": 1.4456, + "step": 35905 + }, + { + "epoch": 2.83, + "learning_rate": 2.504842533180024e-06, + "loss": 1.5058, + "step": 35906 + }, + { + "epoch": 2.83, + "learning_rate": 2.5025937337843085e-06, + "loss": 1.4129, + "step": 35907 + }, + { + "epoch": 2.83, + "learning_rate": 2.5003459358145517e-06, + "loss": 1.4116, + "step": 35908 + }, + { + "epoch": 2.83, + "learning_rate": 2.498099139286075e-06, + "loss": 1.4525, + "step": 35909 + }, + { + "epoch": 2.83, + "learning_rate": 2.495853344214116e-06, + "loss": 1.4445, + "step": 35910 + }, + { + "epoch": 2.83, + "learning_rate": 2.493608550613896e-06, + "loss": 1.4339, + "step": 35911 + }, + { + "epoch": 2.83, + "learning_rate": 2.4913647585006857e-06, + "loss": 1.4544, + "step": 35912 + }, + { + "epoch": 2.83, + "learning_rate": 2.48912196788969e-06, + "loss": 1.4528, + "step": 35913 + }, + { + "epoch": 2.83, + "learning_rate": 2.4868801787961802e-06, + "loss": 1.4964, + "step": 35914 + }, + { + "epoch": 2.83, + "learning_rate": 2.48463939123531e-06, + "loss": 1.5202, + "step": 35915 + }, + { + "epoch": 2.83, + "learning_rate": 2.482399605222368e-06, + "loss": 1.5168, + "step": 35916 + }, + { + "epoch": 2.83, + "learning_rate": 2.4801608207725086e-06, + "loss": 1.4345, + "step": 35917 + }, + { + "epoch": 2.83, + "learning_rate": 2.477923037900953e-06, + "loss": 1.4546, + "step": 35918 + }, + { + "epoch": 2.83, + "learning_rate": 2.475686256622872e-06, + "loss": 1.4554, + "step": 35919 + }, + { + "epoch": 2.83, + "learning_rate": 2.4734504769535033e-06, + "loss": 1.4875, + "step": 35920 + }, + { + "epoch": 2.83, + "learning_rate": 2.471215698907969e-06, + "loss": 1.4198, + "step": 35921 + }, + { + "epoch": 2.83, + "learning_rate": 2.468981922501473e-06, + "loss": 1.4785, + "step": 35922 + }, + { + "epoch": 2.83, + "learning_rate": 2.4667491477491864e-06, + "loss": 1.4867, + "step": 35923 + }, + { + "epoch": 2.83, + "learning_rate": 2.4645173746662473e-06, + "loss": 1.4406, + "step": 35924 + }, + { + "epoch": 2.83, + "learning_rate": 2.4622866032678266e-06, + "loss": 1.4343, + "step": 35925 + }, + { + "epoch": 2.83, + "learning_rate": 2.460056833569063e-06, + "loss": 1.4186, + "step": 35926 + }, + { + "epoch": 2.83, + "learning_rate": 2.4578280655850766e-06, + "loss": 1.4089, + "step": 35927 + }, + { + "epoch": 2.83, + "learning_rate": 2.455600299331023e-06, + "loss": 1.4236, + "step": 35928 + }, + { + "epoch": 2.83, + "learning_rate": 2.4533735348220396e-06, + "loss": 1.4368, + "step": 35929 + }, + { + "epoch": 2.83, + "learning_rate": 2.4511477720732143e-06, + "loss": 1.4439, + "step": 35930 + }, + { + "epoch": 2.83, + "learning_rate": 2.448923011099685e-06, + "loss": 1.3632, + "step": 35931 + }, + { + "epoch": 2.83, + "learning_rate": 2.4466992519165063e-06, + "loss": 1.4245, + "step": 35932 + }, + { + "epoch": 2.83, + "learning_rate": 2.4444764945388495e-06, + "loss": 1.4731, + "step": 35933 + }, + { + "epoch": 2.83, + "learning_rate": 2.4422547389817525e-06, + "loss": 1.3963, + "step": 35934 + }, + { + "epoch": 2.83, + "learning_rate": 2.44003398526032e-06, + "loss": 1.3863, + "step": 35935 + }, + { + "epoch": 2.83, + "learning_rate": 2.4378142333896233e-06, + "loss": 1.4285, + "step": 35936 + }, + { + "epoch": 2.83, + "learning_rate": 2.4355954833847336e-06, + "loss": 1.4591, + "step": 35937 + }, + { + "epoch": 2.83, + "learning_rate": 2.433377735260739e-06, + "loss": 1.4571, + "step": 35938 + }, + { + "epoch": 2.83, + "learning_rate": 2.4311609890326433e-06, + "loss": 1.428, + "step": 35939 + }, + { + "epoch": 2.83, + "learning_rate": 2.4289452447155522e-06, + "loss": 1.4361, + "step": 35940 + }, + { + "epoch": 2.83, + "learning_rate": 2.4267305023244864e-06, + "loss": 1.4408, + "step": 35941 + }, + { + "epoch": 2.83, + "learning_rate": 2.4245167618744675e-06, + "loss": 1.4737, + "step": 35942 + }, + { + "epoch": 2.83, + "learning_rate": 2.4223040233805668e-06, + "loss": 1.4527, + "step": 35943 + }, + { + "epoch": 2.83, + "learning_rate": 2.4200922868577556e-06, + "loss": 1.45, + "step": 35944 + }, + { + "epoch": 2.83, + "learning_rate": 2.4178815523210883e-06, + "loss": 1.4791, + "step": 35945 + }, + { + "epoch": 2.83, + "learning_rate": 2.4156718197855697e-06, + "loss": 1.4374, + "step": 35946 + }, + { + "epoch": 2.83, + "learning_rate": 2.413463089266188e-06, + "loss": 1.4857, + "step": 35947 + }, + { + "epoch": 2.83, + "learning_rate": 2.411255360777947e-06, + "loss": 1.4409, + "step": 35948 + }, + { + "epoch": 2.83, + "learning_rate": 2.4090486343358195e-06, + "loss": 1.4046, + "step": 35949 + }, + { + "epoch": 2.83, + "learning_rate": 2.406842909954826e-06, + "loss": 1.4256, + "step": 35950 + }, + { + "epoch": 2.83, + "learning_rate": 2.404638187649904e-06, + "loss": 1.4786, + "step": 35951 + }, + { + "epoch": 2.83, + "learning_rate": 2.402434467436043e-06, + "loss": 1.4312, + "step": 35952 + }, + { + "epoch": 2.83, + "learning_rate": 2.400231749328213e-06, + "loss": 1.4021, + "step": 35953 + }, + { + "epoch": 2.83, + "learning_rate": 2.3980300333413527e-06, + "loss": 1.4695, + "step": 35954 + }, + { + "epoch": 2.83, + "learning_rate": 2.3958293194904166e-06, + "loss": 1.444, + "step": 35955 + }, + { + "epoch": 2.83, + "learning_rate": 2.393629607790343e-06, + "loss": 1.4152, + "step": 35956 + }, + { + "epoch": 2.83, + "learning_rate": 2.3914308982560692e-06, + "loss": 1.4394, + "step": 35957 + }, + { + "epoch": 2.83, + "learning_rate": 2.3892331909025177e-06, + "loss": 1.4043, + "step": 35958 + }, + { + "epoch": 2.83, + "learning_rate": 2.3870364857446087e-06, + "loss": 1.4304, + "step": 35959 + }, + { + "epoch": 2.83, + "learning_rate": 2.3848407827972816e-06, + "loss": 1.4368, + "step": 35960 + }, + { + "epoch": 2.83, + "learning_rate": 2.3826460820754236e-06, + "loss": 1.4228, + "step": 35961 + }, + { + "epoch": 2.83, + "learning_rate": 2.380452383593906e-06, + "loss": 1.4524, + "step": 35962 + }, + { + "epoch": 2.83, + "learning_rate": 2.378259687367684e-06, + "loss": 1.4204, + "step": 35963 + }, + { + "epoch": 2.83, + "learning_rate": 2.376067993411612e-06, + "loss": 1.4261, + "step": 35964 + }, + { + "epoch": 2.83, + "learning_rate": 2.373877301740562e-06, + "loss": 1.4464, + "step": 35965 + }, + { + "epoch": 2.83, + "learning_rate": 2.3716876123694216e-06, + "loss": 1.4364, + "step": 35966 + }, + { + "epoch": 2.83, + "learning_rate": 2.3694989253130457e-06, + "loss": 1.4396, + "step": 35967 + }, + { + "epoch": 2.83, + "learning_rate": 2.3673112405863224e-06, + "loss": 1.4785, + "step": 35968 + }, + { + "epoch": 2.83, + "learning_rate": 2.365124558204057e-06, + "loss": 1.4564, + "step": 35969 + }, + { + "epoch": 2.83, + "learning_rate": 2.3629388781811533e-06, + "loss": 1.4089, + "step": 35970 + }, + { + "epoch": 2.83, + "learning_rate": 2.3607542005324163e-06, + "loss": 1.4844, + "step": 35971 + }, + { + "epoch": 2.83, + "learning_rate": 2.3585705252726682e-06, + "loss": 1.4882, + "step": 35972 + }, + { + "epoch": 2.83, + "learning_rate": 2.3563878524167635e-06, + "loss": 1.4419, + "step": 35973 + }, + { + "epoch": 2.83, + "learning_rate": 2.3542061819795065e-06, + "loss": 1.43, + "step": 35974 + }, + { + "epoch": 2.83, + "learning_rate": 2.3520255139757195e-06, + "loss": 1.3838, + "step": 35975 + }, + { + "epoch": 2.83, + "learning_rate": 2.349845848420173e-06, + "loss": 1.4351, + "step": 35976 + }, + { + "epoch": 2.83, + "learning_rate": 2.347667185327723e-06, + "loss": 1.479, + "step": 35977 + }, + { + "epoch": 2.83, + "learning_rate": 2.3454895247131233e-06, + "loss": 1.4297, + "step": 35978 + }, + { + "epoch": 2.83, + "learning_rate": 2.343312866591163e-06, + "loss": 1.4158, + "step": 35979 + }, + { + "epoch": 2.83, + "learning_rate": 2.341137210976629e-06, + "loss": 1.4395, + "step": 35980 + }, + { + "epoch": 2.83, + "learning_rate": 2.338962557884294e-06, + "loss": 1.4364, + "step": 35981 + }, + { + "epoch": 2.83, + "learning_rate": 2.336788907328896e-06, + "loss": 1.4143, + "step": 35982 + }, + { + "epoch": 2.83, + "learning_rate": 2.334616259325223e-06, + "loss": 1.4416, + "step": 35983 + }, + { + "epoch": 2.83, + "learning_rate": 2.332444613888029e-06, + "loss": 1.4229, + "step": 35984 + }, + { + "epoch": 2.83, + "learning_rate": 2.3302739710320374e-06, + "loss": 1.4644, + "step": 35985 + }, + { + "epoch": 2.83, + "learning_rate": 2.328104330771985e-06, + "loss": 1.4392, + "step": 35986 + }, + { + "epoch": 2.83, + "learning_rate": 2.325935693122627e-06, + "loss": 1.4603, + "step": 35987 + }, + { + "epoch": 2.83, + "learning_rate": 2.3237680580986684e-06, + "loss": 1.404, + "step": 35988 + }, + { + "epoch": 2.83, + "learning_rate": 2.3216014257148474e-06, + "loss": 1.4135, + "step": 35989 + }, + { + "epoch": 2.83, + "learning_rate": 2.319435795985819e-06, + "loss": 1.4603, + "step": 35990 + }, + { + "epoch": 2.83, + "learning_rate": 2.3172711689263545e-06, + "loss": 1.4619, + "step": 35991 + }, + { + "epoch": 2.83, + "learning_rate": 2.315107544551109e-06, + "loss": 1.4443, + "step": 35992 + }, + { + "epoch": 2.83, + "learning_rate": 2.3129449228747877e-06, + "loss": 1.3894, + "step": 35993 + }, + { + "epoch": 2.83, + "learning_rate": 2.3107833039120784e-06, + "loss": 1.437, + "step": 35994 + }, + { + "epoch": 2.83, + "learning_rate": 2.3086226876776357e-06, + "loss": 1.4323, + "step": 35995 + }, + { + "epoch": 2.83, + "learning_rate": 2.3064630741861325e-06, + "loss": 1.4352, + "step": 35996 + }, + { + "epoch": 2.83, + "learning_rate": 2.3043044634522558e-06, + "loss": 1.4723, + "step": 35997 + }, + { + "epoch": 2.83, + "learning_rate": 2.302146855490644e-06, + "loss": 1.5074, + "step": 35998 + }, + { + "epoch": 2.83, + "learning_rate": 2.299990250315953e-06, + "loss": 1.4462, + "step": 35999 + }, + { + "epoch": 2.83, + "learning_rate": 2.2978346479428034e-06, + "loss": 1.4468, + "step": 36000 + }, + { + "epoch": 2.83, + "learning_rate": 2.295680048385867e-06, + "loss": 1.4438, + "step": 36001 + }, + { + "epoch": 2.83, + "learning_rate": 2.2935264516597663e-06, + "loss": 1.4519, + "step": 36002 + }, + { + "epoch": 2.83, + "learning_rate": 2.291373857779072e-06, + "loss": 1.438, + "step": 36003 + }, + { + "epoch": 2.83, + "learning_rate": 2.289222266758456e-06, + "loss": 1.3825, + "step": 36004 + }, + { + "epoch": 2.83, + "learning_rate": 2.287071678612523e-06, + "loss": 1.4723, + "step": 36005 + }, + { + "epoch": 2.83, + "learning_rate": 2.2849220933558287e-06, + "loss": 1.5298, + "step": 36006 + }, + { + "epoch": 2.83, + "learning_rate": 2.282773511003011e-06, + "loss": 1.3931, + "step": 36007 + }, + { + "epoch": 2.83, + "learning_rate": 2.280625931568658e-06, + "loss": 1.4528, + "step": 36008 + }, + { + "epoch": 2.83, + "learning_rate": 2.278479355067325e-06, + "loss": 1.3999, + "step": 36009 + }, + { + "epoch": 2.83, + "learning_rate": 2.276333781513584e-06, + "loss": 1.4344, + "step": 36010 + }, + { + "epoch": 2.83, + "learning_rate": 2.2741892109220396e-06, + "loss": 1.4821, + "step": 36011 + }, + { + "epoch": 2.83, + "learning_rate": 2.272045643307213e-06, + "loss": 1.4228, + "step": 36012 + }, + { + "epoch": 2.83, + "learning_rate": 2.2699030786836767e-06, + "loss": 1.4509, + "step": 36013 + }, + { + "epoch": 2.83, + "learning_rate": 2.2677615170659692e-06, + "loss": 1.4725, + "step": 36014 + }, + { + "epoch": 2.83, + "learning_rate": 2.2656209584686447e-06, + "loss": 1.4702, + "step": 36015 + }, + { + "epoch": 2.83, + "learning_rate": 2.2634814029062254e-06, + "loss": 1.4991, + "step": 36016 + }, + { + "epoch": 2.83, + "learning_rate": 2.261342850393233e-06, + "loss": 1.457, + "step": 36017 + }, + { + "epoch": 2.83, + "learning_rate": 2.259205300944206e-06, + "loss": 1.4626, + "step": 36018 + }, + { + "epoch": 2.83, + "learning_rate": 2.2570687545736322e-06, + "loss": 1.4564, + "step": 36019 + }, + { + "epoch": 2.83, + "learning_rate": 2.254933211296034e-06, + "loss": 1.459, + "step": 36020 + }, + { + "epoch": 2.83, + "learning_rate": 2.252798671125916e-06, + "loss": 1.4527, + "step": 36021 + }, + { + "epoch": 2.83, + "learning_rate": 2.2506651340777503e-06, + "loss": 1.4065, + "step": 36022 + }, + { + "epoch": 2.83, + "learning_rate": 2.2485326001660255e-06, + "loss": 1.4233, + "step": 36023 + }, + { + "epoch": 2.83, + "learning_rate": 2.2464010694052457e-06, + "loss": 1.4698, + "step": 36024 + }, + { + "epoch": 2.83, + "learning_rate": 2.2442705418098673e-06, + "loss": 1.4683, + "step": 36025 + }, + { + "epoch": 2.83, + "learning_rate": 2.2421410173943444e-06, + "loss": 1.4361, + "step": 36026 + }, + { + "epoch": 2.83, + "learning_rate": 2.240012496173149e-06, + "loss": 1.4528, + "step": 36027 + }, + { + "epoch": 2.83, + "learning_rate": 2.23788497816072e-06, + "loss": 1.4583, + "step": 36028 + }, + { + "epoch": 2.83, + "learning_rate": 2.235758463371512e-06, + "loss": 1.4288, + "step": 36029 + }, + { + "epoch": 2.83, + "learning_rate": 2.2336329518199638e-06, + "loss": 1.3762, + "step": 36030 + }, + { + "epoch": 2.83, + "learning_rate": 2.2315084435204966e-06, + "loss": 1.4363, + "step": 36031 + }, + { + "epoch": 2.84, + "learning_rate": 2.229384938487566e-06, + "loss": 1.4854, + "step": 36032 + }, + { + "epoch": 2.84, + "learning_rate": 2.227262436735544e-06, + "loss": 1.4992, + "step": 36033 + }, + { + "epoch": 2.84, + "learning_rate": 2.225140938278869e-06, + "loss": 1.424, + "step": 36034 + }, + { + "epoch": 2.84, + "learning_rate": 2.2230204431319286e-06, + "loss": 1.461, + "step": 36035 + }, + { + "epoch": 2.84, + "learning_rate": 2.220900951309146e-06, + "loss": 1.4455, + "step": 36036 + }, + { + "epoch": 2.84, + "learning_rate": 2.218782462824875e-06, + "loss": 1.4251, + "step": 36037 + }, + { + "epoch": 2.84, + "learning_rate": 2.2166649776935385e-06, + "loss": 1.4622, + "step": 36038 + }, + { + "epoch": 2.84, + "learning_rate": 2.2145484959294746e-06, + "loss": 1.5024, + "step": 36039 + }, + { + "epoch": 2.84, + "learning_rate": 2.2124330175470884e-06, + "loss": 1.4884, + "step": 36040 + }, + { + "epoch": 2.84, + "learning_rate": 2.2103185425607184e-06, + "loss": 1.4514, + "step": 36041 + }, + { + "epoch": 2.84, + "learning_rate": 2.2082050709847197e-06, + "loss": 1.4482, + "step": 36042 + }, + { + "epoch": 2.84, + "learning_rate": 2.2060926028334647e-06, + "loss": 1.5003, + "step": 36043 + }, + { + "epoch": 2.84, + "learning_rate": 2.2039811381212748e-06, + "loss": 1.4254, + "step": 36044 + }, + { + "epoch": 2.84, + "learning_rate": 2.2018706768624883e-06, + "loss": 1.421, + "step": 36045 + }, + { + "epoch": 2.84, + "learning_rate": 2.1997612190714444e-06, + "loss": 1.4428, + "step": 36046 + }, + { + "epoch": 2.84, + "learning_rate": 2.1976527647624642e-06, + "loss": 1.4491, + "step": 36047 + }, + { + "epoch": 2.84, + "learning_rate": 2.195545313949837e-06, + "loss": 1.428, + "step": 36048 + }, + { + "epoch": 2.84, + "learning_rate": 2.1934388666479173e-06, + "loss": 1.4235, + "step": 36049 + }, + { + "epoch": 2.84, + "learning_rate": 2.1913334228709777e-06, + "loss": 1.4054, + "step": 36050 + }, + { + "epoch": 2.84, + "learning_rate": 2.1892289826332897e-06, + "loss": 1.4957, + "step": 36051 + }, + { + "epoch": 2.84, + "learning_rate": 2.187125545949192e-06, + "loss": 1.4121, + "step": 36052 + }, + { + "epoch": 2.84, + "learning_rate": 2.18502311283294e-06, + "loss": 1.4319, + "step": 36053 + }, + { + "epoch": 2.84, + "learning_rate": 2.182921683298805e-06, + "loss": 1.4312, + "step": 36054 + }, + { + "epoch": 2.84, + "learning_rate": 2.1808212573610595e-06, + "loss": 1.4293, + "step": 36055 + }, + { + "epoch": 2.84, + "learning_rate": 2.1787218350339754e-06, + "loss": 1.3971, + "step": 36056 + }, + { + "epoch": 2.84, + "learning_rate": 2.176623416331774e-06, + "loss": 1.482, + "step": 36057 + }, + { + "epoch": 2.84, + "learning_rate": 2.174526001268745e-06, + "loss": 1.5202, + "step": 36058 + }, + { + "epoch": 2.84, + "learning_rate": 2.1724295898591093e-06, + "loss": 1.4907, + "step": 36059 + }, + { + "epoch": 2.84, + "learning_rate": 2.1703341821170726e-06, + "loss": 1.4252, + "step": 36060 + }, + { + "epoch": 2.84, + "learning_rate": 2.168239778056907e-06, + "loss": 1.448, + "step": 36061 + }, + { + "epoch": 2.84, + "learning_rate": 2.1661463776928013e-06, + "loss": 1.4549, + "step": 36062 + }, + { + "epoch": 2.84, + "learning_rate": 2.1640539810389936e-06, + "loss": 1.4036, + "step": 36063 + }, + { + "epoch": 2.84, + "learning_rate": 2.1619625881096726e-06, + "loss": 1.4447, + "step": 36064 + }, + { + "epoch": 2.84, + "learning_rate": 2.159872198919044e-06, + "loss": 1.4295, + "step": 36065 + }, + { + "epoch": 2.84, + "learning_rate": 2.1577828134812957e-06, + "loss": 1.4406, + "step": 36066 + }, + { + "epoch": 2.84, + "learning_rate": 2.1556944318106175e-06, + "loss": 1.4121, + "step": 36067 + }, + { + "epoch": 2.84, + "learning_rate": 2.15360705392118e-06, + "loss": 1.4007, + "step": 36068 + }, + { + "epoch": 2.84, + "learning_rate": 2.1515206798271732e-06, + "loss": 1.4793, + "step": 36069 + }, + { + "epoch": 2.84, + "learning_rate": 2.149435309542752e-06, + "loss": 1.4679, + "step": 36070 + }, + { + "epoch": 2.84, + "learning_rate": 2.1473509430820546e-06, + "loss": 1.4241, + "step": 36071 + }, + { + "epoch": 2.84, + "learning_rate": 2.14526758045927e-06, + "loss": 1.4263, + "step": 36072 + }, + { + "epoch": 2.84, + "learning_rate": 2.143185221688537e-06, + "loss": 1.4763, + "step": 36073 + }, + { + "epoch": 2.84, + "learning_rate": 2.141103866783944e-06, + "loss": 1.4787, + "step": 36074 + }, + { + "epoch": 2.84, + "learning_rate": 2.1390235157596967e-06, + "loss": 1.4598, + "step": 36075 + }, + { + "epoch": 2.84, + "learning_rate": 2.136944168629867e-06, + "loss": 1.4347, + "step": 36076 + }, + { + "epoch": 2.84, + "learning_rate": 2.1348658254085936e-06, + "loss": 1.4159, + "step": 36077 + }, + { + "epoch": 2.84, + "learning_rate": 2.1327884861099653e-06, + "loss": 1.4343, + "step": 36078 + }, + { + "epoch": 2.84, + "learning_rate": 2.1307121507481207e-06, + "loss": 1.4114, + "step": 36079 + }, + { + "epoch": 2.84, + "learning_rate": 2.1286368193371484e-06, + "loss": 1.4162, + "step": 36080 + }, + { + "epoch": 2.84, + "learning_rate": 2.1265624918911037e-06, + "loss": 1.415, + "step": 36081 + }, + { + "epoch": 2.84, + "learning_rate": 2.124489168424126e-06, + "loss": 1.4567, + "step": 36082 + }, + { + "epoch": 2.84, + "learning_rate": 2.122416848950237e-06, + "loss": 1.4852, + "step": 36083 + }, + { + "epoch": 2.84, + "learning_rate": 2.1203455334835586e-06, + "loss": 1.4287, + "step": 36084 + }, + { + "epoch": 2.84, + "learning_rate": 2.118275222038096e-06, + "loss": 1.4391, + "step": 36085 + }, + { + "epoch": 2.84, + "learning_rate": 2.1162059146279553e-06, + "loss": 1.4492, + "step": 36086 + }, + { + "epoch": 2.84, + "learning_rate": 2.114137611267175e-06, + "loss": 1.3952, + "step": 36087 + }, + { + "epoch": 2.84, + "learning_rate": 2.112070311969777e-06, + "loss": 1.4616, + "step": 36088 + }, + { + "epoch": 2.84, + "learning_rate": 2.1100040167498167e-06, + "loss": 1.4454, + "step": 36089 + }, + { + "epoch": 2.84, + "learning_rate": 2.1079387256213164e-06, + "loss": 1.4619, + "step": 36090 + }, + { + "epoch": 2.84, + "learning_rate": 2.1058744385982817e-06, + "loss": 1.459, + "step": 36091 + }, + { + "epoch": 2.84, + "learning_rate": 2.1038111556947512e-06, + "loss": 1.4874, + "step": 36092 + }, + { + "epoch": 2.84, + "learning_rate": 2.1017488769247304e-06, + "loss": 1.4513, + "step": 36093 + }, + { + "epoch": 2.84, + "learning_rate": 2.099687602302225e-06, + "loss": 1.4259, + "step": 36094 + }, + { + "epoch": 2.84, + "learning_rate": 2.097627331841223e-06, + "loss": 1.4343, + "step": 36095 + }, + { + "epoch": 2.84, + "learning_rate": 2.0955680655556972e-06, + "loss": 1.4278, + "step": 36096 + }, + { + "epoch": 2.84, + "learning_rate": 2.09350980345967e-06, + "loss": 1.4489, + "step": 36097 + }, + { + "epoch": 2.84, + "learning_rate": 2.0914525455670626e-06, + "loss": 1.5032, + "step": 36098 + }, + { + "epoch": 2.84, + "learning_rate": 2.0893962918918817e-06, + "loss": 1.4358, + "step": 36099 + }, + { + "epoch": 2.84, + "learning_rate": 2.087341042448082e-06, + "loss": 1.3875, + "step": 36100 + }, + { + "epoch": 2.84, + "learning_rate": 2.085286797249619e-06, + "loss": 1.4965, + "step": 36101 + }, + { + "epoch": 2.84, + "learning_rate": 2.0832335563103986e-06, + "loss": 1.4633, + "step": 36102 + }, + { + "epoch": 2.84, + "learning_rate": 2.081181319644426e-06, + "loss": 1.4734, + "step": 36103 + }, + { + "epoch": 2.84, + "learning_rate": 2.0791300872655903e-06, + "loss": 1.422, + "step": 36104 + }, + { + "epoch": 2.84, + "learning_rate": 2.0770798591878303e-06, + "loss": 1.4316, + "step": 36105 + }, + { + "epoch": 2.84, + "learning_rate": 2.0750306354250846e-06, + "loss": 1.4552, + "step": 36106 + }, + { + "epoch": 2.84, + "learning_rate": 2.072982415991242e-06, + "loss": 1.4015, + "step": 36107 + }, + { + "epoch": 2.84, + "learning_rate": 2.0709352009001925e-06, + "loss": 1.3916, + "step": 36108 + }, + { + "epoch": 2.84, + "learning_rate": 2.0688889901658735e-06, + "loss": 1.4962, + "step": 36109 + }, + { + "epoch": 2.84, + "learning_rate": 2.0668437838021745e-06, + "loss": 1.4066, + "step": 36110 + }, + { + "epoch": 2.84, + "learning_rate": 2.064799581822968e-06, + "loss": 1.4065, + "step": 36111 + }, + { + "epoch": 2.84, + "learning_rate": 2.0627563842421093e-06, + "loss": 1.4507, + "step": 36112 + }, + { + "epoch": 2.84, + "learning_rate": 2.0607141910735203e-06, + "loss": 1.4771, + "step": 36113 + }, + { + "epoch": 2.84, + "learning_rate": 2.0586730023310404e-06, + "loss": 1.4195, + "step": 36114 + }, + { + "epoch": 2.84, + "learning_rate": 2.0566328180285253e-06, + "loss": 1.4306, + "step": 36115 + }, + { + "epoch": 2.84, + "learning_rate": 2.0545936381798465e-06, + "loss": 1.4711, + "step": 36116 + }, + { + "epoch": 2.84, + "learning_rate": 2.052555462798827e-06, + "loss": 1.441, + "step": 36117 + }, + { + "epoch": 2.84, + "learning_rate": 2.050518291899289e-06, + "loss": 1.4199, + "step": 36118 + }, + { + "epoch": 2.84, + "learning_rate": 2.0484821254951045e-06, + "loss": 1.4745, + "step": 36119 + }, + { + "epoch": 2.84, + "learning_rate": 2.046446963600096e-06, + "loss": 1.4642, + "step": 36120 + }, + { + "epoch": 2.84, + "learning_rate": 2.0444128062280517e-06, + "loss": 1.442, + "step": 36121 + }, + { + "epoch": 2.84, + "learning_rate": 2.0423796533927784e-06, + "loss": 1.4696, + "step": 36122 + }, + { + "epoch": 2.84, + "learning_rate": 2.040347505108114e-06, + "loss": 1.4393, + "step": 36123 + }, + { + "epoch": 2.84, + "learning_rate": 2.038316361387832e-06, + "loss": 1.4199, + "step": 36124 + }, + { + "epoch": 2.84, + "learning_rate": 2.0362862222457366e-06, + "loss": 1.436, + "step": 36125 + }, + { + "epoch": 2.84, + "learning_rate": 2.034257087695601e-06, + "loss": 1.4161, + "step": 36126 + }, + { + "epoch": 2.84, + "learning_rate": 2.0322289577511976e-06, + "loss": 1.4652, + "step": 36127 + }, + { + "epoch": 2.84, + "learning_rate": 2.0302018324263146e-06, + "loss": 1.4142, + "step": 36128 + }, + { + "epoch": 2.84, + "learning_rate": 2.0281757117347088e-06, + "loss": 1.4512, + "step": 36129 + }, + { + "epoch": 2.84, + "learning_rate": 2.0261505956901347e-06, + "loss": 1.4426, + "step": 36130 + }, + { + "epoch": 2.84, + "learning_rate": 2.024126484306332e-06, + "loss": 1.4396, + "step": 36131 + }, + { + "epoch": 2.84, + "learning_rate": 2.0221033775970396e-06, + "loss": 1.4523, + "step": 36132 + }, + { + "epoch": 2.84, + "learning_rate": 2.020081275576013e-06, + "loss": 1.4389, + "step": 36133 + }, + { + "epoch": 2.84, + "learning_rate": 2.018060178256975e-06, + "loss": 1.4533, + "step": 36134 + }, + { + "epoch": 2.84, + "learning_rate": 2.0160400856536476e-06, + "loss": 1.4051, + "step": 36135 + }, + { + "epoch": 2.84, + "learning_rate": 2.014020997779736e-06, + "loss": 1.4227, + "step": 36136 + }, + { + "epoch": 2.84, + "learning_rate": 2.0120029146489638e-06, + "loss": 1.4308, + "step": 36137 + }, + { + "epoch": 2.84, + "learning_rate": 2.0099858362750355e-06, + "loss": 1.4208, + "step": 36138 + }, + { + "epoch": 2.84, + "learning_rate": 2.0079697626716072e-06, + "loss": 1.4397, + "step": 36139 + }, + { + "epoch": 2.84, + "learning_rate": 2.0059546938524186e-06, + "loss": 1.4958, + "step": 36140 + }, + { + "epoch": 2.84, + "learning_rate": 2.0039406298311243e-06, + "loss": 1.4053, + "step": 36141 + }, + { + "epoch": 2.84, + "learning_rate": 2.001927570621398e-06, + "loss": 1.4782, + "step": 36142 + }, + { + "epoch": 2.84, + "learning_rate": 1.999915516236894e-06, + "loss": 1.4585, + "step": 36143 + }, + { + "epoch": 2.84, + "learning_rate": 1.997904466691319e-06, + "loss": 1.4054, + "step": 36144 + }, + { + "epoch": 2.84, + "learning_rate": 1.9958944219982955e-06, + "loss": 1.434, + "step": 36145 + }, + { + "epoch": 2.84, + "learning_rate": 1.993885382171445e-06, + "loss": 1.4571, + "step": 36146 + }, + { + "epoch": 2.84, + "learning_rate": 1.9918773472244743e-06, + "loss": 1.4481, + "step": 36147 + }, + { + "epoch": 2.84, + "learning_rate": 1.989870317170955e-06, + "loss": 1.438, + "step": 36148 + }, + { + "epoch": 2.84, + "learning_rate": 1.9878642920245438e-06, + "loss": 1.469, + "step": 36149 + }, + { + "epoch": 2.84, + "learning_rate": 1.985859271798862e-06, + "loss": 1.4887, + "step": 36150 + }, + { + "epoch": 2.84, + "learning_rate": 1.9838552565074994e-06, + "loss": 1.4183, + "step": 36151 + }, + { + "epoch": 2.84, + "learning_rate": 1.9818522461640786e-06, + "loss": 1.4191, + "step": 36152 + }, + { + "epoch": 2.84, + "learning_rate": 1.9798502407822047e-06, + "loss": 1.4386, + "step": 36153 + }, + { + "epoch": 2.84, + "learning_rate": 1.9778492403754675e-06, + "loss": 1.423, + "step": 36154 + }, + { + "epoch": 2.84, + "learning_rate": 1.975849244957439e-06, + "loss": 1.4449, + "step": 36155 + }, + { + "epoch": 2.84, + "learning_rate": 1.973850254541709e-06, + "loss": 1.4356, + "step": 36156 + }, + { + "epoch": 2.84, + "learning_rate": 1.9718522691418493e-06, + "loss": 1.4791, + "step": 36157 + }, + { + "epoch": 2.84, + "learning_rate": 1.9698552887714327e-06, + "loss": 1.4509, + "step": 36158 + }, + { + "epoch": 2.85, + "learning_rate": 1.967859313443998e-06, + "loss": 1.481, + "step": 36159 + }, + { + "epoch": 2.85, + "learning_rate": 1.965864343173118e-06, + "loss": 1.4153, + "step": 36160 + }, + { + "epoch": 2.85, + "learning_rate": 1.963870377972332e-06, + "loss": 1.3959, + "step": 36161 + }, + { + "epoch": 2.85, + "learning_rate": 1.9618774178551623e-06, + "loss": 1.4241, + "step": 36162 + }, + { + "epoch": 2.85, + "learning_rate": 1.959885462835148e-06, + "loss": 1.4258, + "step": 36163 + }, + { + "epoch": 2.85, + "learning_rate": 1.9578945129258116e-06, + "loss": 1.4487, + "step": 36164 + }, + { + "epoch": 2.85, + "learning_rate": 1.9559045681406924e-06, + "loss": 1.5016, + "step": 36165 + }, + { + "epoch": 2.85, + "learning_rate": 1.9539156284932633e-06, + "loss": 1.431, + "step": 36166 + }, + { + "epoch": 2.85, + "learning_rate": 1.951927693997063e-06, + "loss": 1.4341, + "step": 36167 + }, + { + "epoch": 2.85, + "learning_rate": 1.9499407646655805e-06, + "loss": 1.4003, + "step": 36168 + }, + { + "epoch": 2.85, + "learning_rate": 1.9479548405122723e-06, + "loss": 1.4129, + "step": 36169 + }, + { + "epoch": 2.85, + "learning_rate": 1.9459699215506774e-06, + "loss": 1.4256, + "step": 36170 + }, + { + "epoch": 2.85, + "learning_rate": 1.943986007794218e-06, + "loss": 1.4828, + "step": 36171 + }, + { + "epoch": 2.85, + "learning_rate": 1.942003099256401e-06, + "loss": 1.4404, + "step": 36172 + }, + { + "epoch": 2.85, + "learning_rate": 1.9400211959506805e-06, + "loss": 1.5148, + "step": 36173 + }, + { + "epoch": 2.85, + "learning_rate": 1.938040297890514e-06, + "loss": 1.4478, + "step": 36174 + }, + { + "epoch": 2.85, + "learning_rate": 1.93606040508934e-06, + "loss": 1.4284, + "step": 36175 + }, + { + "epoch": 2.85, + "learning_rate": 1.934081517560615e-06, + "loss": 1.4619, + "step": 36176 + }, + { + "epoch": 2.85, + "learning_rate": 1.932103635317761e-06, + "loss": 1.4533, + "step": 36177 + }, + { + "epoch": 2.85, + "learning_rate": 1.9301267583742173e-06, + "loss": 1.4283, + "step": 36178 + }, + { + "epoch": 2.85, + "learning_rate": 1.9281508867433904e-06, + "loss": 1.4567, + "step": 36179 + }, + { + "epoch": 2.85, + "learning_rate": 1.9261760204387187e-06, + "loss": 1.4847, + "step": 36180 + }, + { + "epoch": 2.85, + "learning_rate": 1.9242021594735922e-06, + "loss": 1.4592, + "step": 36181 + }, + { + "epoch": 2.85, + "learning_rate": 1.9222293038614165e-06, + "loss": 1.4522, + "step": 36182 + }, + { + "epoch": 2.85, + "learning_rate": 1.9202574536155814e-06, + "loss": 1.4631, + "step": 36183 + }, + { + "epoch": 2.85, + "learning_rate": 1.918286608749492e-06, + "loss": 1.4201, + "step": 36184 + }, + { + "epoch": 2.85, + "learning_rate": 1.9163167692765215e-06, + "loss": 1.3976, + "step": 36185 + }, + { + "epoch": 2.85, + "learning_rate": 1.9143479352100256e-06, + "loss": 1.4559, + "step": 36186 + }, + { + "epoch": 2.85, + "learning_rate": 1.9123801065633935e-06, + "loss": 1.4512, + "step": 36187 + }, + { + "epoch": 2.85, + "learning_rate": 1.9104132833499817e-06, + "loss": 1.4829, + "step": 36188 + }, + { + "epoch": 2.85, + "learning_rate": 1.908447465583146e-06, + "loss": 1.4351, + "step": 36189 + }, + { + "epoch": 2.85, + "learning_rate": 1.906482653276209e-06, + "loss": 1.4476, + "step": 36190 + }, + { + "epoch": 2.85, + "learning_rate": 1.9045188464425598e-06, + "loss": 1.4752, + "step": 36191 + }, + { + "epoch": 2.85, + "learning_rate": 1.902556045095488e-06, + "loss": 1.4222, + "step": 36192 + }, + { + "epoch": 2.85, + "learning_rate": 1.9005942492483162e-06, + "loss": 1.4864, + "step": 36193 + }, + { + "epoch": 2.85, + "learning_rate": 1.8986334589144004e-06, + "loss": 1.4642, + "step": 36194 + }, + { + "epoch": 2.85, + "learning_rate": 1.8966736741070298e-06, + "loss": 1.4577, + "step": 36195 + }, + { + "epoch": 2.85, + "learning_rate": 1.8947148948395275e-06, + "loss": 1.5067, + "step": 36196 + }, + { + "epoch": 2.85, + "learning_rate": 1.8927571211251657e-06, + "loss": 1.4875, + "step": 36197 + }, + { + "epoch": 2.85, + "learning_rate": 1.8908003529772509e-06, + "loss": 1.4402, + "step": 36198 + }, + { + "epoch": 2.85, + "learning_rate": 1.888844590409072e-06, + "loss": 1.4748, + "step": 36199 + }, + { + "epoch": 2.85, + "learning_rate": 1.8868898334339021e-06, + "loss": 1.4312, + "step": 36200 + }, + { + "epoch": 2.85, + "learning_rate": 1.884936082065014e-06, + "loss": 1.4433, + "step": 36201 + }, + { + "epoch": 2.85, + "learning_rate": 1.8829833363156633e-06, + "loss": 1.4393, + "step": 36202 + }, + { + "epoch": 2.85, + "learning_rate": 1.8810315961991395e-06, + "loss": 1.4231, + "step": 36203 + }, + { + "epoch": 2.85, + "learning_rate": 1.879080861728649e-06, + "loss": 1.4374, + "step": 36204 + }, + { + "epoch": 2.85, + "learning_rate": 1.877131132917481e-06, + "loss": 1.4501, + "step": 36205 + }, + { + "epoch": 2.85, + "learning_rate": 1.8751824097788414e-06, + "loss": 1.4568, + "step": 36206 + }, + { + "epoch": 2.85, + "learning_rate": 1.87323469232597e-06, + "loss": 1.4235, + "step": 36207 + }, + { + "epoch": 2.85, + "learning_rate": 1.8712879805720892e-06, + "loss": 1.4482, + "step": 36208 + }, + { + "epoch": 2.85, + "learning_rate": 1.8693422745304388e-06, + "loss": 1.4424, + "step": 36209 + }, + { + "epoch": 2.85, + "learning_rate": 1.8673975742141911e-06, + "loss": 1.4277, + "step": 36210 + }, + { + "epoch": 2.85, + "learning_rate": 1.8654538796365692e-06, + "loss": 1.4493, + "step": 36211 + }, + { + "epoch": 2.85, + "learning_rate": 1.863511190810779e-06, + "loss": 1.4324, + "step": 36212 + }, + { + "epoch": 2.85, + "learning_rate": 1.8615695077499936e-06, + "loss": 1.4882, + "step": 36213 + }, + { + "epoch": 2.85, + "learning_rate": 1.8596288304673857e-06, + "loss": 1.4453, + "step": 36214 + }, + { + "epoch": 2.85, + "learning_rate": 1.857689158976161e-06, + "loss": 1.4439, + "step": 36215 + }, + { + "epoch": 2.85, + "learning_rate": 1.8557504932894762e-06, + "loss": 1.453, + "step": 36216 + }, + { + "epoch": 2.85, + "learning_rate": 1.853812833420487e-06, + "loss": 1.4722, + "step": 36217 + }, + { + "epoch": 2.85, + "learning_rate": 1.85187617938235e-06, + "loss": 1.4649, + "step": 36218 + }, + { + "epoch": 2.85, + "learning_rate": 1.8499405311882376e-06, + "loss": 1.4762, + "step": 36219 + }, + { + "epoch": 2.85, + "learning_rate": 1.8480058888512561e-06, + "loss": 1.4191, + "step": 36220 + }, + { + "epoch": 2.85, + "learning_rate": 1.8460722523845618e-06, + "loss": 1.4485, + "step": 36221 + }, + { + "epoch": 2.85, + "learning_rate": 1.844139621801294e-06, + "loss": 1.4483, + "step": 36222 + }, + { + "epoch": 2.85, + "learning_rate": 1.842207997114542e-06, + "loss": 1.4777, + "step": 36223 + }, + { + "epoch": 2.85, + "learning_rate": 1.8402773783374292e-06, + "loss": 1.431, + "step": 36224 + }, + { + "epoch": 2.85, + "learning_rate": 1.8383477654830946e-06, + "loss": 1.428, + "step": 36225 + }, + { + "epoch": 2.85, + "learning_rate": 1.8364191585646116e-06, + "loss": 1.4206, + "step": 36226 + }, + { + "epoch": 2.85, + "learning_rate": 1.8344915575950692e-06, + "loss": 1.4828, + "step": 36227 + }, + { + "epoch": 2.85, + "learning_rate": 1.8325649625875738e-06, + "loss": 1.4249, + "step": 36228 + }, + { + "epoch": 2.85, + "learning_rate": 1.8306393735551817e-06, + "loss": 1.4746, + "step": 36229 + }, + { + "epoch": 2.85, + "learning_rate": 1.828714790510999e-06, + "loss": 1.4162, + "step": 36230 + }, + { + "epoch": 2.85, + "learning_rate": 1.8267912134680651e-06, + "loss": 1.4459, + "step": 36231 + }, + { + "epoch": 2.85, + "learning_rate": 1.8248686424394532e-06, + "loss": 1.3936, + "step": 36232 + }, + { + "epoch": 2.85, + "learning_rate": 1.8229470774382194e-06, + "loss": 1.423, + "step": 36233 + }, + { + "epoch": 2.85, + "learning_rate": 1.8210265184773864e-06, + "loss": 1.4493, + "step": 36234 + }, + { + "epoch": 2.85, + "learning_rate": 1.8191069655700274e-06, + "loss": 1.4564, + "step": 36235 + }, + { + "epoch": 2.85, + "learning_rate": 1.8171884187291485e-06, + "loss": 1.4448, + "step": 36236 + }, + { + "epoch": 2.85, + "learning_rate": 1.815270877967806e-06, + "loss": 1.4887, + "step": 36237 + }, + { + "epoch": 2.85, + "learning_rate": 1.8133543432989727e-06, + "loss": 1.4617, + "step": 36238 + }, + { + "epoch": 2.85, + "learning_rate": 1.811438814735705e-06, + "loss": 1.4424, + "step": 36239 + }, + { + "epoch": 2.85, + "learning_rate": 1.8095242922909925e-06, + "loss": 1.3788, + "step": 36240 + }, + { + "epoch": 2.85, + "learning_rate": 1.807610775977808e-06, + "loss": 1.4387, + "step": 36241 + }, + { + "epoch": 2.85, + "learning_rate": 1.8056982658091912e-06, + "loss": 1.4305, + "step": 36242 + }, + { + "epoch": 2.85, + "learning_rate": 1.8037867617980983e-06, + "loss": 1.3969, + "step": 36243 + }, + { + "epoch": 2.85, + "learning_rate": 1.8018762639575024e-06, + "loss": 1.4413, + "step": 36244 + }, + { + "epoch": 2.85, + "learning_rate": 1.799966772300393e-06, + "loss": 1.4131, + "step": 36245 + }, + { + "epoch": 2.85, + "learning_rate": 1.7980582868397265e-06, + "loss": 1.4884, + "step": 36246 + }, + { + "epoch": 2.85, + "learning_rate": 1.796150807588459e-06, + "loss": 1.4372, + "step": 36247 + }, + { + "epoch": 2.85, + "learning_rate": 1.794244334559547e-06, + "loss": 1.4093, + "step": 36248 + }, + { + "epoch": 2.85, + "learning_rate": 1.7923388677659135e-06, + "loss": 1.4238, + "step": 36249 + }, + { + "epoch": 2.85, + "learning_rate": 1.7904344072205145e-06, + "loss": 1.441, + "step": 36250 + }, + { + "epoch": 2.85, + "learning_rate": 1.7885309529362735e-06, + "loss": 1.4193, + "step": 36251 + }, + { + "epoch": 2.85, + "learning_rate": 1.7866285049261298e-06, + "loss": 1.4382, + "step": 36252 + }, + { + "epoch": 2.85, + "learning_rate": 1.7847270632029898e-06, + "loss": 1.4151, + "step": 36253 + }, + { + "epoch": 2.85, + "learning_rate": 1.7828266277797597e-06, + "loss": 1.4499, + "step": 36254 + }, + { + "epoch": 2.85, + "learning_rate": 1.7809271986693296e-06, + "loss": 1.4616, + "step": 36255 + }, + { + "epoch": 2.85, + "learning_rate": 1.7790287758846223e-06, + "loss": 1.4244, + "step": 36256 + }, + { + "epoch": 2.85, + "learning_rate": 1.7771313594385272e-06, + "loss": 1.4414, + "step": 36257 + }, + { + "epoch": 2.85, + "learning_rate": 1.7752349493438844e-06, + "loss": 1.4493, + "step": 36258 + }, + { + "epoch": 2.85, + "learning_rate": 1.7733395456136167e-06, + "loss": 1.4658, + "step": 36259 + }, + { + "epoch": 2.85, + "learning_rate": 1.7714451482605808e-06, + "loss": 1.4165, + "step": 36260 + }, + { + "epoch": 2.85, + "learning_rate": 1.7695517572976158e-06, + "loss": 1.4293, + "step": 36261 + }, + { + "epoch": 2.85, + "learning_rate": 1.767659372737612e-06, + "loss": 1.4755, + "step": 36262 + }, + { + "epoch": 2.85, + "learning_rate": 1.7657679945933922e-06, + "loss": 1.404, + "step": 36263 + }, + { + "epoch": 2.85, + "learning_rate": 1.7638776228777962e-06, + "loss": 1.4193, + "step": 36264 + }, + { + "epoch": 2.85, + "learning_rate": 1.7619882576036638e-06, + "loss": 1.4477, + "step": 36265 + }, + { + "epoch": 2.85, + "learning_rate": 1.7600998987838345e-06, + "loss": 1.472, + "step": 36266 + }, + { + "epoch": 2.85, + "learning_rate": 1.7582125464311314e-06, + "loss": 1.4645, + "step": 36267 + }, + { + "epoch": 2.85, + "learning_rate": 1.7563262005583444e-06, + "loss": 1.4309, + "step": 36268 + }, + { + "epoch": 2.85, + "learning_rate": 1.7544408611783133e-06, + "loss": 1.4263, + "step": 36269 + }, + { + "epoch": 2.85, + "learning_rate": 1.7525565283038113e-06, + "loss": 1.448, + "step": 36270 + }, + { + "epoch": 2.85, + "learning_rate": 1.7506732019476278e-06, + "loss": 1.45, + "step": 36271 + }, + { + "epoch": 2.85, + "learning_rate": 1.7487908821225693e-06, + "loss": 1.439, + "step": 36272 + }, + { + "epoch": 2.85, + "learning_rate": 1.746909568841426e-06, + "loss": 1.4209, + "step": 36273 + }, + { + "epoch": 2.85, + "learning_rate": 1.745029262116937e-06, + "loss": 1.4746, + "step": 36274 + }, + { + "epoch": 2.85, + "learning_rate": 1.7431499619618927e-06, + "loss": 1.4234, + "step": 36275 + }, + { + "epoch": 2.85, + "learning_rate": 1.7412716683890326e-06, + "loss": 1.4847, + "step": 36276 + }, + { + "epoch": 2.85, + "learning_rate": 1.7393943814111467e-06, + "loss": 1.4237, + "step": 36277 + }, + { + "epoch": 2.85, + "learning_rate": 1.7375181010409244e-06, + "loss": 1.4755, + "step": 36278 + }, + { + "epoch": 2.85, + "learning_rate": 1.735642827291156e-06, + "loss": 1.4816, + "step": 36279 + }, + { + "epoch": 2.85, + "learning_rate": 1.7337685601745478e-06, + "loss": 1.5291, + "step": 36280 + }, + { + "epoch": 2.85, + "learning_rate": 1.7318952997038394e-06, + "loss": 1.4367, + "step": 36281 + }, + { + "epoch": 2.85, + "learning_rate": 1.7300230458917207e-06, + "loss": 1.4734, + "step": 36282 + }, + { + "epoch": 2.85, + "learning_rate": 1.7281517987509486e-06, + "loss": 1.4532, + "step": 36283 + }, + { + "epoch": 2.85, + "learning_rate": 1.7262815582941791e-06, + "loss": 1.3819, + "step": 36284 + }, + { + "epoch": 2.85, + "learning_rate": 1.7244123245341523e-06, + "loss": 1.4545, + "step": 36285 + }, + { + "epoch": 2.86, + "learning_rate": 1.7225440974835247e-06, + "loss": 1.4163, + "step": 36286 + }, + { + "epoch": 2.86, + "learning_rate": 1.7206768771550195e-06, + "loss": 1.409, + "step": 36287 + }, + { + "epoch": 2.86, + "learning_rate": 1.7188106635612597e-06, + "loss": 1.4301, + "step": 36288 + }, + { + "epoch": 2.86, + "learning_rate": 1.7169454567149688e-06, + "loss": 1.4147, + "step": 36289 + }, + { + "epoch": 2.86, + "learning_rate": 1.7150812566287863e-06, + "loss": 1.4397, + "step": 36290 + }, + { + "epoch": 2.86, + "learning_rate": 1.7132180633153859e-06, + "loss": 1.4084, + "step": 36291 + }, + { + "epoch": 2.86, + "learning_rate": 1.7113558767873735e-06, + "loss": 1.4295, + "step": 36292 + }, + { + "epoch": 2.86, + "learning_rate": 1.7094946970574397e-06, + "loss": 1.4847, + "step": 36293 + }, + { + "epoch": 2.86, + "learning_rate": 1.7076345241382072e-06, + "loss": 1.4469, + "step": 36294 + }, + { + "epoch": 2.86, + "learning_rate": 1.7057753580422828e-06, + "loss": 1.4233, + "step": 36295 + }, + { + "epoch": 2.86, + "learning_rate": 1.703917198782323e-06, + "loss": 1.4349, + "step": 36296 + }, + { + "epoch": 2.86, + "learning_rate": 1.7020600463709177e-06, + "loss": 1.424, + "step": 36297 + }, + { + "epoch": 2.86, + "learning_rate": 1.700203900820707e-06, + "loss": 1.5193, + "step": 36298 + }, + { + "epoch": 2.86, + "learning_rate": 1.6983487621442471e-06, + "loss": 1.4529, + "step": 36299 + }, + { + "epoch": 2.86, + "learning_rate": 1.6964946303541781e-06, + "loss": 1.4614, + "step": 36300 + }, + { + "epoch": 2.86, + "learning_rate": 1.6946415054630735e-06, + "loss": 1.4557, + "step": 36301 + }, + { + "epoch": 2.86, + "learning_rate": 1.6927893874835064e-06, + "loss": 1.5279, + "step": 36302 + }, + { + "epoch": 2.86, + "learning_rate": 1.69093827642805e-06, + "loss": 1.4201, + "step": 36303 + }, + { + "epoch": 2.86, + "learning_rate": 1.6890881723092942e-06, + "loss": 1.4633, + "step": 36304 + }, + { + "epoch": 2.86, + "learning_rate": 1.6872390751397624e-06, + "loss": 1.4341, + "step": 36305 + }, + { + "epoch": 2.86, + "learning_rate": 1.6853909849320447e-06, + "loss": 1.5004, + "step": 36306 + }, + { + "epoch": 2.86, + "learning_rate": 1.6835439016986806e-06, + "loss": 1.3987, + "step": 36307 + }, + { + "epoch": 2.86, + "learning_rate": 1.681697825452194e-06, + "loss": 1.435, + "step": 36308 + }, + { + "epoch": 2.86, + "learning_rate": 1.6798527562051244e-06, + "loss": 1.4309, + "step": 36309 + }, + { + "epoch": 2.86, + "learning_rate": 1.6780086939700289e-06, + "loss": 1.4849, + "step": 36310 + }, + { + "epoch": 2.86, + "learning_rate": 1.6761656387593968e-06, + "loss": 1.4571, + "step": 36311 + }, + { + "epoch": 2.86, + "learning_rate": 1.6743235905857356e-06, + "loss": 1.5078, + "step": 36312 + }, + { + "epoch": 2.86, + "learning_rate": 1.6724825494615512e-06, + "loss": 1.4416, + "step": 36313 + }, + { + "epoch": 2.86, + "learning_rate": 1.6706425153993842e-06, + "loss": 1.4097, + "step": 36314 + }, + { + "epoch": 2.86, + "learning_rate": 1.6688034884116908e-06, + "loss": 1.4359, + "step": 36315 + }, + { + "epoch": 2.86, + "learning_rate": 1.6669654685109612e-06, + "loss": 1.4894, + "step": 36316 + }, + { + "epoch": 2.86, + "learning_rate": 1.6651284557096856e-06, + "loss": 1.4722, + "step": 36317 + }, + { + "epoch": 2.86, + "learning_rate": 1.663292450020337e-06, + "loss": 1.3667, + "step": 36318 + }, + { + "epoch": 2.86, + "learning_rate": 1.6614574514553558e-06, + "loss": 1.4589, + "step": 36319 + }, + { + "epoch": 2.86, + "learning_rate": 1.6596234600272318e-06, + "loss": 1.4863, + "step": 36320 + }, + { + "epoch": 2.86, + "learning_rate": 1.6577904757484052e-06, + "loss": 1.4397, + "step": 36321 + }, + { + "epoch": 2.86, + "learning_rate": 1.655958498631299e-06, + "loss": 1.3791, + "step": 36322 + }, + { + "epoch": 2.86, + "learning_rate": 1.6541275286883872e-06, + "loss": 1.4358, + "step": 36323 + }, + { + "epoch": 2.86, + "learning_rate": 1.6522975659320924e-06, + "loss": 1.45, + "step": 36324 + }, + { + "epoch": 2.86, + "learning_rate": 1.6504686103748222e-06, + "loss": 1.4369, + "step": 36325 + }, + { + "epoch": 2.86, + "learning_rate": 1.6486406620289993e-06, + "loss": 1.4315, + "step": 36326 + }, + { + "epoch": 2.86, + "learning_rate": 1.6468137209070476e-06, + "loss": 1.4162, + "step": 36327 + }, + { + "epoch": 2.86, + "learning_rate": 1.6449877870213569e-06, + "loss": 1.4438, + "step": 36328 + }, + { + "epoch": 2.86, + "learning_rate": 1.643162860384334e-06, + "loss": 1.4743, + "step": 36329 + }, + { + "epoch": 2.86, + "learning_rate": 1.6413389410083689e-06, + "loss": 1.4419, + "step": 36330 + }, + { + "epoch": 2.86, + "learning_rate": 1.639516028905835e-06, + "loss": 1.4428, + "step": 36331 + }, + { + "epoch": 2.86, + "learning_rate": 1.6376941240891228e-06, + "loss": 1.4706, + "step": 36332 + }, + { + "epoch": 2.86, + "learning_rate": 1.6358732265705721e-06, + "loss": 1.4187, + "step": 36333 + }, + { + "epoch": 2.86, + "learning_rate": 1.6340533363625897e-06, + "loss": 1.3821, + "step": 36334 + }, + { + "epoch": 2.86, + "learning_rate": 1.6322344534775156e-06, + "loss": 1.3741, + "step": 36335 + }, + { + "epoch": 2.86, + "learning_rate": 1.6304165779276734e-06, + "loss": 1.4301, + "step": 36336 + }, + { + "epoch": 2.86, + "learning_rate": 1.6285997097254366e-06, + "loss": 1.4467, + "step": 36337 + }, + { + "epoch": 2.86, + "learning_rate": 1.6267838488831287e-06, + "loss": 1.4267, + "step": 36338 + }, + { + "epoch": 2.86, + "learning_rate": 1.624968995413073e-06, + "loss": 1.4933, + "step": 36339 + }, + { + "epoch": 2.86, + "learning_rate": 1.6231551493276095e-06, + "loss": 1.4811, + "step": 36340 + }, + { + "epoch": 2.86, + "learning_rate": 1.6213423106390455e-06, + "loss": 1.4187, + "step": 36341 + }, + { + "epoch": 2.86, + "learning_rate": 1.6195304793596708e-06, + "loss": 1.4301, + "step": 36342 + }, + { + "epoch": 2.86, + "learning_rate": 1.617719655501809e-06, + "loss": 1.428, + "step": 36343 + }, + { + "epoch": 2.86, + "learning_rate": 1.6159098390777336e-06, + "loss": 1.4303, + "step": 36344 + }, + { + "epoch": 2.86, + "learning_rate": 1.6141010300997515e-06, + "loss": 1.4593, + "step": 36345 + }, + { + "epoch": 2.86, + "learning_rate": 1.612293228580136e-06, + "loss": 1.4583, + "step": 36346 + }, + { + "epoch": 2.86, + "learning_rate": 1.6104864345311773e-06, + "loss": 1.4452, + "step": 36347 + }, + { + "epoch": 2.86, + "learning_rate": 1.608680647965116e-06, + "loss": 1.4969, + "step": 36348 + }, + { + "epoch": 2.86, + "learning_rate": 1.6068758688942251e-06, + "loss": 1.4095, + "step": 36349 + }, + { + "epoch": 2.86, + "learning_rate": 1.6050720973307617e-06, + "loss": 1.4479, + "step": 36350 + }, + { + "epoch": 2.86, + "learning_rate": 1.603269333286966e-06, + "loss": 1.4696, + "step": 36351 + }, + { + "epoch": 2.86, + "learning_rate": 1.6014675767750785e-06, + "loss": 1.4378, + "step": 36352 + }, + { + "epoch": 2.86, + "learning_rate": 1.599666827807322e-06, + "loss": 1.4399, + "step": 36353 + }, + { + "epoch": 2.86, + "learning_rate": 1.5978670863959543e-06, + "loss": 1.4323, + "step": 36354 + }, + { + "epoch": 2.86, + "learning_rate": 1.5960683525531648e-06, + "loss": 1.3648, + "step": 36355 + }, + { + "epoch": 2.86, + "learning_rate": 1.594270626291161e-06, + "loss": 1.469, + "step": 36356 + }, + { + "epoch": 2.86, + "learning_rate": 1.5924739076221827e-06, + "loss": 1.3986, + "step": 36357 + }, + { + "epoch": 2.86, + "learning_rate": 1.5906781965584037e-06, + "loss": 1.4699, + "step": 36358 + }, + { + "epoch": 2.86, + "learning_rate": 1.5888834931119975e-06, + "loss": 1.4816, + "step": 36359 + }, + { + "epoch": 2.86, + "learning_rate": 1.587089797295188e-06, + "loss": 1.4079, + "step": 36360 + }, + { + "epoch": 2.86, + "learning_rate": 1.5852971091201483e-06, + "loss": 1.4502, + "step": 36361 + }, + { + "epoch": 2.86, + "learning_rate": 1.5835054285990356e-06, + "loss": 1.478, + "step": 36362 + }, + { + "epoch": 2.86, + "learning_rate": 1.581714755744007e-06, + "loss": 1.4589, + "step": 36363 + }, + { + "epoch": 2.86, + "learning_rate": 1.5799250905672523e-06, + "loss": 1.4265, + "step": 36364 + }, + { + "epoch": 2.86, + "learning_rate": 1.5781364330808788e-06, + "loss": 1.4601, + "step": 36365 + }, + { + "epoch": 2.86, + "learning_rate": 1.5763487832970768e-06, + "loss": 1.4293, + "step": 36366 + }, + { + "epoch": 2.86, + "learning_rate": 1.5745621412279363e-06, + "loss": 1.4079, + "step": 36367 + }, + { + "epoch": 2.86, + "learning_rate": 1.5727765068856146e-06, + "loss": 1.4394, + "step": 36368 + }, + { + "epoch": 2.86, + "learning_rate": 1.5709918802822518e-06, + "loss": 1.4806, + "step": 36369 + }, + { + "epoch": 2.86, + "learning_rate": 1.5692082614299217e-06, + "loss": 1.4364, + "step": 36370 + }, + { + "epoch": 2.86, + "learning_rate": 1.5674256503407644e-06, + "loss": 1.4376, + "step": 36371 + }, + { + "epoch": 2.86, + "learning_rate": 1.5656440470268873e-06, + "loss": 1.43, + "step": 36372 + }, + { + "epoch": 2.86, + "learning_rate": 1.5638634515003467e-06, + "loss": 1.4799, + "step": 36373 + }, + { + "epoch": 2.86, + "learning_rate": 1.5620838637732835e-06, + "loss": 1.4708, + "step": 36374 + }, + { + "epoch": 2.86, + "learning_rate": 1.5603052838577379e-06, + "loss": 1.4148, + "step": 36375 + }, + { + "epoch": 2.86, + "learning_rate": 1.558527711765817e-06, + "loss": 1.4476, + "step": 36376 + }, + { + "epoch": 2.86, + "learning_rate": 1.5567511475095606e-06, + "loss": 1.4067, + "step": 36377 + }, + { + "epoch": 2.86, + "learning_rate": 1.5549755911010597e-06, + "loss": 1.4552, + "step": 36378 + }, + { + "epoch": 2.86, + "learning_rate": 1.5532010425523544e-06, + "loss": 1.4145, + "step": 36379 + }, + { + "epoch": 2.86, + "learning_rate": 1.5514275018755017e-06, + "loss": 1.4129, + "step": 36380 + }, + { + "epoch": 2.86, + "learning_rate": 1.5496549690825256e-06, + "loss": 1.4115, + "step": 36381 + }, + { + "epoch": 2.86, + "learning_rate": 1.547883444185466e-06, + "loss": 1.5016, + "step": 36382 + }, + { + "epoch": 2.86, + "learning_rate": 1.5461129271963635e-06, + "loss": 1.4242, + "step": 36383 + }, + { + "epoch": 2.86, + "learning_rate": 1.5443434181272251e-06, + "loss": 1.4274, + "step": 36384 + }, + { + "epoch": 2.86, + "learning_rate": 1.5425749169900914e-06, + "loss": 1.4275, + "step": 36385 + }, + { + "epoch": 2.86, + "learning_rate": 1.5408074237969192e-06, + "loss": 1.4266, + "step": 36386 + }, + { + "epoch": 2.86, + "learning_rate": 1.539040938559749e-06, + "loss": 1.447, + "step": 36387 + }, + { + "epoch": 2.86, + "learning_rate": 1.5372754612905714e-06, + "loss": 1.3724, + "step": 36388 + }, + { + "epoch": 2.86, + "learning_rate": 1.5355109920013597e-06, + "loss": 1.412, + "step": 36389 + }, + { + "epoch": 2.86, + "learning_rate": 1.5337475307040882e-06, + "loss": 1.4743, + "step": 36390 + }, + { + "epoch": 2.86, + "learning_rate": 1.5319850774107467e-06, + "loss": 1.5154, + "step": 36391 + }, + { + "epoch": 2.86, + "learning_rate": 1.5302236321332929e-06, + "loss": 1.4373, + "step": 36392 + }, + { + "epoch": 2.86, + "learning_rate": 1.5284631948837001e-06, + "loss": 1.4627, + "step": 36393 + }, + { + "epoch": 2.86, + "learning_rate": 1.5267037656738924e-06, + "loss": 1.4341, + "step": 36394 + }, + { + "epoch": 2.86, + "learning_rate": 1.5249453445158432e-06, + "loss": 1.4582, + "step": 36395 + }, + { + "epoch": 2.86, + "learning_rate": 1.5231879314214934e-06, + "loss": 1.4172, + "step": 36396 + }, + { + "epoch": 2.86, + "learning_rate": 1.5214315264027332e-06, + "loss": 1.4559, + "step": 36397 + }, + { + "epoch": 2.86, + "learning_rate": 1.5196761294715364e-06, + "loss": 1.4677, + "step": 36398 + }, + { + "epoch": 2.86, + "learning_rate": 1.5179217406397936e-06, + "loss": 1.439, + "step": 36399 + }, + { + "epoch": 2.86, + "learning_rate": 1.5161683599194118e-06, + "loss": 1.4213, + "step": 36400 + }, + { + "epoch": 2.86, + "learning_rate": 1.514415987322315e-06, + "loss": 1.4819, + "step": 36401 + }, + { + "epoch": 2.86, + "learning_rate": 1.5126646228603933e-06, + "loss": 1.4029, + "step": 36402 + }, + { + "epoch": 2.86, + "learning_rate": 1.5109142665455543e-06, + "loss": 1.4603, + "step": 36403 + }, + { + "epoch": 2.86, + "learning_rate": 1.5091649183896382e-06, + "loss": 1.4387, + "step": 36404 + }, + { + "epoch": 2.86, + "learning_rate": 1.5074165784045522e-06, + "loss": 1.4392, + "step": 36405 + }, + { + "epoch": 2.86, + "learning_rate": 1.5056692466021702e-06, + "loss": 1.3748, + "step": 36406 + }, + { + "epoch": 2.86, + "learning_rate": 1.5039229229943494e-06, + "loss": 1.462, + "step": 36407 + }, + { + "epoch": 2.86, + "learning_rate": 1.5021776075929304e-06, + "loss": 1.4178, + "step": 36408 + }, + { + "epoch": 2.86, + "learning_rate": 1.5004333004097869e-06, + "loss": 1.4744, + "step": 36409 + }, + { + "epoch": 2.86, + "learning_rate": 1.4986900014567593e-06, + "loss": 1.4534, + "step": 36410 + }, + { + "epoch": 2.86, + "learning_rate": 1.4969477107456718e-06, + "loss": 1.478, + "step": 36411 + }, + { + "epoch": 2.86, + "learning_rate": 1.4952064282883647e-06, + "loss": 1.4646, + "step": 36412 + }, + { + "epoch": 2.87, + "learning_rate": 1.4934661540966452e-06, + "loss": 1.4699, + "step": 36413 + }, + { + "epoch": 2.87, + "learning_rate": 1.4917268881823374e-06, + "loss": 1.4567, + "step": 36414 + }, + { + "epoch": 2.87, + "learning_rate": 1.4899886305572483e-06, + "loss": 1.4923, + "step": 36415 + }, + { + "epoch": 2.87, + "learning_rate": 1.488251381233202e-06, + "loss": 1.4158, + "step": 36416 + }, + { + "epoch": 2.87, + "learning_rate": 1.4865151402219389e-06, + "loss": 1.429, + "step": 36417 + }, + { + "epoch": 2.87, + "learning_rate": 1.4847799075353162e-06, + "loss": 1.413, + "step": 36418 + }, + { + "epoch": 2.87, + "learning_rate": 1.483045683185058e-06, + "loss": 1.4554, + "step": 36419 + }, + { + "epoch": 2.87, + "learning_rate": 1.4813124671829713e-06, + "loss": 1.4608, + "step": 36420 + }, + { + "epoch": 2.87, + "learning_rate": 1.4795802595408134e-06, + "loss": 1.4499, + "step": 36421 + }, + { + "epoch": 2.87, + "learning_rate": 1.477849060270342e-06, + "loss": 1.4658, + "step": 36422 + }, + { + "epoch": 2.87, + "learning_rate": 1.4761188693833136e-06, + "loss": 1.4534, + "step": 36423 + }, + { + "epoch": 2.87, + "learning_rate": 1.4743896868914694e-06, + "loss": 1.473, + "step": 36424 + }, + { + "epoch": 2.87, + "learning_rate": 1.4726615128065666e-06, + "loss": 1.4523, + "step": 36425 + }, + { + "epoch": 2.87, + "learning_rate": 1.470934347140329e-06, + "loss": 1.4234, + "step": 36426 + }, + { + "epoch": 2.87, + "learning_rate": 1.4692081899044804e-06, + "loss": 1.4255, + "step": 36427 + }, + { + "epoch": 2.87, + "learning_rate": 1.4674830411107285e-06, + "loss": 1.3814, + "step": 36428 + }, + { + "epoch": 2.87, + "learning_rate": 1.4657589007708137e-06, + "loss": 1.4703, + "step": 36429 + }, + { + "epoch": 2.87, + "learning_rate": 1.4640357688964266e-06, + "loss": 1.4267, + "step": 36430 + }, + { + "epoch": 2.87, + "learning_rate": 1.462313645499258e-06, + "loss": 1.4399, + "step": 36431 + }, + { + "epoch": 2.87, + "learning_rate": 1.4605925305910315e-06, + "loss": 1.4463, + "step": 36432 + }, + { + "epoch": 2.87, + "learning_rate": 1.4588724241833882e-06, + "loss": 1.4795, + "step": 36433 + }, + { + "epoch": 2.87, + "learning_rate": 1.4571533262880353e-06, + "loss": 1.4899, + "step": 36434 + }, + { + "epoch": 2.87, + "learning_rate": 1.4554352369166466e-06, + "loss": 1.4357, + "step": 36435 + }, + { + "epoch": 2.87, + "learning_rate": 1.4537181560808797e-06, + "loss": 1.4459, + "step": 36436 + }, + { + "epoch": 2.87, + "learning_rate": 1.4520020837923753e-06, + "loss": 1.4449, + "step": 36437 + }, + { + "epoch": 2.87, + "learning_rate": 1.450287020062807e-06, + "loss": 1.4104, + "step": 36438 + }, + { + "epoch": 2.87, + "learning_rate": 1.4485729649038324e-06, + "loss": 1.4178, + "step": 36439 + }, + { + "epoch": 2.87, + "learning_rate": 1.446859918327059e-06, + "loss": 1.4225, + "step": 36440 + }, + { + "epoch": 2.87, + "learning_rate": 1.4451478803441107e-06, + "loss": 1.4749, + "step": 36441 + }, + { + "epoch": 2.87, + "learning_rate": 1.4434368509666449e-06, + "loss": 1.4201, + "step": 36442 + }, + { + "epoch": 2.87, + "learning_rate": 1.441726830206269e-06, + "loss": 1.4132, + "step": 36443 + }, + { + "epoch": 2.87, + "learning_rate": 1.4400178180745902e-06, + "loss": 1.4294, + "step": 36444 + }, + { + "epoch": 2.87, + "learning_rate": 1.438309814583183e-06, + "loss": 1.438, + "step": 36445 + }, + { + "epoch": 2.87, + "learning_rate": 1.4366028197436874e-06, + "loss": 1.4759, + "step": 36446 + }, + { + "epoch": 2.87, + "learning_rate": 1.434896833567678e-06, + "loss": 1.4343, + "step": 36447 + }, + { + "epoch": 2.87, + "learning_rate": 1.433191856066712e-06, + "loss": 1.4634, + "step": 36448 + }, + { + "epoch": 2.87, + "learning_rate": 1.4314878872524139e-06, + "loss": 1.4435, + "step": 36449 + }, + { + "epoch": 2.87, + "learning_rate": 1.4297849271363072e-06, + "loss": 1.4412, + "step": 36450 + }, + { + "epoch": 2.87, + "learning_rate": 1.4280829757299828e-06, + "loss": 1.4143, + "step": 36451 + }, + { + "epoch": 2.87, + "learning_rate": 1.4263820330449816e-06, + "loss": 1.4675, + "step": 36452 + }, + { + "epoch": 2.87, + "learning_rate": 1.424682099092861e-06, + "loss": 1.4579, + "step": 36453 + }, + { + "epoch": 2.87, + "learning_rate": 1.422983173885145e-06, + "loss": 1.4756, + "step": 36454 + }, + { + "epoch": 2.87, + "learning_rate": 1.421285257433391e-06, + "loss": 1.4642, + "step": 36455 + }, + { + "epoch": 2.87, + "learning_rate": 1.4195883497491235e-06, + "loss": 1.4418, + "step": 36456 + }, + { + "epoch": 2.87, + "learning_rate": 1.417892450843866e-06, + "loss": 1.4621, + "step": 36457 + }, + { + "epoch": 2.87, + "learning_rate": 1.4161975607290933e-06, + "loss": 1.468, + "step": 36458 + }, + { + "epoch": 2.87, + "learning_rate": 1.4145036794163623e-06, + "loss": 1.4481, + "step": 36459 + }, + { + "epoch": 2.87, + "learning_rate": 1.412810806917164e-06, + "loss": 1.4426, + "step": 36460 + }, + { + "epoch": 2.87, + "learning_rate": 1.4111189432429726e-06, + "loss": 1.4334, + "step": 36461 + }, + { + "epoch": 2.87, + "learning_rate": 1.4094280884052788e-06, + "loss": 1.4744, + "step": 36462 + }, + { + "epoch": 2.87, + "learning_rate": 1.4077382424155903e-06, + "loss": 1.4123, + "step": 36463 + }, + { + "epoch": 2.87, + "learning_rate": 1.4060494052853478e-06, + "loss": 1.44, + "step": 36464 + }, + { + "epoch": 2.87, + "learning_rate": 1.4043615770260252e-06, + "loss": 1.3995, + "step": 36465 + }, + { + "epoch": 2.87, + "learning_rate": 1.4026747576490804e-06, + "loss": 1.4779, + "step": 36466 + }, + { + "epoch": 2.87, + "learning_rate": 1.4009889471659874e-06, + "loss": 1.4325, + "step": 36467 + }, + { + "epoch": 2.87, + "learning_rate": 1.3993041455881538e-06, + "loss": 1.4678, + "step": 36468 + }, + { + "epoch": 2.87, + "learning_rate": 1.3976203529270535e-06, + "loss": 1.4454, + "step": 36469 + }, + { + "epoch": 2.87, + "learning_rate": 1.395937569194111e-06, + "loss": 1.4275, + "step": 36470 + }, + { + "epoch": 2.87, + "learning_rate": 1.3942557944007504e-06, + "loss": 1.4899, + "step": 36471 + }, + { + "epoch": 2.87, + "learning_rate": 1.3925750285583625e-06, + "loss": 1.378, + "step": 36472 + }, + { + "epoch": 2.87, + "learning_rate": 1.390895271678405e-06, + "loss": 1.431, + "step": 36473 + }, + { + "epoch": 2.87, + "learning_rate": 1.3892165237722519e-06, + "loss": 1.4228, + "step": 36474 + }, + { + "epoch": 2.87, + "learning_rate": 1.3875387848512943e-06, + "loss": 1.4907, + "step": 36475 + }, + { + "epoch": 2.87, + "learning_rate": 1.3858620549269562e-06, + "loss": 1.4481, + "step": 36476 + }, + { + "epoch": 2.87, + "learning_rate": 1.3841863340105951e-06, + "loss": 1.4131, + "step": 36477 + }, + { + "epoch": 2.87, + "learning_rate": 1.3825116221136023e-06, + "loss": 1.5033, + "step": 36478 + }, + { + "epoch": 2.87, + "learning_rate": 1.3808379192473184e-06, + "loss": 1.4476, + "step": 36479 + }, + { + "epoch": 2.87, + "learning_rate": 1.3791652254231512e-06, + "loss": 1.4202, + "step": 36480 + }, + { + "epoch": 2.87, + "learning_rate": 1.3774935406524411e-06, + "loss": 1.4443, + "step": 36481 + }, + { + "epoch": 2.87, + "learning_rate": 1.3758228649465131e-06, + "loss": 1.4166, + "step": 36482 + }, + { + "epoch": 2.87, + "learning_rate": 1.374153198316741e-06, + "loss": 1.5018, + "step": 36483 + }, + { + "epoch": 2.87, + "learning_rate": 1.3724845407744488e-06, + "loss": 1.4402, + "step": 36484 + }, + { + "epoch": 2.87, + "learning_rate": 1.370816892330978e-06, + "loss": 1.424, + "step": 36485 + }, + { + "epoch": 2.87, + "learning_rate": 1.3691502529976194e-06, + "loss": 1.4568, + "step": 36486 + }, + { + "epoch": 2.87, + "learning_rate": 1.3674846227857138e-06, + "loss": 1.4576, + "step": 36487 + }, + { + "epoch": 2.87, + "learning_rate": 1.3658200017065857e-06, + "loss": 1.4719, + "step": 36488 + }, + { + "epoch": 2.87, + "learning_rate": 1.3641563897714925e-06, + "loss": 1.4155, + "step": 36489 + }, + { + "epoch": 2.87, + "learning_rate": 1.3624937869917752e-06, + "loss": 1.4525, + "step": 36490 + }, + { + "epoch": 2.87, + "learning_rate": 1.3608321933786914e-06, + "loss": 1.4168, + "step": 36491 + }, + { + "epoch": 2.87, + "learning_rate": 1.3591716089435157e-06, + "loss": 1.423, + "step": 36492 + }, + { + "epoch": 2.87, + "learning_rate": 1.3575120336975554e-06, + "loss": 1.5003, + "step": 36493 + }, + { + "epoch": 2.87, + "learning_rate": 1.3558534676520683e-06, + "loss": 1.4285, + "step": 36494 + }, + { + "epoch": 2.87, + "learning_rate": 1.3541959108182788e-06, + "loss": 1.4302, + "step": 36495 + }, + { + "epoch": 2.87, + "learning_rate": 1.3525393632074944e-06, + "loss": 1.4639, + "step": 36496 + }, + { + "epoch": 2.87, + "learning_rate": 1.3508838248309228e-06, + "loss": 1.4402, + "step": 36497 + }, + { + "epoch": 2.87, + "learning_rate": 1.3492292956998385e-06, + "loss": 1.3622, + "step": 36498 + }, + { + "epoch": 2.87, + "learning_rate": 1.3475757758254325e-06, + "loss": 1.4587, + "step": 36499 + }, + { + "epoch": 2.87, + "learning_rate": 1.3459232652189622e-06, + "loss": 1.411, + "step": 36500 + }, + { + "epoch": 2.87, + "learning_rate": 1.3442717638916355e-06, + "loss": 1.4611, + "step": 36501 + }, + { + "epoch": 2.87, + "learning_rate": 1.342621271854677e-06, + "loss": 1.4305, + "step": 36502 + }, + { + "epoch": 2.87, + "learning_rate": 1.3409717891192773e-06, + "loss": 1.3999, + "step": 36503 + }, + { + "epoch": 2.87, + "learning_rate": 1.3393233156966444e-06, + "loss": 1.4591, + "step": 36504 + }, + { + "epoch": 2.87, + "learning_rate": 1.3376758515979691e-06, + "loss": 1.4597, + "step": 36505 + }, + { + "epoch": 2.87, + "learning_rate": 1.336029396834426e-06, + "loss": 1.4325, + "step": 36506 + }, + { + "epoch": 2.87, + "learning_rate": 1.3343839514172228e-06, + "loss": 1.4522, + "step": 36507 + }, + { + "epoch": 2.87, + "learning_rate": 1.3327395153575005e-06, + "loss": 1.4381, + "step": 36508 + }, + { + "epoch": 2.87, + "learning_rate": 1.3310960886664335e-06, + "loss": 1.4327, + "step": 36509 + }, + { + "epoch": 2.87, + "learning_rate": 1.3294536713551962e-06, + "loss": 1.4612, + "step": 36510 + }, + { + "epoch": 2.87, + "learning_rate": 1.327812263434913e-06, + "loss": 1.4769, + "step": 36511 + }, + { + "epoch": 2.87, + "learning_rate": 1.326171864916742e-06, + "loss": 1.4654, + "step": 36512 + }, + { + "epoch": 2.87, + "learning_rate": 1.3245324758118236e-06, + "loss": 1.4161, + "step": 36513 + }, + { + "epoch": 2.87, + "learning_rate": 1.3228940961312827e-06, + "loss": 1.4068, + "step": 36514 + }, + { + "epoch": 2.87, + "learning_rate": 1.3212567258862438e-06, + "loss": 1.488, + "step": 36515 + }, + { + "epoch": 2.87, + "learning_rate": 1.3196203650878146e-06, + "loss": 1.4424, + "step": 36516 + }, + { + "epoch": 2.87, + "learning_rate": 1.3179850137471193e-06, + "loss": 1.4277, + "step": 36517 + }, + { + "epoch": 2.87, + "learning_rate": 1.3163506718752492e-06, + "loss": 1.4345, + "step": 36518 + }, + { + "epoch": 2.87, + "learning_rate": 1.3147173394833288e-06, + "loss": 1.4366, + "step": 36519 + }, + { + "epoch": 2.87, + "learning_rate": 1.3130850165823991e-06, + "loss": 1.4001, + "step": 36520 + }, + { + "epoch": 2.87, + "learning_rate": 1.3114537031836015e-06, + "loss": 1.4681, + "step": 36521 + }, + { + "epoch": 2.87, + "learning_rate": 1.3098233992979602e-06, + "loss": 1.4829, + "step": 36522 + }, + { + "epoch": 2.87, + "learning_rate": 1.3081941049365663e-06, + "loss": 1.4249, + "step": 36523 + }, + { + "epoch": 2.87, + "learning_rate": 1.3065658201104779e-06, + "loss": 1.4428, + "step": 36524 + }, + { + "epoch": 2.87, + "learning_rate": 1.3049385448307526e-06, + "loss": 1.4442, + "step": 36525 + }, + { + "epoch": 2.87, + "learning_rate": 1.3033122791084317e-06, + "loss": 1.5126, + "step": 36526 + }, + { + "epoch": 2.87, + "learning_rate": 1.3016870229545728e-06, + "loss": 1.4425, + "step": 36527 + }, + { + "epoch": 2.87, + "learning_rate": 1.3000627763802173e-06, + "loss": 1.4276, + "step": 36528 + }, + { + "epoch": 2.87, + "learning_rate": 1.2984395393963397e-06, + "loss": 1.4558, + "step": 36529 + }, + { + "epoch": 2.87, + "learning_rate": 1.2968173120140147e-06, + "loss": 1.4693, + "step": 36530 + }, + { + "epoch": 2.87, + "learning_rate": 1.2951960942442497e-06, + "loss": 1.4569, + "step": 36531 + }, + { + "epoch": 2.87, + "learning_rate": 1.2935758860980195e-06, + "loss": 1.4216, + "step": 36532 + }, + { + "epoch": 2.87, + "learning_rate": 1.2919566875863486e-06, + "loss": 1.4793, + "step": 36533 + }, + { + "epoch": 2.87, + "learning_rate": 1.2903384987202447e-06, + "loss": 1.3861, + "step": 36534 + }, + { + "epoch": 2.87, + "learning_rate": 1.2887213195106827e-06, + "loss": 1.464, + "step": 36535 + }, + { + "epoch": 2.87, + "learning_rate": 1.2871051499686036e-06, + "loss": 1.4309, + "step": 36536 + }, + { + "epoch": 2.87, + "learning_rate": 1.2854899901050485e-06, + "loss": 1.4537, + "step": 36537 + }, + { + "epoch": 2.87, + "learning_rate": 1.2838758399309257e-06, + "loss": 1.4238, + "step": 36538 + }, + { + "epoch": 2.87, + "learning_rate": 1.2822626994572427e-06, + "loss": 1.4128, + "step": 36539 + }, + { + "epoch": 2.88, + "learning_rate": 1.2806505686949076e-06, + "loss": 1.4385, + "step": 36540 + }, + { + "epoch": 2.88, + "learning_rate": 1.2790394476548782e-06, + "loss": 1.4462, + "step": 36541 + }, + { + "epoch": 2.88, + "learning_rate": 1.2774293363481125e-06, + "loss": 1.5027, + "step": 36542 + }, + { + "epoch": 2.88, + "learning_rate": 1.275820234785535e-06, + "loss": 1.4297, + "step": 36543 + }, + { + "epoch": 2.88, + "learning_rate": 1.274212142978054e-06, + "loss": 1.4697, + "step": 36544 + }, + { + "epoch": 2.88, + "learning_rate": 1.2726050609366101e-06, + "loss": 1.4746, + "step": 36545 + }, + { + "epoch": 2.88, + "learning_rate": 1.2709989886720784e-06, + "loss": 1.4367, + "step": 36546 + }, + { + "epoch": 2.88, + "learning_rate": 1.2693939261954167e-06, + "loss": 1.4092, + "step": 36547 + }, + { + "epoch": 2.88, + "learning_rate": 1.2677898735174664e-06, + "loss": 1.415, + "step": 36548 + }, + { + "epoch": 2.88, + "learning_rate": 1.2661868306491685e-06, + "loss": 1.4516, + "step": 36549 + }, + { + "epoch": 2.88, + "learning_rate": 1.2645847976013813e-06, + "loss": 1.415, + "step": 36550 + }, + { + "epoch": 2.88, + "learning_rate": 1.262983774384979e-06, + "loss": 1.3904, + "step": 36551 + }, + { + "epoch": 2.88, + "learning_rate": 1.261383761010837e-06, + "loss": 1.4682, + "step": 36552 + }, + { + "epoch": 2.88, + "learning_rate": 1.2597847574898123e-06, + "loss": 1.4747, + "step": 36553 + }, + { + "epoch": 2.88, + "learning_rate": 1.2581867638327804e-06, + "loss": 1.442, + "step": 36554 + }, + { + "epoch": 2.88, + "learning_rate": 1.256589780050582e-06, + "loss": 1.4414, + "step": 36555 + }, + { + "epoch": 2.88, + "learning_rate": 1.254993806154042e-06, + "loss": 1.4537, + "step": 36556 + }, + { + "epoch": 2.88, + "learning_rate": 1.253398842154002e-06, + "loss": 1.4154, + "step": 36557 + }, + { + "epoch": 2.88, + "learning_rate": 1.2518048880613196e-06, + "loss": 1.4058, + "step": 36558 + }, + { + "epoch": 2.88, + "learning_rate": 1.2502119438867865e-06, + "loss": 1.4026, + "step": 36559 + }, + { + "epoch": 2.88, + "learning_rate": 1.2486200096412269e-06, + "loss": 1.4336, + "step": 36560 + }, + { + "epoch": 2.88, + "learning_rate": 1.2470290853354492e-06, + "loss": 1.4583, + "step": 36561 + }, + { + "epoch": 2.88, + "learning_rate": 1.2454391709802615e-06, + "loss": 1.4053, + "step": 36562 + }, + { + "epoch": 2.88, + "learning_rate": 1.243850266586438e-06, + "loss": 1.4573, + "step": 36563 + }, + { + "epoch": 2.88, + "learning_rate": 1.2422623721647873e-06, + "loss": 1.4514, + "step": 36564 + }, + { + "epoch": 2.88, + "learning_rate": 1.2406754877260838e-06, + "loss": 1.4112, + "step": 36565 + }, + { + "epoch": 2.88, + "learning_rate": 1.239089613281119e-06, + "loss": 1.4238, + "step": 36566 + }, + { + "epoch": 2.88, + "learning_rate": 1.2375047488406176e-06, + "loss": 1.4175, + "step": 36567 + }, + { + "epoch": 2.88, + "learning_rate": 1.2359208944153709e-06, + "loss": 1.4508, + "step": 36568 + }, + { + "epoch": 2.88, + "learning_rate": 1.234338050016137e-06, + "loss": 1.4457, + "step": 36569 + }, + { + "epoch": 2.88, + "learning_rate": 1.2327562156536409e-06, + "loss": 1.4846, + "step": 36570 + }, + { + "epoch": 2.88, + "learning_rate": 1.2311753913386401e-06, + "loss": 1.4281, + "step": 36571 + }, + { + "epoch": 2.88, + "learning_rate": 1.22959557708186e-06, + "loss": 1.4397, + "step": 36572 + }, + { + "epoch": 2.88, + "learning_rate": 1.2280167728940416e-06, + "loss": 1.4979, + "step": 36573 + }, + { + "epoch": 2.88, + "learning_rate": 1.2264389787858598e-06, + "loss": 1.4454, + "step": 36574 + }, + { + "epoch": 2.88, + "learning_rate": 1.2248621947680725e-06, + "loss": 1.482, + "step": 36575 + }, + { + "epoch": 2.88, + "learning_rate": 1.2232864208513715e-06, + "loss": 1.4611, + "step": 36576 + }, + { + "epoch": 2.88, + "learning_rate": 1.221711657046448e-06, + "loss": 1.5196, + "step": 36577 + }, + { + "epoch": 2.88, + "learning_rate": 1.2201379033640102e-06, + "loss": 1.4448, + "step": 36578 + }, + { + "epoch": 2.88, + "learning_rate": 1.2185651598147328e-06, + "loss": 1.4151, + "step": 36579 + }, + { + "epoch": 2.88, + "learning_rate": 1.2169934264092906e-06, + "loss": 1.4508, + "step": 36580 + }, + { + "epoch": 2.88, + "learning_rate": 1.215422703158342e-06, + "loss": 1.3989, + "step": 36581 + }, + { + "epoch": 2.88, + "learning_rate": 1.2138529900725779e-06, + "loss": 1.4368, + "step": 36582 + }, + { + "epoch": 2.88, + "learning_rate": 1.212284287162657e-06, + "loss": 1.4275, + "step": 36583 + }, + { + "epoch": 2.88, + "learning_rate": 1.210716594439204e-06, + "loss": 1.4138, + "step": 36584 + }, + { + "epoch": 2.88, + "learning_rate": 1.2091499119128767e-06, + "loss": 1.4497, + "step": 36585 + }, + { + "epoch": 2.88, + "learning_rate": 1.2075842395943168e-06, + "loss": 1.4197, + "step": 36586 + }, + { + "epoch": 2.88, + "learning_rate": 1.2060195774941494e-06, + "loss": 1.4663, + "step": 36587 + }, + { + "epoch": 2.88, + "learning_rate": 1.204455925622999e-06, + "loss": 1.4412, + "step": 36588 + }, + { + "epoch": 2.88, + "learning_rate": 1.202893283991474e-06, + "loss": 1.4147, + "step": 36589 + }, + { + "epoch": 2.88, + "learning_rate": 1.201331652610199e-06, + "loss": 1.38, + "step": 36590 + }, + { + "epoch": 2.88, + "learning_rate": 1.1997710314897657e-06, + "loss": 1.4096, + "step": 36591 + }, + { + "epoch": 2.88, + "learning_rate": 1.1982114206407823e-06, + "loss": 1.4167, + "step": 36592 + }, + { + "epoch": 2.88, + "learning_rate": 1.1966528200738067e-06, + "loss": 1.4138, + "step": 36593 + }, + { + "epoch": 2.88, + "learning_rate": 1.1950952297994476e-06, + "loss": 1.4196, + "step": 36594 + }, + { + "epoch": 2.88, + "learning_rate": 1.1935386498282794e-06, + "loss": 1.4381, + "step": 36595 + }, + { + "epoch": 2.88, + "learning_rate": 1.1919830801708607e-06, + "loss": 1.4401, + "step": 36596 + }, + { + "epoch": 2.88, + "learning_rate": 1.1904285208377662e-06, + "loss": 1.4233, + "step": 36597 + }, + { + "epoch": 2.88, + "learning_rate": 1.1888749718395375e-06, + "loss": 1.4679, + "step": 36598 + }, + { + "epoch": 2.88, + "learning_rate": 1.1873224331867327e-06, + "loss": 1.3882, + "step": 36599 + }, + { + "epoch": 2.88, + "learning_rate": 1.1857709048898768e-06, + "loss": 1.4781, + "step": 36600 + }, + { + "epoch": 2.88, + "learning_rate": 1.1842203869595114e-06, + "loss": 1.4177, + "step": 36601 + }, + { + "epoch": 2.88, + "learning_rate": 1.182670879406178e-06, + "loss": 1.4748, + "step": 36602 + }, + { + "epoch": 2.88, + "learning_rate": 1.1811223822403849e-06, + "loss": 1.4257, + "step": 36603 + }, + { + "epoch": 2.88, + "learning_rate": 1.1795748954726404e-06, + "loss": 1.4191, + "step": 36604 + }, + { + "epoch": 2.88, + "learning_rate": 1.1780284191134525e-06, + "loss": 1.4672, + "step": 36605 + }, + { + "epoch": 2.88, + "learning_rate": 1.1764829531733465e-06, + "loss": 1.4876, + "step": 36606 + }, + { + "epoch": 2.88, + "learning_rate": 1.174938497662764e-06, + "loss": 1.4132, + "step": 36607 + }, + { + "epoch": 2.88, + "learning_rate": 1.1733950525922297e-06, + "loss": 1.4898, + "step": 36608 + }, + { + "epoch": 2.88, + "learning_rate": 1.1718526179722353e-06, + "loss": 1.4402, + "step": 36609 + }, + { + "epoch": 2.88, + "learning_rate": 1.170311193813206e-06, + "loss": 1.397, + "step": 36610 + }, + { + "epoch": 2.88, + "learning_rate": 1.168770780125633e-06, + "loss": 1.4317, + "step": 36611 + }, + { + "epoch": 2.88, + "learning_rate": 1.1672313769199914e-06, + "loss": 1.4652, + "step": 36612 + }, + { + "epoch": 2.88, + "learning_rate": 1.1656929842067064e-06, + "loss": 1.4422, + "step": 36613 + }, + { + "epoch": 2.88, + "learning_rate": 1.164155601996236e-06, + "loss": 1.4581, + "step": 36614 + }, + { + "epoch": 2.88, + "learning_rate": 1.1626192302990056e-06, + "loss": 1.4156, + "step": 36615 + }, + { + "epoch": 2.88, + "learning_rate": 1.1610838691254564e-06, + "loss": 1.3751, + "step": 36616 + }, + { + "epoch": 2.88, + "learning_rate": 1.1595495184860304e-06, + "loss": 1.451, + "step": 36617 + }, + { + "epoch": 2.88, + "learning_rate": 1.1580161783911024e-06, + "loss": 1.4441, + "step": 36618 + }, + { + "epoch": 2.88, + "learning_rate": 1.156483848851114e-06, + "loss": 1.4606, + "step": 36619 + }, + { + "epoch": 2.88, + "learning_rate": 1.154952529876474e-06, + "loss": 1.4659, + "step": 36620 + }, + { + "epoch": 2.88, + "learning_rate": 1.1534222214775568e-06, + "loss": 1.4198, + "step": 36621 + }, + { + "epoch": 2.88, + "learning_rate": 1.1518929236647544e-06, + "loss": 1.4322, + "step": 36622 + }, + { + "epoch": 2.88, + "learning_rate": 1.1503646364484752e-06, + "loss": 1.4173, + "step": 36623 + }, + { + "epoch": 2.88, + "learning_rate": 1.148837359839061e-06, + "loss": 1.4833, + "step": 36624 + }, + { + "epoch": 2.88, + "learning_rate": 1.1473110938469033e-06, + "loss": 1.4982, + "step": 36625 + }, + { + "epoch": 2.88, + "learning_rate": 1.145785838482377e-06, + "loss": 1.4901, + "step": 36626 + }, + { + "epoch": 2.88, + "learning_rate": 1.1442615937557909e-06, + "loss": 1.4147, + "step": 36627 + }, + { + "epoch": 2.88, + "learning_rate": 1.1427383596775364e-06, + "loss": 1.4073, + "step": 36628 + }, + { + "epoch": 2.88, + "learning_rate": 1.1412161362579553e-06, + "loss": 1.4571, + "step": 36629 + }, + { + "epoch": 2.88, + "learning_rate": 1.139694923507356e-06, + "loss": 1.4776, + "step": 36630 + }, + { + "epoch": 2.88, + "learning_rate": 1.1381747214360804e-06, + "loss": 1.4478, + "step": 36631 + }, + { + "epoch": 2.88, + "learning_rate": 1.1366555300544533e-06, + "loss": 1.4468, + "step": 36632 + }, + { + "epoch": 2.88, + "learning_rate": 1.1351373493727832e-06, + "loss": 1.4383, + "step": 36633 + }, + { + "epoch": 2.88, + "learning_rate": 1.133620179401379e-06, + "loss": 1.426, + "step": 36634 + }, + { + "epoch": 2.88, + "learning_rate": 1.1321040201505481e-06, + "loss": 1.4182, + "step": 36635 + }, + { + "epoch": 2.88, + "learning_rate": 1.1305888716305667e-06, + "loss": 1.45, + "step": 36636 + }, + { + "epoch": 2.88, + "learning_rate": 1.1290747338517592e-06, + "loss": 1.4293, + "step": 36637 + }, + { + "epoch": 2.88, + "learning_rate": 1.127561606824351e-06, + "loss": 1.463, + "step": 36638 + }, + { + "epoch": 2.88, + "learning_rate": 1.126049490558667e-06, + "loss": 1.4318, + "step": 36639 + }, + { + "epoch": 2.88, + "learning_rate": 1.1245383850649325e-06, + "loss": 1.4306, + "step": 36640 + }, + { + "epoch": 2.88, + "learning_rate": 1.1230282903534393e-06, + "loss": 1.4695, + "step": 36641 + }, + { + "epoch": 2.88, + "learning_rate": 1.1215192064344125e-06, + "loss": 1.4935, + "step": 36642 + }, + { + "epoch": 2.88, + "learning_rate": 1.1200111333181273e-06, + "loss": 1.4824, + "step": 36643 + }, + { + "epoch": 2.88, + "learning_rate": 1.1185040710148085e-06, + "loss": 1.4059, + "step": 36644 + }, + { + "epoch": 2.88, + "learning_rate": 1.1169980195346817e-06, + "loss": 1.4584, + "step": 36645 + }, + { + "epoch": 2.88, + "learning_rate": 1.1154929788879718e-06, + "loss": 1.4565, + "step": 36646 + }, + { + "epoch": 2.88, + "learning_rate": 1.1139889490849209e-06, + "loss": 1.4142, + "step": 36647 + }, + { + "epoch": 2.88, + "learning_rate": 1.1124859301357037e-06, + "loss": 1.4342, + "step": 36648 + }, + { + "epoch": 2.88, + "learning_rate": 1.1109839220505623e-06, + "loss": 1.4585, + "step": 36649 + }, + { + "epoch": 2.88, + "learning_rate": 1.109482924839672e-06, + "loss": 1.4308, + "step": 36650 + }, + { + "epoch": 2.88, + "learning_rate": 1.1079829385132244e-06, + "loss": 1.4774, + "step": 36651 + }, + { + "epoch": 2.88, + "learning_rate": 1.1064839630813949e-06, + "loss": 1.4729, + "step": 36652 + }, + { + "epoch": 2.88, + "learning_rate": 1.1049859985543918e-06, + "loss": 1.4593, + "step": 36653 + }, + { + "epoch": 2.88, + "learning_rate": 1.1034890449423572e-06, + "loss": 1.3945, + "step": 36654 + }, + { + "epoch": 2.88, + "learning_rate": 1.1019931022554662e-06, + "loss": 1.3559, + "step": 36655 + }, + { + "epoch": 2.88, + "learning_rate": 1.1004981705038773e-06, + "loss": 1.4884, + "step": 36656 + }, + { + "epoch": 2.88, + "learning_rate": 1.0990042496977324e-06, + "loss": 1.444, + "step": 36657 + }, + { + "epoch": 2.88, + "learning_rate": 1.0975113398471736e-06, + "loss": 1.4596, + "step": 36658 + }, + { + "epoch": 2.88, + "learning_rate": 1.0960194409623257e-06, + "loss": 1.4266, + "step": 36659 + }, + { + "epoch": 2.88, + "learning_rate": 1.0945285530533643e-06, + "loss": 1.4565, + "step": 36660 + }, + { + "epoch": 2.88, + "learning_rate": 1.093038676130381e-06, + "loss": 1.4324, + "step": 36661 + }, + { + "epoch": 2.88, + "learning_rate": 1.091549810203468e-06, + "loss": 1.4009, + "step": 36662 + }, + { + "epoch": 2.88, + "learning_rate": 1.0900619552827672e-06, + "loss": 1.4349, + "step": 36663 + }, + { + "epoch": 2.88, + "learning_rate": 1.0885751113783868e-06, + "loss": 1.4464, + "step": 36664 + }, + { + "epoch": 2.88, + "learning_rate": 1.087089278500386e-06, + "loss": 1.4086, + "step": 36665 + }, + { + "epoch": 2.88, + "learning_rate": 1.085604456658873e-06, + "loss": 1.4903, + "step": 36666 + }, + { + "epoch": 2.89, + "learning_rate": 1.0841206458639395e-06, + "loss": 1.4455, + "step": 36667 + }, + { + "epoch": 2.89, + "learning_rate": 1.0826378461256447e-06, + "loss": 1.3962, + "step": 36668 + }, + { + "epoch": 2.89, + "learning_rate": 1.0811560574540468e-06, + "loss": 1.4642, + "step": 36669 + }, + { + "epoch": 2.89, + "learning_rate": 1.0796752798592379e-06, + "loss": 1.4282, + "step": 36670 + }, + { + "epoch": 2.89, + "learning_rate": 1.0781955133512432e-06, + "loss": 1.414, + "step": 36671 + }, + { + "epoch": 2.89, + "learning_rate": 1.0767167579401216e-06, + "loss": 1.4488, + "step": 36672 + }, + { + "epoch": 2.89, + "learning_rate": 1.0752390136359145e-06, + "loss": 1.488, + "step": 36673 + }, + { + "epoch": 2.89, + "learning_rate": 1.0737622804486312e-06, + "loss": 1.4373, + "step": 36674 + }, + { + "epoch": 2.89, + "learning_rate": 1.07228655838833e-06, + "loss": 1.4037, + "step": 36675 + }, + { + "epoch": 2.89, + "learning_rate": 1.0708118474650197e-06, + "loss": 1.4188, + "step": 36676 + }, + { + "epoch": 2.89, + "learning_rate": 1.0693381476887086e-06, + "loss": 1.4803, + "step": 36677 + }, + { + "epoch": 2.89, + "learning_rate": 1.0678654590694225e-06, + "loss": 1.4286, + "step": 36678 + }, + { + "epoch": 2.89, + "learning_rate": 1.0663937816171197e-06, + "loss": 1.4687, + "step": 36679 + }, + { + "epoch": 2.89, + "learning_rate": 1.064923115341826e-06, + "loss": 1.4522, + "step": 36680 + }, + { + "epoch": 2.89, + "learning_rate": 1.0634534602535161e-06, + "loss": 1.45, + "step": 36681 + }, + { + "epoch": 2.89, + "learning_rate": 1.061984816362149e-06, + "loss": 1.4348, + "step": 36682 + }, + { + "epoch": 2.89, + "learning_rate": 1.0605171836777337e-06, + "loss": 1.4528, + "step": 36683 + }, + { + "epoch": 2.89, + "learning_rate": 1.059050562210212e-06, + "loss": 1.3836, + "step": 36684 + }, + { + "epoch": 2.89, + "learning_rate": 1.0575849519695423e-06, + "loss": 1.4761, + "step": 36685 + }, + { + "epoch": 2.89, + "learning_rate": 1.056120352965667e-06, + "loss": 1.4299, + "step": 36686 + }, + { + "epoch": 2.89, + "learning_rate": 1.0546567652085613e-06, + "loss": 1.373, + "step": 36687 + }, + { + "epoch": 2.89, + "learning_rate": 1.0531941887081342e-06, + "loss": 1.465, + "step": 36688 + }, + { + "epoch": 2.89, + "learning_rate": 1.0517326234743106e-06, + "loss": 1.4236, + "step": 36689 + }, + { + "epoch": 2.89, + "learning_rate": 1.050272069517033e-06, + "loss": 1.4431, + "step": 36690 + }, + { + "epoch": 2.89, + "learning_rate": 1.04881252684621e-06, + "loss": 1.4493, + "step": 36691 + }, + { + "epoch": 2.89, + "learning_rate": 1.0473539954717669e-06, + "loss": 1.4171, + "step": 36692 + }, + { + "epoch": 2.89, + "learning_rate": 1.0458964754035625e-06, + "loss": 1.5293, + "step": 36693 + }, + { + "epoch": 2.89, + "learning_rate": 1.044439966651539e-06, + "loss": 1.4191, + "step": 36694 + }, + { + "epoch": 2.89, + "learning_rate": 1.0429844692255718e-06, + "loss": 1.3975, + "step": 36695 + }, + { + "epoch": 2.89, + "learning_rate": 1.0415299831355362e-06, + "loss": 1.4383, + "step": 36696 + }, + { + "epoch": 2.89, + "learning_rate": 1.0400765083913075e-06, + "loss": 1.5011, + "step": 36697 + }, + { + "epoch": 2.89, + "learning_rate": 1.0386240450027617e-06, + "loss": 1.4612, + "step": 36698 + }, + { + "epoch": 2.89, + "learning_rate": 1.0371725929797402e-06, + "loss": 1.4919, + "step": 36699 + }, + { + "epoch": 2.89, + "learning_rate": 1.035722152332119e-06, + "loss": 1.4415, + "step": 36700 + }, + { + "epoch": 2.89, + "learning_rate": 1.03427272306974e-06, + "loss": 1.4066, + "step": 36701 + }, + { + "epoch": 2.89, + "learning_rate": 1.0328243052024454e-06, + "loss": 1.4009, + "step": 36702 + }, + { + "epoch": 2.89, + "learning_rate": 1.0313768987400606e-06, + "loss": 1.4629, + "step": 36703 + }, + { + "epoch": 2.89, + "learning_rate": 1.0299305036924277e-06, + "loss": 1.4597, + "step": 36704 + }, + { + "epoch": 2.89, + "learning_rate": 1.0284851200693555e-06, + "loss": 1.4309, + "step": 36705 + }, + { + "epoch": 2.89, + "learning_rate": 1.0270407478806531e-06, + "loss": 1.5032, + "step": 36706 + }, + { + "epoch": 2.89, + "learning_rate": 1.0255973871361456e-06, + "loss": 1.4995, + "step": 36707 + }, + { + "epoch": 2.89, + "learning_rate": 1.0241550378456088e-06, + "loss": 1.471, + "step": 36708 + }, + { + "epoch": 2.89, + "learning_rate": 1.022713700018868e-06, + "loss": 1.4373, + "step": 36709 + }, + { + "epoch": 2.89, + "learning_rate": 1.0212733736656653e-06, + "loss": 1.4792, + "step": 36710 + }, + { + "epoch": 2.89, + "learning_rate": 1.0198340587958097e-06, + "loss": 1.4583, + "step": 36711 + }, + { + "epoch": 2.89, + "learning_rate": 1.018395755419077e-06, + "loss": 1.4329, + "step": 36712 + }, + { + "epoch": 2.89, + "learning_rate": 1.0169584635452088e-06, + "loss": 1.424, + "step": 36713 + }, + { + "epoch": 2.89, + "learning_rate": 1.0155221831839977e-06, + "loss": 1.4166, + "step": 36714 + }, + { + "epoch": 2.89, + "learning_rate": 1.0140869143451525e-06, + "loss": 1.457, + "step": 36715 + }, + { + "epoch": 2.89, + "learning_rate": 1.0126526570384485e-06, + "loss": 1.4592, + "step": 36716 + }, + { + "epoch": 2.89, + "learning_rate": 1.0112194112736117e-06, + "loss": 1.4987, + "step": 36717 + }, + { + "epoch": 2.89, + "learning_rate": 1.0097871770603837e-06, + "loss": 1.4565, + "step": 36718 + }, + { + "epoch": 2.89, + "learning_rate": 1.008355954408474e-06, + "loss": 1.4349, + "step": 36719 + }, + { + "epoch": 2.89, + "learning_rate": 1.006925743327608e-06, + "loss": 1.4715, + "step": 36720 + }, + { + "epoch": 2.89, + "learning_rate": 1.0054965438274942e-06, + "loss": 1.4715, + "step": 36721 + }, + { + "epoch": 2.89, + "learning_rate": 1.0040683559178419e-06, + "loss": 1.4779, + "step": 36722 + }, + { + "epoch": 2.89, + "learning_rate": 1.0026411796083267e-06, + "loss": 1.3755, + "step": 36723 + }, + { + "epoch": 2.89, + "learning_rate": 1.001215014908674e-06, + "loss": 1.4465, + "step": 36724 + }, + { + "epoch": 2.89, + "learning_rate": 9.997898618285428e-07, + "loss": 1.4279, + "step": 36725 + }, + { + "epoch": 2.89, + "learning_rate": 9.983657203776086e-07, + "loss": 1.4483, + "step": 36726 + }, + { + "epoch": 2.89, + "learning_rate": 9.96942590565547e-07, + "loss": 1.4329, + "step": 36727 + }, + { + "epoch": 2.89, + "learning_rate": 9.955204724020338e-07, + "loss": 1.448, + "step": 36728 + }, + { + "epoch": 2.89, + "learning_rate": 9.940993658966946e-07, + "loss": 1.4756, + "step": 36729 + }, + { + "epoch": 2.89, + "learning_rate": 9.92679271059188e-07, + "loss": 1.4544, + "step": 36730 + }, + { + "epoch": 2.89, + "learning_rate": 9.912601878991566e-07, + "loss": 1.4018, + "step": 36731 + }, + { + "epoch": 2.89, + "learning_rate": 9.898421164262593e-07, + "loss": 1.4392, + "step": 36732 + }, + { + "epoch": 2.89, + "learning_rate": 9.884250566500717e-07, + "loss": 1.4442, + "step": 36733 + }, + { + "epoch": 2.89, + "learning_rate": 9.870090085802696e-07, + "loss": 1.4486, + "step": 36734 + }, + { + "epoch": 2.89, + "learning_rate": 9.85593972226445e-07, + "loss": 1.4303, + "step": 36735 + }, + { + "epoch": 2.89, + "learning_rate": 9.841799475981904e-07, + "loss": 1.4295, + "step": 36736 + }, + { + "epoch": 2.89, + "learning_rate": 9.827669347051315e-07, + "loss": 1.4399, + "step": 36737 + }, + { + "epoch": 2.89, + "learning_rate": 9.813549335568438e-07, + "loss": 1.4358, + "step": 36738 + }, + { + "epoch": 2.89, + "learning_rate": 9.799439441629364e-07, + "loss": 1.4309, + "step": 36739 + }, + { + "epoch": 2.89, + "learning_rate": 9.785339665329516e-07, + "loss": 1.4284, + "step": 36740 + }, + { + "epoch": 2.89, + "learning_rate": 9.771250006764985e-07, + "loss": 1.4651, + "step": 36741 + }, + { + "epoch": 2.89, + "learning_rate": 9.757170466031362e-07, + "loss": 1.4251, + "step": 36742 + }, + { + "epoch": 2.89, + "learning_rate": 9.743101043224067e-07, + "loss": 1.4815, + "step": 36743 + }, + { + "epoch": 2.89, + "learning_rate": 9.72904173843869e-07, + "loss": 1.462, + "step": 36744 + }, + { + "epoch": 2.89, + "learning_rate": 9.71499255177083e-07, + "loss": 1.4258, + "step": 36745 + }, + { + "epoch": 2.89, + "learning_rate": 9.700953483315565e-07, + "loss": 1.4804, + "step": 36746 + }, + { + "epoch": 2.89, + "learning_rate": 9.686924533168494e-07, + "loss": 1.4091, + "step": 36747 + }, + { + "epoch": 2.89, + "learning_rate": 9.672905701424872e-07, + "loss": 1.3791, + "step": 36748 + }, + { + "epoch": 2.89, + "learning_rate": 9.658896988179787e-07, + "loss": 1.4598, + "step": 36749 + }, + { + "epoch": 2.89, + "learning_rate": 9.644898393528334e-07, + "loss": 1.3885, + "step": 36750 + }, + { + "epoch": 2.89, + "learning_rate": 9.630909917565433e-07, + "loss": 1.4198, + "step": 36751 + }, + { + "epoch": 2.89, + "learning_rate": 9.616931560386342e-07, + "loss": 1.4385, + "step": 36752 + }, + { + "epoch": 2.89, + "learning_rate": 9.602963322085823e-07, + "loss": 1.4324, + "step": 36753 + }, + { + "epoch": 2.89, + "learning_rate": 9.589005202758626e-07, + "loss": 1.4083, + "step": 36754 + }, + { + "epoch": 2.89, + "learning_rate": 9.57505720249968e-07, + "loss": 1.4269, + "step": 36755 + }, + { + "epoch": 2.89, + "learning_rate": 9.561119321403577e-07, + "loss": 1.4055, + "step": 36756 + }, + { + "epoch": 2.89, + "learning_rate": 9.547191559565072e-07, + "loss": 1.4298, + "step": 36757 + }, + { + "epoch": 2.89, + "learning_rate": 9.533273917078587e-07, + "loss": 1.4286, + "step": 36758 + }, + { + "epoch": 2.89, + "learning_rate": 9.519366394038552e-07, + "loss": 1.4261, + "step": 36759 + }, + { + "epoch": 2.89, + "learning_rate": 9.505468990539555e-07, + "loss": 1.4461, + "step": 36760 + }, + { + "epoch": 2.89, + "learning_rate": 9.491581706676021e-07, + "loss": 1.4905, + "step": 36761 + }, + { + "epoch": 2.89, + "learning_rate": 9.477704542542041e-07, + "loss": 1.406, + "step": 36762 + }, + { + "epoch": 2.89, + "learning_rate": 9.463837498231875e-07, + "loss": 1.4494, + "step": 36763 + }, + { + "epoch": 2.89, + "learning_rate": 9.449980573839777e-07, + "loss": 1.3875, + "step": 36764 + }, + { + "epoch": 2.89, + "learning_rate": 9.436133769459675e-07, + "loss": 1.4798, + "step": 36765 + }, + { + "epoch": 2.89, + "learning_rate": 9.422297085185826e-07, + "loss": 1.4566, + "step": 36766 + }, + { + "epoch": 2.89, + "learning_rate": 9.408470521111821e-07, + "loss": 1.4719, + "step": 36767 + }, + { + "epoch": 2.89, + "learning_rate": 9.394654077331754e-07, + "loss": 1.4101, + "step": 36768 + }, + { + "epoch": 2.89, + "learning_rate": 9.38084775393938e-07, + "loss": 1.4155, + "step": 36769 + }, + { + "epoch": 2.89, + "learning_rate": 9.367051551028625e-07, + "loss": 1.4821, + "step": 36770 + }, + { + "epoch": 2.89, + "learning_rate": 9.35326546869275e-07, + "loss": 1.4473, + "step": 36771 + }, + { + "epoch": 2.89, + "learning_rate": 9.339489507025844e-07, + "loss": 1.3944, + "step": 36772 + }, + { + "epoch": 2.89, + "learning_rate": 9.325723666120999e-07, + "loss": 1.4771, + "step": 36773 + }, + { + "epoch": 2.89, + "learning_rate": 9.311967946071975e-07, + "loss": 1.4555, + "step": 36774 + }, + { + "epoch": 2.89, + "learning_rate": 9.298222346972028e-07, + "loss": 1.4744, + "step": 36775 + }, + { + "epoch": 2.89, + "learning_rate": 9.284486868914586e-07, + "loss": 1.4322, + "step": 36776 + }, + { + "epoch": 2.89, + "learning_rate": 9.270761511992741e-07, + "loss": 1.4206, + "step": 36777 + }, + { + "epoch": 2.89, + "learning_rate": 9.257046276299751e-07, + "loss": 1.4453, + "step": 36778 + }, + { + "epoch": 2.89, + "learning_rate": 9.243341161928875e-07, + "loss": 1.4159, + "step": 36779 + }, + { + "epoch": 2.89, + "learning_rate": 9.229646168972871e-07, + "loss": 1.4307, + "step": 36780 + }, + { + "epoch": 2.89, + "learning_rate": 9.215961297524999e-07, + "loss": 1.4268, + "step": 36781 + }, + { + "epoch": 2.89, + "learning_rate": 9.202286547678018e-07, + "loss": 1.4703, + "step": 36782 + }, + { + "epoch": 2.89, + "learning_rate": 9.188621919525019e-07, + "loss": 1.5082, + "step": 36783 + }, + { + "epoch": 2.89, + "learning_rate": 9.174967413158263e-07, + "loss": 1.4668, + "step": 36784 + }, + { + "epoch": 2.89, + "learning_rate": 9.161323028671008e-07, + "loss": 1.5056, + "step": 36785 + }, + { + "epoch": 2.89, + "learning_rate": 9.147688766155514e-07, + "loss": 1.4519, + "step": 36786 + }, + { + "epoch": 2.89, + "learning_rate": 9.134064625704707e-07, + "loss": 1.4866, + "step": 36787 + }, + { + "epoch": 2.89, + "learning_rate": 9.120450607410678e-07, + "loss": 1.48, + "step": 36788 + }, + { + "epoch": 2.89, + "learning_rate": 9.106846711366023e-07, + "loss": 1.4205, + "step": 36789 + }, + { + "epoch": 2.89, + "learning_rate": 9.093252937663331e-07, + "loss": 1.4374, + "step": 36790 + }, + { + "epoch": 2.89, + "learning_rate": 9.07966928639453e-07, + "loss": 1.4691, + "step": 36791 + }, + { + "epoch": 2.89, + "learning_rate": 9.066095757652047e-07, + "loss": 1.473, + "step": 36792 + }, + { + "epoch": 2.89, + "learning_rate": 9.052532351528141e-07, + "loss": 1.4161, + "step": 36793 + }, + { + "epoch": 2.89, + "learning_rate": 9.038979068114571e-07, + "loss": 1.4353, + "step": 36794 + }, + { + "epoch": 2.9, + "learning_rate": 9.025435907503598e-07, + "loss": 1.4545, + "step": 36795 + }, + { + "epoch": 2.9, + "learning_rate": 9.011902869787313e-07, + "loss": 1.4339, + "step": 36796 + }, + { + "epoch": 2.9, + "learning_rate": 8.998379955057145e-07, + "loss": 1.3829, + "step": 36797 + }, + { + "epoch": 2.9, + "learning_rate": 8.984867163405351e-07, + "loss": 1.4288, + "step": 36798 + }, + { + "epoch": 2.9, + "learning_rate": 8.971364494923361e-07, + "loss": 1.4383, + "step": 36799 + }, + { + "epoch": 2.9, + "learning_rate": 8.957871949703099e-07, + "loss": 1.4305, + "step": 36800 + }, + { + "epoch": 2.9, + "learning_rate": 8.94438952783616e-07, + "loss": 1.4174, + "step": 36801 + }, + { + "epoch": 2.9, + "learning_rate": 8.930917229413804e-07, + "loss": 1.4243, + "step": 36802 + }, + { + "epoch": 2.9, + "learning_rate": 8.917455054527789e-07, + "loss": 1.4925, + "step": 36803 + }, + { + "epoch": 2.9, + "learning_rate": 8.904003003269378e-07, + "loss": 1.4232, + "step": 36804 + }, + { + "epoch": 2.9, + "learning_rate": 8.89056107572983e-07, + "loss": 1.4419, + "step": 36805 + }, + { + "epoch": 2.9, + "learning_rate": 8.877129272000572e-07, + "loss": 1.4546, + "step": 36806 + }, + { + "epoch": 2.9, + "learning_rate": 8.863707592172864e-07, + "loss": 1.4317, + "step": 36807 + }, + { + "epoch": 2.9, + "learning_rate": 8.850296036337468e-07, + "loss": 1.4779, + "step": 36808 + }, + { + "epoch": 2.9, + "learning_rate": 8.836894604585809e-07, + "loss": 1.4406, + "step": 36809 + }, + { + "epoch": 2.9, + "learning_rate": 8.823503297008816e-07, + "loss": 1.4496, + "step": 36810 + }, + { + "epoch": 2.9, + "learning_rate": 8.810122113697249e-07, + "loss": 1.4371, + "step": 36811 + }, + { + "epoch": 2.9, + "learning_rate": 8.796751054742035e-07, + "loss": 1.4483, + "step": 36812 + }, + { + "epoch": 2.9, + "learning_rate": 8.783390120233935e-07, + "loss": 1.4917, + "step": 36813 + }, + { + "epoch": 2.9, + "learning_rate": 8.77003931026371e-07, + "loss": 1.4738, + "step": 36814 + }, + { + "epoch": 2.9, + "learning_rate": 8.756698624922121e-07, + "loss": 1.4496, + "step": 36815 + }, + { + "epoch": 2.9, + "learning_rate": 8.743368064299427e-07, + "loss": 1.4569, + "step": 36816 + }, + { + "epoch": 2.9, + "learning_rate": 8.730047628486558e-07, + "loss": 1.467, + "step": 36817 + }, + { + "epoch": 2.9, + "learning_rate": 8.716737317573441e-07, + "loss": 1.4317, + "step": 36818 + }, + { + "epoch": 2.9, + "learning_rate": 8.703437131650837e-07, + "loss": 1.4536, + "step": 36819 + }, + { + "epoch": 2.9, + "learning_rate": 8.690147070809006e-07, + "loss": 1.4503, + "step": 36820 + }, + { + "epoch": 2.9, + "learning_rate": 8.676867135138044e-07, + "loss": 1.4201, + "step": 36821 + }, + { + "epoch": 2.9, + "learning_rate": 8.663597324728211e-07, + "loss": 1.4595, + "step": 36822 + }, + { + "epoch": 2.9, + "learning_rate": 8.650337639669435e-07, + "loss": 1.4182, + "step": 36823 + }, + { + "epoch": 2.9, + "learning_rate": 8.637088080051979e-07, + "loss": 1.4295, + "step": 36824 + }, + { + "epoch": 2.9, + "learning_rate": 8.62384864596577e-07, + "loss": 1.4627, + "step": 36825 + }, + { + "epoch": 2.9, + "learning_rate": 8.610619337500401e-07, + "loss": 1.4787, + "step": 36826 + }, + { + "epoch": 2.9, + "learning_rate": 8.597400154746137e-07, + "loss": 1.4371, + "step": 36827 + }, + { + "epoch": 2.9, + "learning_rate": 8.584191097792403e-07, + "loss": 1.4336, + "step": 36828 + }, + { + "epoch": 2.9, + "learning_rate": 8.570992166728962e-07, + "loss": 1.4044, + "step": 36829 + }, + { + "epoch": 2.9, + "learning_rate": 8.55780336164541e-07, + "loss": 1.4833, + "step": 36830 + }, + { + "epoch": 2.9, + "learning_rate": 8.54462468263134e-07, + "loss": 1.4611, + "step": 36831 + }, + { + "epoch": 2.9, + "learning_rate": 8.531456129776182e-07, + "loss": 1.4883, + "step": 36832 + }, + { + "epoch": 2.9, + "learning_rate": 8.51829770316953e-07, + "loss": 1.4774, + "step": 36833 + }, + { + "epoch": 2.9, + "learning_rate": 8.505149402900479e-07, + "loss": 1.4102, + "step": 36834 + }, + { + "epoch": 2.9, + "learning_rate": 8.492011229058293e-07, + "loss": 1.4633, + "step": 36835 + }, + { + "epoch": 2.9, + "learning_rate": 8.478883181732399e-07, + "loss": 1.4597, + "step": 36836 + }, + { + "epoch": 2.9, + "learning_rate": 8.465765261011891e-07, + "loss": 1.4763, + "step": 36837 + }, + { + "epoch": 2.9, + "learning_rate": 8.452657466985535e-07, + "loss": 1.4285, + "step": 36838 + }, + { + "epoch": 2.9, + "learning_rate": 8.439559799742591e-07, + "loss": 1.4604, + "step": 36839 + }, + { + "epoch": 2.9, + "learning_rate": 8.426472259371985e-07, + "loss": 1.4118, + "step": 36840 + }, + { + "epoch": 2.9, + "learning_rate": 8.413394845962485e-07, + "loss": 1.3908, + "step": 36841 + }, + { + "epoch": 2.9, + "learning_rate": 8.400327559602849e-07, + "loss": 1.512, + "step": 36842 + }, + { + "epoch": 2.9, + "learning_rate": 8.387270400382007e-07, + "loss": 1.4486, + "step": 36843 + }, + { + "epoch": 2.9, + "learning_rate": 8.374223368388389e-07, + "loss": 1.4087, + "step": 36844 + }, + { + "epoch": 2.9, + "learning_rate": 8.36118646371059e-07, + "loss": 1.4465, + "step": 36845 + }, + { + "epoch": 2.9, + "learning_rate": 8.348159686437206e-07, + "loss": 1.4804, + "step": 36846 + }, + { + "epoch": 2.9, + "learning_rate": 8.335143036656666e-07, + "loss": 1.4543, + "step": 36847 + }, + { + "epoch": 2.9, + "learning_rate": 8.322136514457234e-07, + "loss": 1.4045, + "step": 36848 + }, + { + "epoch": 2.9, + "learning_rate": 8.309140119927504e-07, + "loss": 1.4349, + "step": 36849 + }, + { + "epoch": 2.9, + "learning_rate": 8.296153853155407e-07, + "loss": 1.4338, + "step": 36850 + }, + { + "epoch": 2.9, + "learning_rate": 8.283177714229205e-07, + "loss": 1.4786, + "step": 36851 + }, + { + "epoch": 2.9, + "learning_rate": 8.270211703237162e-07, + "loss": 1.4776, + "step": 36852 + }, + { + "epoch": 2.9, + "learning_rate": 8.257255820267039e-07, + "loss": 1.4271, + "step": 36853 + }, + { + "epoch": 2.9, + "learning_rate": 8.244310065407101e-07, + "loss": 1.4431, + "step": 36854 + }, + { + "epoch": 2.9, + "learning_rate": 8.231374438744942e-07, + "loss": 1.4675, + "step": 36855 + }, + { + "epoch": 2.9, + "learning_rate": 8.218448940368493e-07, + "loss": 1.4414, + "step": 36856 + }, + { + "epoch": 2.9, + "learning_rate": 8.205533570365686e-07, + "loss": 1.4399, + "step": 36857 + }, + { + "epoch": 2.9, + "learning_rate": 8.192628328823947e-07, + "loss": 1.411, + "step": 36858 + }, + { + "epoch": 2.9, + "learning_rate": 8.179733215831041e-07, + "loss": 1.4438, + "step": 36859 + }, + { + "epoch": 2.9, + "learning_rate": 8.166848231474565e-07, + "loss": 1.4106, + "step": 36860 + }, + { + "epoch": 2.9, + "learning_rate": 8.153973375841948e-07, + "loss": 1.4417, + "step": 36861 + }, + { + "epoch": 2.9, + "learning_rate": 8.141108649020456e-07, + "loss": 1.3859, + "step": 36862 + }, + { + "epoch": 2.9, + "learning_rate": 8.128254051097516e-07, + "loss": 1.4707, + "step": 36863 + }, + { + "epoch": 2.9, + "learning_rate": 8.115409582160559e-07, + "loss": 1.4687, + "step": 36864 + }, + { + "epoch": 2.9, + "learning_rate": 8.102575242296683e-07, + "loss": 1.4719, + "step": 36865 + }, + { + "epoch": 2.9, + "learning_rate": 8.089751031592983e-07, + "loss": 1.4368, + "step": 36866 + }, + { + "epoch": 2.9, + "learning_rate": 8.076936950136725e-07, + "loss": 1.4644, + "step": 36867 + }, + { + "epoch": 2.9, + "learning_rate": 8.064132998014505e-07, + "loss": 1.472, + "step": 36868 + }, + { + "epoch": 2.9, + "learning_rate": 8.051339175313587e-07, + "loss": 1.4269, + "step": 36869 + }, + { + "epoch": 2.9, + "learning_rate": 8.038555482120901e-07, + "loss": 1.4376, + "step": 36870 + }, + { + "epoch": 2.9, + "learning_rate": 8.025781918523044e-07, + "loss": 1.4279, + "step": 36871 + }, + { + "epoch": 2.9, + "learning_rate": 8.013018484606615e-07, + "loss": 1.4369, + "step": 36872 + }, + { + "epoch": 2.9, + "learning_rate": 8.000265180458543e-07, + "loss": 1.4687, + "step": 36873 + }, + { + "epoch": 2.9, + "learning_rate": 7.987522006165426e-07, + "loss": 1.4208, + "step": 36874 + }, + { + "epoch": 2.9, + "learning_rate": 7.974788961813527e-07, + "loss": 1.4543, + "step": 36875 + }, + { + "epoch": 2.9, + "learning_rate": 7.962066047489446e-07, + "loss": 1.4494, + "step": 36876 + }, + { + "epoch": 2.9, + "learning_rate": 7.949353263279612e-07, + "loss": 1.5095, + "step": 36877 + }, + { + "epoch": 2.9, + "learning_rate": 7.93665060927029e-07, + "loss": 1.4007, + "step": 36878 + }, + { + "epoch": 2.9, + "learning_rate": 7.923958085547744e-07, + "loss": 1.4134, + "step": 36879 + }, + { + "epoch": 2.9, + "learning_rate": 7.911275692198072e-07, + "loss": 1.4718, + "step": 36880 + }, + { + "epoch": 2.9, + "learning_rate": 7.89860342930737e-07, + "loss": 1.4417, + "step": 36881 + }, + { + "epoch": 2.9, + "learning_rate": 7.885941296961906e-07, + "loss": 1.4486, + "step": 36882 + }, + { + "epoch": 2.9, + "learning_rate": 7.873289295247442e-07, + "loss": 1.4678, + "step": 36883 + }, + { + "epoch": 2.9, + "learning_rate": 7.86064742424991e-07, + "loss": 1.4465, + "step": 36884 + }, + { + "epoch": 2.9, + "learning_rate": 7.848015684055076e-07, + "loss": 1.4401, + "step": 36885 + }, + { + "epoch": 2.9, + "learning_rate": 7.835394074748869e-07, + "loss": 1.4901, + "step": 36886 + }, + { + "epoch": 2.9, + "learning_rate": 7.822782596416722e-07, + "loss": 1.3786, + "step": 36887 + }, + { + "epoch": 2.9, + "learning_rate": 7.810181249144731e-07, + "loss": 1.4659, + "step": 36888 + }, + { + "epoch": 2.9, + "learning_rate": 7.797590033017831e-07, + "loss": 1.4323, + "step": 36889 + }, + { + "epoch": 2.9, + "learning_rate": 7.785008948121951e-07, + "loss": 1.4284, + "step": 36890 + }, + { + "epoch": 2.9, + "learning_rate": 7.772437994542524e-07, + "loss": 1.4289, + "step": 36891 + }, + { + "epoch": 2.9, + "learning_rate": 7.759877172364648e-07, + "loss": 1.4805, + "step": 36892 + }, + { + "epoch": 2.9, + "learning_rate": 7.747326481673754e-07, + "loss": 1.4839, + "step": 36893 + }, + { + "epoch": 2.9, + "learning_rate": 7.734785922554943e-07, + "loss": 1.4513, + "step": 36894 + }, + { + "epoch": 2.9, + "learning_rate": 7.722255495093477e-07, + "loss": 1.4257, + "step": 36895 + }, + { + "epoch": 2.9, + "learning_rate": 7.709735199374456e-07, + "loss": 1.4602, + "step": 36896 + }, + { + "epoch": 2.9, + "learning_rate": 7.697225035482646e-07, + "loss": 1.3968, + "step": 36897 + }, + { + "epoch": 2.9, + "learning_rate": 7.684725003503311e-07, + "loss": 1.4574, + "step": 36898 + }, + { + "epoch": 2.9, + "learning_rate": 7.672235103521219e-07, + "loss": 1.4218, + "step": 36899 + }, + { + "epoch": 2.9, + "learning_rate": 7.659755335620965e-07, + "loss": 1.4461, + "step": 36900 + }, + { + "epoch": 2.9, + "learning_rate": 7.647285699887484e-07, + "loss": 1.4395, + "step": 36901 + }, + { + "epoch": 2.9, + "learning_rate": 7.634826196405375e-07, + "loss": 1.4446, + "step": 36902 + }, + { + "epoch": 2.9, + "learning_rate": 7.622376825259236e-07, + "loss": 1.4395, + "step": 36903 + }, + { + "epoch": 2.9, + "learning_rate": 7.609937586533665e-07, + "loss": 1.4515, + "step": 36904 + }, + { + "epoch": 2.9, + "learning_rate": 7.59750848031293e-07, + "loss": 1.4409, + "step": 36905 + }, + { + "epoch": 2.9, + "learning_rate": 7.58508950668163e-07, + "loss": 1.5041, + "step": 36906 + }, + { + "epoch": 2.9, + "learning_rate": 7.572680665724029e-07, + "loss": 1.4339, + "step": 36907 + }, + { + "epoch": 2.9, + "learning_rate": 7.560281957524228e-07, + "loss": 1.4288, + "step": 36908 + }, + { + "epoch": 2.9, + "learning_rate": 7.547893382166659e-07, + "loss": 1.4165, + "step": 36909 + }, + { + "epoch": 2.9, + "learning_rate": 7.535514939735088e-07, + "loss": 1.4252, + "step": 36910 + }, + { + "epoch": 2.9, + "learning_rate": 7.523146630313781e-07, + "loss": 1.443, + "step": 36911 + }, + { + "epoch": 2.9, + "learning_rate": 7.510788453986838e-07, + "loss": 1.4384, + "step": 36912 + }, + { + "epoch": 2.9, + "learning_rate": 7.498440410837858e-07, + "loss": 1.4766, + "step": 36913 + }, + { + "epoch": 2.9, + "learning_rate": 7.486102500950941e-07, + "loss": 1.4864, + "step": 36914 + }, + { + "epoch": 2.9, + "learning_rate": 7.473774724409853e-07, + "loss": 1.3953, + "step": 36915 + }, + { + "epoch": 2.9, + "learning_rate": 7.461457081298028e-07, + "loss": 1.4346, + "step": 36916 + }, + { + "epoch": 2.9, + "learning_rate": 7.449149571699398e-07, + "loss": 1.4958, + "step": 36917 + }, + { + "epoch": 2.9, + "learning_rate": 7.43685219569723e-07, + "loss": 1.4667, + "step": 36918 + }, + { + "epoch": 2.9, + "learning_rate": 7.424564953375289e-07, + "loss": 1.4699, + "step": 36919 + }, + { + "epoch": 2.9, + "learning_rate": 7.412287844816845e-07, + "loss": 1.4384, + "step": 36920 + }, + { + "epoch": 2.9, + "learning_rate": 7.400020870105328e-07, + "loss": 1.4445, + "step": 36921 + }, + { + "epoch": 2.91, + "learning_rate": 7.38776402932384e-07, + "loss": 1.4782, + "step": 36922 + }, + { + "epoch": 2.91, + "learning_rate": 7.375517322555813e-07, + "loss": 1.4647, + "step": 36923 + }, + { + "epoch": 2.91, + "learning_rate": 7.363280749884349e-07, + "loss": 1.4121, + "step": 36924 + }, + { + "epoch": 2.91, + "learning_rate": 7.351054311392546e-07, + "loss": 1.4147, + "step": 36925 + }, + { + "epoch": 2.91, + "learning_rate": 7.338838007163339e-07, + "loss": 1.4592, + "step": 36926 + }, + { + "epoch": 2.91, + "learning_rate": 7.326631837279662e-07, + "loss": 1.3914, + "step": 36927 + }, + { + "epoch": 2.91, + "learning_rate": 7.314435801824448e-07, + "loss": 1.468, + "step": 36928 + }, + { + "epoch": 2.91, + "learning_rate": 7.302249900880464e-07, + "loss": 1.3865, + "step": 36929 + }, + { + "epoch": 2.91, + "learning_rate": 7.290074134530477e-07, + "loss": 1.4552, + "step": 36930 + }, + { + "epoch": 2.91, + "learning_rate": 7.277908502857255e-07, + "loss": 1.5316, + "step": 36931 + }, + { + "epoch": 2.91, + "learning_rate": 7.265753005943231e-07, + "loss": 1.4628, + "step": 36932 + }, + { + "epoch": 2.91, + "learning_rate": 7.25360764387084e-07, + "loss": 1.4555, + "step": 36933 + }, + { + "epoch": 2.91, + "learning_rate": 7.241472416722849e-07, + "loss": 1.4146, + "step": 36934 + }, + { + "epoch": 2.91, + "learning_rate": 7.229347324581359e-07, + "loss": 1.3827, + "step": 36935 + }, + { + "epoch": 2.91, + "learning_rate": 7.217232367528969e-07, + "loss": 1.4071, + "step": 36936 + }, + { + "epoch": 2.91, + "learning_rate": 7.205127545647616e-07, + "loss": 1.4072, + "step": 36937 + }, + { + "epoch": 2.91, + "learning_rate": 7.193032859019732e-07, + "loss": 1.4261, + "step": 36938 + }, + { + "epoch": 2.91, + "learning_rate": 7.180948307727418e-07, + "loss": 1.4052, + "step": 36939 + }, + { + "epoch": 2.91, + "learning_rate": 7.168873891852611e-07, + "loss": 1.3951, + "step": 36940 + }, + { + "epoch": 2.91, + "learning_rate": 7.156809611477243e-07, + "loss": 1.4757, + "step": 36941 + }, + { + "epoch": 2.91, + "learning_rate": 7.144755466683416e-07, + "loss": 1.4627, + "step": 36942 + }, + { + "epoch": 2.91, + "learning_rate": 7.132711457552898e-07, + "loss": 1.4686, + "step": 36943 + }, + { + "epoch": 2.91, + "learning_rate": 7.120677584167456e-07, + "loss": 1.4515, + "step": 36944 + }, + { + "epoch": 2.91, + "learning_rate": 7.108653846608691e-07, + "loss": 1.4504, + "step": 36945 + }, + { + "epoch": 2.91, + "learning_rate": 7.096640244958374e-07, + "loss": 1.4431, + "step": 36946 + }, + { + "epoch": 2.91, + "learning_rate": 7.084636779297936e-07, + "loss": 1.4493, + "step": 36947 + }, + { + "epoch": 2.91, + "learning_rate": 7.072643449709148e-07, + "loss": 1.4502, + "step": 36948 + }, + { + "epoch": 2.91, + "learning_rate": 7.060660256273109e-07, + "loss": 1.4397, + "step": 36949 + }, + { + "epoch": 2.91, + "learning_rate": 7.048687199071424e-07, + "loss": 1.428, + "step": 36950 + }, + { + "epoch": 2.91, + "learning_rate": 7.036724278185024e-07, + "loss": 1.4253, + "step": 36951 + }, + { + "epoch": 2.91, + "learning_rate": 7.024771493695513e-07, + "loss": 1.4567, + "step": 36952 + }, + { + "epoch": 2.91, + "learning_rate": 7.012828845683994e-07, + "loss": 1.4094, + "step": 36953 + }, + { + "epoch": 2.91, + "learning_rate": 7.000896334231398e-07, + "loss": 1.4429, + "step": 36954 + }, + { + "epoch": 2.91, + "learning_rate": 6.988973959418831e-07, + "loss": 1.4407, + "step": 36955 + }, + { + "epoch": 2.91, + "learning_rate": 6.977061721327226e-07, + "loss": 1.4305, + "step": 36956 + }, + { + "epoch": 2.91, + "learning_rate": 6.965159620037353e-07, + "loss": 1.4901, + "step": 36957 + }, + { + "epoch": 2.91, + "learning_rate": 6.953267655630146e-07, + "loss": 1.4433, + "step": 36958 + }, + { + "epoch": 2.91, + "learning_rate": 6.941385828186541e-07, + "loss": 1.4541, + "step": 36959 + }, + { + "epoch": 2.91, + "learning_rate": 6.929514137786807e-07, + "loss": 1.4108, + "step": 36960 + }, + { + "epoch": 2.91, + "learning_rate": 6.917652584511712e-07, + "loss": 1.4201, + "step": 36961 + }, + { + "epoch": 2.91, + "learning_rate": 6.90580116844186e-07, + "loss": 1.4823, + "step": 36962 + }, + { + "epoch": 2.91, + "learning_rate": 6.893959889657685e-07, + "loss": 1.4335, + "step": 36963 + }, + { + "epoch": 2.91, + "learning_rate": 6.882128748239457e-07, + "loss": 1.4228, + "step": 36964 + }, + { + "epoch": 2.91, + "learning_rate": 6.870307744267611e-07, + "loss": 1.4465, + "step": 36965 + }, + { + "epoch": 2.91, + "learning_rate": 6.858496877822417e-07, + "loss": 1.427, + "step": 36966 + }, + { + "epoch": 2.91, + "learning_rate": 6.846696148984144e-07, + "loss": 1.492, + "step": 36967 + }, + { + "epoch": 2.91, + "learning_rate": 6.834905557832726e-07, + "loss": 1.4458, + "step": 36968 + }, + { + "epoch": 2.91, + "learning_rate": 6.823125104448268e-07, + "loss": 1.4367, + "step": 36969 + }, + { + "epoch": 2.91, + "learning_rate": 6.811354788910872e-07, + "loss": 1.4353, + "step": 36970 + }, + { + "epoch": 2.91, + "learning_rate": 6.799594611300307e-07, + "loss": 1.4756, + "step": 36971 + }, + { + "epoch": 2.91, + "learning_rate": 6.78784457169651e-07, + "loss": 1.464, + "step": 36972 + }, + { + "epoch": 2.91, + "learning_rate": 6.77610467017925e-07, + "loss": 1.4305, + "step": 36973 + }, + { + "epoch": 2.91, + "learning_rate": 6.76437490682813e-07, + "loss": 1.409, + "step": 36974 + }, + { + "epoch": 2.91, + "learning_rate": 6.752655281722918e-07, + "loss": 1.4564, + "step": 36975 + }, + { + "epoch": 2.91, + "learning_rate": 6.74094579494322e-07, + "loss": 1.466, + "step": 36976 + }, + { + "epoch": 2.91, + "learning_rate": 6.729246446568304e-07, + "loss": 1.4559, + "step": 36977 + }, + { + "epoch": 2.91, + "learning_rate": 6.717557236677773e-07, + "loss": 1.3857, + "step": 36978 + }, + { + "epoch": 2.91, + "learning_rate": 6.705878165351064e-07, + "loss": 1.4436, + "step": 36979 + }, + { + "epoch": 2.91, + "learning_rate": 6.694209232667446e-07, + "loss": 1.4477, + "step": 36980 + }, + { + "epoch": 2.91, + "learning_rate": 6.682550438705859e-07, + "loss": 1.4855, + "step": 36981 + }, + { + "epoch": 2.91, + "learning_rate": 6.670901783545735e-07, + "loss": 1.4737, + "step": 36982 + }, + { + "epoch": 2.91, + "learning_rate": 6.659263267266179e-07, + "loss": 1.433, + "step": 36983 + }, + { + "epoch": 2.91, + "learning_rate": 6.647634889945963e-07, + "loss": 1.4108, + "step": 36984 + }, + { + "epoch": 2.91, + "learning_rate": 6.636016651664355e-07, + "loss": 1.4063, + "step": 36985 + }, + { + "epoch": 2.91, + "learning_rate": 6.624408552500127e-07, + "loss": 1.4891, + "step": 36986 + }, + { + "epoch": 2.91, + "learning_rate": 6.612810592532048e-07, + "loss": 1.482, + "step": 36987 + }, + { + "epoch": 2.91, + "learning_rate": 6.601222771838721e-07, + "loss": 1.4881, + "step": 36988 + }, + { + "epoch": 2.91, + "learning_rate": 6.589645090499085e-07, + "loss": 1.4542, + "step": 36989 + }, + { + "epoch": 2.91, + "learning_rate": 6.578077548591576e-07, + "loss": 1.4318, + "step": 36990 + }, + { + "epoch": 2.91, + "learning_rate": 6.566520146194798e-07, + "loss": 1.4868, + "step": 36991 + }, + { + "epoch": 2.91, + "learning_rate": 6.554972883387189e-07, + "loss": 1.4473, + "step": 36992 + }, + { + "epoch": 2.91, + "learning_rate": 6.543435760247185e-07, + "loss": 1.455, + "step": 36993 + }, + { + "epoch": 2.91, + "learning_rate": 6.531908776853057e-07, + "loss": 1.4594, + "step": 36994 + }, + { + "epoch": 2.91, + "learning_rate": 6.520391933283076e-07, + "loss": 1.402, + "step": 36995 + }, + { + "epoch": 2.91, + "learning_rate": 6.508885229615512e-07, + "loss": 1.4089, + "step": 36996 + }, + { + "epoch": 2.91, + "learning_rate": 6.497388665928471e-07, + "loss": 1.4798, + "step": 36997 + }, + { + "epoch": 2.91, + "learning_rate": 6.48590224229989e-07, + "loss": 1.4416, + "step": 36998 + }, + { + "epoch": 2.91, + "learning_rate": 6.474425958808038e-07, + "loss": 1.4478, + "step": 36999 + }, + { + "epoch": 2.91, + "learning_rate": 6.462959815530522e-07, + "loss": 1.4577, + "step": 37000 + }, + { + "epoch": 2.91, + "learning_rate": 6.451503812545278e-07, + "loss": 1.4983, + "step": 37001 + }, + { + "epoch": 2.91, + "learning_rate": 6.440057949930078e-07, + "loss": 1.4215, + "step": 37002 + }, + { + "epoch": 2.91, + "learning_rate": 6.428622227762692e-07, + "loss": 1.44, + "step": 37003 + }, + { + "epoch": 2.91, + "learning_rate": 6.417196646120726e-07, + "loss": 1.4452, + "step": 37004 + }, + { + "epoch": 2.91, + "learning_rate": 6.405781205081784e-07, + "loss": 1.4652, + "step": 37005 + }, + { + "epoch": 2.91, + "learning_rate": 6.39437590472347e-07, + "loss": 1.4743, + "step": 37006 + }, + { + "epoch": 2.91, + "learning_rate": 6.382980745123056e-07, + "loss": 1.4659, + "step": 37007 + }, + { + "epoch": 2.91, + "learning_rate": 6.371595726357815e-07, + "loss": 1.4185, + "step": 37008 + }, + { + "epoch": 2.91, + "learning_rate": 6.360220848505349e-07, + "loss": 1.3977, + "step": 37009 + }, + { + "epoch": 2.91, + "learning_rate": 6.348856111642598e-07, + "loss": 1.4341, + "step": 37010 + }, + { + "epoch": 2.91, + "learning_rate": 6.337501515846998e-07, + "loss": 1.4082, + "step": 37011 + }, + { + "epoch": 2.91, + "learning_rate": 6.326157061195325e-07, + "loss": 1.4359, + "step": 37012 + }, + { + "epoch": 2.91, + "learning_rate": 6.314822747764847e-07, + "loss": 1.4219, + "step": 37013 + }, + { + "epoch": 2.91, + "learning_rate": 6.303498575632504e-07, + "loss": 1.4351, + "step": 37014 + }, + { + "epoch": 2.91, + "learning_rate": 6.292184544875067e-07, + "loss": 1.4999, + "step": 37015 + }, + { + "epoch": 2.91, + "learning_rate": 6.280880655569309e-07, + "loss": 1.3828, + "step": 37016 + }, + { + "epoch": 2.91, + "learning_rate": 6.269586907792168e-07, + "loss": 1.4204, + "step": 37017 + }, + { + "epoch": 2.91, + "learning_rate": 6.258303301620249e-07, + "loss": 1.4672, + "step": 37018 + }, + { + "epoch": 2.91, + "learning_rate": 6.247029837130158e-07, + "loss": 1.4422, + "step": 37019 + }, + { + "epoch": 2.91, + "learning_rate": 6.235766514398166e-07, + "loss": 1.4198, + "step": 37020 + }, + { + "epoch": 2.91, + "learning_rate": 6.224513333501213e-07, + "loss": 1.3874, + "step": 37021 + }, + { + "epoch": 2.91, + "learning_rate": 6.213270294515404e-07, + "loss": 1.4794, + "step": 37022 + }, + { + "epoch": 2.91, + "learning_rate": 6.202037397517346e-07, + "loss": 1.4272, + "step": 37023 + }, + { + "epoch": 2.91, + "learning_rate": 6.190814642582809e-07, + "loss": 1.4457, + "step": 37024 + }, + { + "epoch": 2.91, + "learning_rate": 6.1796020297884e-07, + "loss": 1.4431, + "step": 37025 + }, + { + "epoch": 2.91, + "learning_rate": 6.168399559210224e-07, + "loss": 1.4162, + "step": 37026 + }, + { + "epoch": 2.91, + "learning_rate": 6.157207230924222e-07, + "loss": 1.436, + "step": 37027 + }, + { + "epoch": 2.91, + "learning_rate": 6.146025045006331e-07, + "loss": 1.4787, + "step": 37028 + }, + { + "epoch": 2.91, + "learning_rate": 6.134853001532658e-07, + "loss": 1.4056, + "step": 37029 + }, + { + "epoch": 2.91, + "learning_rate": 6.123691100578976e-07, + "loss": 1.4623, + "step": 37030 + }, + { + "epoch": 2.91, + "learning_rate": 6.11253934222089e-07, + "loss": 1.4417, + "step": 37031 + }, + { + "epoch": 2.91, + "learning_rate": 6.101397726534341e-07, + "loss": 1.4635, + "step": 37032 + }, + { + "epoch": 2.91, + "learning_rate": 6.090266253594933e-07, + "loss": 1.4466, + "step": 37033 + }, + { + "epoch": 2.91, + "learning_rate": 6.079144923478108e-07, + "loss": 1.4499, + "step": 37034 + }, + { + "epoch": 2.91, + "learning_rate": 6.06803373625947e-07, + "loss": 1.4623, + "step": 37035 + }, + { + "epoch": 2.91, + "learning_rate": 6.056932692014627e-07, + "loss": 1.481, + "step": 37036 + }, + { + "epoch": 2.91, + "learning_rate": 6.045841790818684e-07, + "loss": 1.4338, + "step": 37037 + }, + { + "epoch": 2.91, + "learning_rate": 6.034761032747082e-07, + "loss": 1.4517, + "step": 37038 + }, + { + "epoch": 2.91, + "learning_rate": 6.023690417874926e-07, + "loss": 1.4183, + "step": 37039 + }, + { + "epoch": 2.91, + "learning_rate": 6.012629946277492e-07, + "loss": 1.4401, + "step": 37040 + }, + { + "epoch": 2.91, + "learning_rate": 6.001579618029884e-07, + "loss": 1.4898, + "step": 37041 + }, + { + "epoch": 2.91, + "learning_rate": 5.990539433207043e-07, + "loss": 1.4228, + "step": 37042 + }, + { + "epoch": 2.91, + "learning_rate": 5.979509391884074e-07, + "loss": 1.4853, + "step": 37043 + }, + { + "epoch": 2.91, + "learning_rate": 5.968489494135753e-07, + "loss": 1.4005, + "step": 37044 + }, + { + "epoch": 2.91, + "learning_rate": 5.957479740036853e-07, + "loss": 1.3924, + "step": 37045 + }, + { + "epoch": 2.91, + "learning_rate": 5.946480129662146e-07, + "loss": 1.4571, + "step": 37046 + }, + { + "epoch": 2.91, + "learning_rate": 5.935490663086572e-07, + "loss": 1.4521, + "step": 37047 + }, + { + "epoch": 2.91, + "learning_rate": 5.924511340384408e-07, + "loss": 1.4679, + "step": 37048 + }, + { + "epoch": 2.92, + "learning_rate": 5.913542161630092e-07, + "loss": 1.4575, + "step": 37049 + }, + { + "epoch": 2.92, + "learning_rate": 5.902583126898563e-07, + "loss": 1.4975, + "step": 37050 + }, + { + "epoch": 2.92, + "learning_rate": 5.891634236263931e-07, + "loss": 1.4999, + "step": 37051 + }, + { + "epoch": 2.92, + "learning_rate": 5.880695489800635e-07, + "loss": 1.4208, + "step": 37052 + }, + { + "epoch": 2.92, + "learning_rate": 5.869766887582783e-07, + "loss": 1.434, + "step": 37053 + }, + { + "epoch": 2.92, + "learning_rate": 5.858848429684648e-07, + "loss": 1.469, + "step": 37054 + }, + { + "epoch": 2.92, + "learning_rate": 5.847940116180505e-07, + "loss": 1.4825, + "step": 37055 + }, + { + "epoch": 2.92, + "learning_rate": 5.837041947144294e-07, + "loss": 1.4325, + "step": 37056 + }, + { + "epoch": 2.92, + "learning_rate": 5.826153922650123e-07, + "loss": 1.4666, + "step": 37057 + }, + { + "epoch": 2.92, + "learning_rate": 5.815276042771599e-07, + "loss": 1.4528, + "step": 37058 + }, + { + "epoch": 2.92, + "learning_rate": 5.80440830758283e-07, + "loss": 1.4158, + "step": 37059 + }, + { + "epoch": 2.92, + "learning_rate": 5.793550717157758e-07, + "loss": 1.4388, + "step": 37060 + }, + { + "epoch": 2.92, + "learning_rate": 5.782703271569822e-07, + "loss": 1.4198, + "step": 37061 + }, + { + "epoch": 2.92, + "learning_rate": 5.77186597089263e-07, + "loss": 1.4711, + "step": 37062 + }, + { + "epoch": 2.92, + "learning_rate": 5.761038815199958e-07, + "loss": 1.4473, + "step": 37063 + }, + { + "epoch": 2.92, + "learning_rate": 5.750221804565247e-07, + "loss": 1.4619, + "step": 37064 + }, + { + "epoch": 2.92, + "learning_rate": 5.739414939061937e-07, + "loss": 1.4291, + "step": 37065 + }, + { + "epoch": 2.92, + "learning_rate": 5.72861821876347e-07, + "loss": 1.4304, + "step": 37066 + }, + { + "epoch": 2.92, + "learning_rate": 5.717831643742954e-07, + "loss": 1.465, + "step": 37067 + }, + { + "epoch": 2.92, + "learning_rate": 5.70705521407383e-07, + "loss": 1.3993, + "step": 37068 + }, + { + "epoch": 2.92, + "learning_rate": 5.696288929829206e-07, + "loss": 1.4516, + "step": 37069 + }, + { + "epoch": 2.92, + "learning_rate": 5.685532791082026e-07, + "loss": 1.4203, + "step": 37070 + }, + { + "epoch": 2.92, + "learning_rate": 5.674786797905562e-07, + "loss": 1.4729, + "step": 37071 + }, + { + "epoch": 2.92, + "learning_rate": 5.664050950372589e-07, + "loss": 1.4207, + "step": 37072 + }, + { + "epoch": 2.92, + "learning_rate": 5.653325248556051e-07, + "loss": 1.4549, + "step": 37073 + }, + { + "epoch": 2.92, + "learning_rate": 5.642609692528888e-07, + "loss": 1.3821, + "step": 37074 + }, + { + "epoch": 2.92, + "learning_rate": 5.631904282363709e-07, + "loss": 1.463, + "step": 37075 + }, + { + "epoch": 2.92, + "learning_rate": 5.621209018133121e-07, + "loss": 1.4691, + "step": 37076 + }, + { + "epoch": 2.92, + "learning_rate": 5.610523899910068e-07, + "loss": 1.4933, + "step": 37077 + }, + { + "epoch": 2.92, + "learning_rate": 5.599848927766826e-07, + "loss": 1.4488, + "step": 37078 + }, + { + "epoch": 2.92, + "learning_rate": 5.589184101775835e-07, + "loss": 1.4079, + "step": 37079 + }, + { + "epoch": 2.92, + "learning_rate": 5.578529422009537e-07, + "loss": 1.4486, + "step": 37080 + }, + { + "epoch": 2.92, + "learning_rate": 5.567884888540542e-07, + "loss": 1.4937, + "step": 37081 + }, + { + "epoch": 2.92, + "learning_rate": 5.557250501440791e-07, + "loss": 1.4054, + "step": 37082 + }, + { + "epoch": 2.92, + "learning_rate": 5.546626260782561e-07, + "loss": 1.4805, + "step": 37083 + }, + { + "epoch": 2.92, + "learning_rate": 5.536012166638127e-07, + "loss": 1.5109, + "step": 37084 + }, + { + "epoch": 2.92, + "learning_rate": 5.52540821907943e-07, + "loss": 1.4892, + "step": 37085 + }, + { + "epoch": 2.92, + "learning_rate": 5.514814418178581e-07, + "loss": 1.3923, + "step": 37086 + }, + { + "epoch": 2.92, + "learning_rate": 5.504230764007355e-07, + "loss": 1.4524, + "step": 37087 + }, + { + "epoch": 2.92, + "learning_rate": 5.49365725663753e-07, + "loss": 1.4126, + "step": 37088 + }, + { + "epoch": 2.92, + "learning_rate": 5.483093896141211e-07, + "loss": 1.4253, + "step": 37089 + }, + { + "epoch": 2.92, + "learning_rate": 5.472540682589843e-07, + "loss": 1.4637, + "step": 37090 + }, + { + "epoch": 2.92, + "learning_rate": 5.461997616055203e-07, + "loss": 1.4524, + "step": 37091 + }, + { + "epoch": 2.92, + "learning_rate": 5.451464696608898e-07, + "loss": 1.4123, + "step": 37092 + }, + { + "epoch": 2.92, + "learning_rate": 5.440941924322373e-07, + "loss": 1.4494, + "step": 37093 + }, + { + "epoch": 2.92, + "learning_rate": 5.43042929926707e-07, + "loss": 1.4365, + "step": 37094 + }, + { + "epoch": 2.92, + "learning_rate": 5.419926821514431e-07, + "loss": 1.3675, + "step": 37095 + }, + { + "epoch": 2.92, + "learning_rate": 5.409434491135567e-07, + "loss": 1.4774, + "step": 37096 + }, + { + "epoch": 2.92, + "learning_rate": 5.39895230820192e-07, + "loss": 1.4244, + "step": 37097 + }, + { + "epoch": 2.92, + "learning_rate": 5.388480272784601e-07, + "loss": 1.4559, + "step": 37098 + }, + { + "epoch": 2.92, + "learning_rate": 5.378018384954719e-07, + "loss": 1.43, + "step": 37099 + }, + { + "epoch": 2.92, + "learning_rate": 5.367566644783383e-07, + "loss": 1.4426, + "step": 37100 + }, + { + "epoch": 2.92, + "learning_rate": 5.357125052341371e-07, + "loss": 1.3898, + "step": 37101 + }, + { + "epoch": 2.92, + "learning_rate": 5.346693607699625e-07, + "loss": 1.4483, + "step": 37102 + }, + { + "epoch": 2.92, + "learning_rate": 5.336272310929091e-07, + "loss": 1.409, + "step": 37103 + }, + { + "epoch": 2.92, + "learning_rate": 5.325861162100375e-07, + "loss": 1.4351, + "step": 37104 + }, + { + "epoch": 2.92, + "learning_rate": 5.315460161284423e-07, + "loss": 1.4556, + "step": 37105 + }, + { + "epoch": 2.92, + "learning_rate": 5.305069308551513e-07, + "loss": 1.4258, + "step": 37106 + }, + { + "epoch": 2.92, + "learning_rate": 5.294688603972253e-07, + "loss": 1.4185, + "step": 37107 + }, + { + "epoch": 2.92, + "learning_rate": 5.284318047617254e-07, + "loss": 1.4559, + "step": 37108 + }, + { + "epoch": 2.92, + "learning_rate": 5.273957639556958e-07, + "loss": 1.4549, + "step": 37109 + }, + { + "epoch": 2.92, + "learning_rate": 5.263607379861645e-07, + "loss": 1.4439, + "step": 37110 + }, + { + "epoch": 2.92, + "learning_rate": 5.25326726860159e-07, + "loss": 1.4388, + "step": 37111 + }, + { + "epoch": 2.92, + "learning_rate": 5.242937305846906e-07, + "loss": 1.464, + "step": 37112 + }, + { + "epoch": 2.92, + "learning_rate": 5.232617491667701e-07, + "loss": 1.4145, + "step": 37113 + }, + { + "epoch": 2.92, + "learning_rate": 5.222307826134253e-07, + "loss": 1.4871, + "step": 37114 + }, + { + "epoch": 2.92, + "learning_rate": 5.212008309316506e-07, + "loss": 1.4486, + "step": 37115 + }, + { + "epoch": 2.92, + "learning_rate": 5.201718941284239e-07, + "loss": 1.4812, + "step": 37116 + }, + { + "epoch": 2.92, + "learning_rate": 5.191439722107393e-07, + "loss": 1.4507, + "step": 37117 + }, + { + "epoch": 2.92, + "learning_rate": 5.181170651855915e-07, + "loss": 1.39, + "step": 37118 + }, + { + "epoch": 2.92, + "learning_rate": 5.170911730599248e-07, + "loss": 1.4342, + "step": 37119 + }, + { + "epoch": 2.92, + "learning_rate": 5.160662958407335e-07, + "loss": 1.4156, + "step": 37120 + }, + { + "epoch": 2.92, + "learning_rate": 5.150424335349457e-07, + "loss": 1.4235, + "step": 37121 + }, + { + "epoch": 2.92, + "learning_rate": 5.140195861495223e-07, + "loss": 1.4332, + "step": 37122 + }, + { + "epoch": 2.92, + "learning_rate": 5.129977536914242e-07, + "loss": 1.4721, + "step": 37123 + }, + { + "epoch": 2.92, + "learning_rate": 5.119769361675629e-07, + "loss": 1.4313, + "step": 37124 + }, + { + "epoch": 2.92, + "learning_rate": 5.109571335848994e-07, + "loss": 1.4262, + "step": 37125 + }, + { + "epoch": 2.92, + "learning_rate": 5.099383459503448e-07, + "loss": 1.4431, + "step": 37126 + }, + { + "epoch": 2.92, + "learning_rate": 5.089205732707935e-07, + "loss": 1.4663, + "step": 37127 + }, + { + "epoch": 2.92, + "learning_rate": 5.0790381555319e-07, + "loss": 1.4663, + "step": 37128 + }, + { + "epoch": 2.92, + "learning_rate": 5.068880728044289e-07, + "loss": 1.4676, + "step": 37129 + }, + { + "epoch": 2.92, + "learning_rate": 5.058733450313878e-07, + "loss": 1.4346, + "step": 37130 + }, + { + "epoch": 2.92, + "learning_rate": 5.048596322409615e-07, + "loss": 1.4981, + "step": 37131 + }, + { + "epoch": 2.92, + "learning_rate": 5.038469344400609e-07, + "loss": 1.4702, + "step": 37132 + }, + { + "epoch": 2.92, + "learning_rate": 5.028352516355305e-07, + "loss": 1.4501, + "step": 37133 + }, + { + "epoch": 2.92, + "learning_rate": 5.018245838342483e-07, + "loss": 1.4182, + "step": 37134 + }, + { + "epoch": 2.92, + "learning_rate": 5.008149310430753e-07, + "loss": 1.4625, + "step": 37135 + }, + { + "epoch": 2.92, + "learning_rate": 4.998062932688728e-07, + "loss": 1.4457, + "step": 37136 + }, + { + "epoch": 2.92, + "learning_rate": 4.987986705184854e-07, + "loss": 1.4733, + "step": 37137 + }, + { + "epoch": 2.92, + "learning_rate": 4.977920627987575e-07, + "loss": 1.4629, + "step": 37138 + }, + { + "epoch": 2.92, + "learning_rate": 4.96786470116517e-07, + "loss": 1.4296, + "step": 37139 + }, + { + "epoch": 2.92, + "learning_rate": 4.957818924785917e-07, + "loss": 1.4247, + "step": 37140 + }, + { + "epoch": 2.92, + "learning_rate": 4.947783298917929e-07, + "loss": 1.4485, + "step": 37141 + }, + { + "epoch": 2.92, + "learning_rate": 4.937757823629651e-07, + "loss": 1.4458, + "step": 37142 + }, + { + "epoch": 2.92, + "learning_rate": 4.927742498988862e-07, + "loss": 1.4407, + "step": 37143 + }, + { + "epoch": 2.92, + "learning_rate": 4.917737325063675e-07, + "loss": 1.4231, + "step": 37144 + }, + { + "epoch": 2.92, + "learning_rate": 4.907742301921868e-07, + "loss": 1.4765, + "step": 37145 + }, + { + "epoch": 2.92, + "learning_rate": 4.897757429631555e-07, + "loss": 1.416, + "step": 37146 + }, + { + "epoch": 2.92, + "learning_rate": 4.887782708260346e-07, + "loss": 1.4343, + "step": 37147 + }, + { + "epoch": 2.92, + "learning_rate": 4.877818137876022e-07, + "loss": 1.4919, + "step": 37148 + }, + { + "epoch": 2.92, + "learning_rate": 4.867863718546361e-07, + "loss": 1.4254, + "step": 37149 + }, + { + "epoch": 2.92, + "learning_rate": 4.85791945033881e-07, + "loss": 1.4077, + "step": 37150 + }, + { + "epoch": 2.92, + "learning_rate": 4.847985333320647e-07, + "loss": 1.3866, + "step": 37151 + }, + { + "epoch": 2.92, + "learning_rate": 4.83806136755982e-07, + "loss": 1.45, + "step": 37152 + }, + { + "epoch": 2.92, + "learning_rate": 4.82814755312344e-07, + "loss": 1.4375, + "step": 37153 + }, + { + "epoch": 2.92, + "learning_rate": 4.818243890078788e-07, + "loss": 1.3966, + "step": 37154 + }, + { + "epoch": 2.92, + "learning_rate": 4.808350378493142e-07, + "loss": 1.4056, + "step": 37155 + }, + { + "epoch": 2.92, + "learning_rate": 4.798467018433616e-07, + "loss": 1.4295, + "step": 37156 + }, + { + "epoch": 2.92, + "learning_rate": 4.788593809967489e-07, + "loss": 1.4658, + "step": 37157 + }, + { + "epoch": 2.92, + "learning_rate": 4.778730753161542e-07, + "loss": 1.4316, + "step": 37158 + }, + { + "epoch": 2.92, + "learning_rate": 4.768877848083052e-07, + "loss": 1.4337, + "step": 37159 + }, + { + "epoch": 2.92, + "learning_rate": 4.7590350947986353e-07, + "loss": 1.4507, + "step": 37160 + }, + { + "epoch": 2.92, + "learning_rate": 4.749202493375237e-07, + "loss": 1.4959, + "step": 37161 + }, + { + "epoch": 2.92, + "learning_rate": 4.739380043879637e-07, + "loss": 1.3826, + "step": 37162 + }, + { + "epoch": 2.92, + "learning_rate": 4.729567746378449e-07, + "loss": 1.3945, + "step": 37163 + }, + { + "epoch": 2.92, + "learning_rate": 4.719765600938452e-07, + "loss": 1.4555, + "step": 37164 + }, + { + "epoch": 2.92, + "learning_rate": 4.7099736076259274e-07, + "loss": 1.451, + "step": 37165 + }, + { + "epoch": 2.92, + "learning_rate": 4.700191766507655e-07, + "loss": 1.4414, + "step": 37166 + }, + { + "epoch": 2.92, + "learning_rate": 4.6904200776499145e-07, + "loss": 1.4778, + "step": 37167 + }, + { + "epoch": 2.92, + "learning_rate": 4.680658541118987e-07, + "loss": 1.4237, + "step": 37168 + }, + { + "epoch": 2.92, + "learning_rate": 4.6709071569811517e-07, + "loss": 1.429, + "step": 37169 + }, + { + "epoch": 2.92, + "learning_rate": 4.66116592530269e-07, + "loss": 1.5003, + "step": 37170 + }, + { + "epoch": 2.92, + "learning_rate": 4.651434846149715e-07, + "loss": 1.4308, + "step": 37171 + }, + { + "epoch": 2.92, + "learning_rate": 4.641713919588341e-07, + "loss": 1.4922, + "step": 37172 + }, + { + "epoch": 2.92, + "learning_rate": 4.6320031456845153e-07, + "loss": 1.4255, + "step": 37173 + }, + { + "epoch": 2.92, + "learning_rate": 4.6223025245041844e-07, + "loss": 1.4273, + "step": 37174 + }, + { + "epoch": 2.92, + "learning_rate": 4.6126120561131296e-07, + "loss": 1.4606, + "step": 37175 + }, + { + "epoch": 2.93, + "learning_rate": 4.602931740577298e-07, + "loss": 1.4497, + "step": 37176 + }, + { + "epoch": 2.93, + "learning_rate": 4.5932615779621373e-07, + "loss": 1.4498, + "step": 37177 + }, + { + "epoch": 2.93, + "learning_rate": 4.5836015683337615e-07, + "loss": 1.4704, + "step": 37178 + }, + { + "epoch": 2.93, + "learning_rate": 4.5739517117572843e-07, + "loss": 1.4413, + "step": 37179 + }, + { + "epoch": 2.93, + "learning_rate": 4.5643120082984874e-07, + "loss": 1.4706, + "step": 37180 + }, + { + "epoch": 2.93, + "learning_rate": 4.554682458022818e-07, + "loss": 1.4637, + "step": 37181 + }, + { + "epoch": 2.93, + "learning_rate": 4.5450630609955576e-07, + "loss": 1.4302, + "step": 37182 + }, + { + "epoch": 2.93, + "learning_rate": 4.535453817282153e-07, + "loss": 1.4441, + "step": 37183 + }, + { + "epoch": 2.93, + "learning_rate": 4.52585472694772e-07, + "loss": 1.4677, + "step": 37184 + }, + { + "epoch": 2.93, + "learning_rate": 4.5162657900573717e-07, + "loss": 1.424, + "step": 37185 + }, + { + "epoch": 2.93, + "learning_rate": 4.5066870066763904e-07, + "loss": 1.5204, + "step": 37186 + }, + { + "epoch": 2.93, + "learning_rate": 4.497118376869724e-07, + "loss": 1.4127, + "step": 37187 + }, + { + "epoch": 2.93, + "learning_rate": 4.48755990070232e-07, + "loss": 1.4797, + "step": 37188 + }, + { + "epoch": 2.93, + "learning_rate": 4.47801157823896e-07, + "loss": 1.437, + "step": 37189 + }, + { + "epoch": 2.93, + "learning_rate": 4.4684734095447595e-07, + "loss": 1.4762, + "step": 37190 + }, + { + "epoch": 2.93, + "learning_rate": 4.4589453946843323e-07, + "loss": 1.4072, + "step": 37191 + }, + { + "epoch": 2.93, + "learning_rate": 4.4494275337221274e-07, + "loss": 1.413, + "step": 37192 + }, + { + "epoch": 2.93, + "learning_rate": 4.4399198267232593e-07, + "loss": 1.5018, + "step": 37193 + }, + { + "epoch": 2.93, + "learning_rate": 4.4304222737520103e-07, + "loss": 1.4073, + "step": 37194 + }, + { + "epoch": 2.93, + "learning_rate": 4.4209348748726614e-07, + "loss": 1.4792, + "step": 37195 + }, + { + "epoch": 2.93, + "learning_rate": 4.411457630149995e-07, + "loss": 1.4646, + "step": 37196 + }, + { + "epoch": 2.93, + "learning_rate": 4.4019905396482923e-07, + "loss": 1.4644, + "step": 37197 + }, + { + "epoch": 2.93, + "learning_rate": 4.392533603431503e-07, + "loss": 1.4648, + "step": 37198 + }, + { + "epoch": 2.93, + "learning_rate": 4.383086821564241e-07, + "loss": 1.4486, + "step": 37199 + }, + { + "epoch": 2.93, + "learning_rate": 4.3736501941104565e-07, + "loss": 1.4675, + "step": 37200 + }, + { + "epoch": 2.93, + "learning_rate": 4.364223721134097e-07, + "loss": 1.4173, + "step": 37201 + }, + { + "epoch": 2.93, + "learning_rate": 4.354807402699445e-07, + "loss": 1.4745, + "step": 37202 + }, + { + "epoch": 2.93, + "learning_rate": 4.3454012388701163e-07, + "loss": 1.4129, + "step": 37203 + }, + { + "epoch": 2.93, + "learning_rate": 4.3360052297102264e-07, + "loss": 1.4639, + "step": 37204 + }, + { + "epoch": 2.93, + "learning_rate": 4.3266193752835575e-07, + "loss": 1.4686, + "step": 37205 + }, + { + "epoch": 2.93, + "learning_rate": 4.3172436756537254e-07, + "loss": 1.5114, + "step": 37206 + }, + { + "epoch": 2.93, + "learning_rate": 4.307878130884346e-07, + "loss": 1.4785, + "step": 37207 + }, + { + "epoch": 2.93, + "learning_rate": 4.298522741039201e-07, + "loss": 1.4548, + "step": 37208 + }, + { + "epoch": 2.93, + "learning_rate": 4.289177506181574e-07, + "loss": 1.4722, + "step": 37209 + }, + { + "epoch": 2.93, + "learning_rate": 4.2798424263750795e-07, + "loss": 1.4418, + "step": 37210 + }, + { + "epoch": 2.93, + "learning_rate": 4.270517501683168e-07, + "loss": 1.3994, + "step": 37211 + }, + { + "epoch": 2.93, + "learning_rate": 4.261202732168789e-07, + "loss": 1.432, + "step": 37212 + }, + { + "epoch": 2.93, + "learning_rate": 4.251898117895558e-07, + "loss": 1.4217, + "step": 37213 + }, + { + "epoch": 2.93, + "learning_rate": 4.242603658926591e-07, + "loss": 1.4339, + "step": 37214 + }, + { + "epoch": 2.93, + "learning_rate": 4.2333193553248377e-07, + "loss": 1.3771, + "step": 37215 + }, + { + "epoch": 2.93, + "learning_rate": 4.2240452071534146e-07, + "loss": 1.4398, + "step": 37216 + }, + { + "epoch": 2.93, + "learning_rate": 4.214781214475271e-07, + "loss": 1.3488, + "step": 37217 + }, + { + "epoch": 2.93, + "learning_rate": 4.205527377353357e-07, + "loss": 1.4545, + "step": 37218 + }, + { + "epoch": 2.93, + "learning_rate": 4.196283695850455e-07, + "loss": 1.3792, + "step": 37219 + }, + { + "epoch": 2.93, + "learning_rate": 4.187050170029349e-07, + "loss": 1.4696, + "step": 37220 + }, + { + "epoch": 2.93, + "learning_rate": 4.177826799952655e-07, + "loss": 1.4637, + "step": 37221 + }, + { + "epoch": 2.93, + "learning_rate": 4.168613585683156e-07, + "loss": 1.4415, + "step": 37222 + }, + { + "epoch": 2.93, + "learning_rate": 4.1594105272833024e-07, + "loss": 1.4392, + "step": 37223 + }, + { + "epoch": 2.93, + "learning_rate": 4.1502176248153776e-07, + "loss": 1.4373, + "step": 37224 + }, + { + "epoch": 2.93, + "learning_rate": 4.141034878342164e-07, + "loss": 1.397, + "step": 37225 + }, + { + "epoch": 2.93, + "learning_rate": 4.1318622879257803e-07, + "loss": 1.4312, + "step": 37226 + }, + { + "epoch": 2.93, + "learning_rate": 4.122699853628675e-07, + "loss": 1.442, + "step": 37227 + }, + { + "epoch": 2.93, + "learning_rate": 4.113547575512799e-07, + "loss": 1.4736, + "step": 37228 + }, + { + "epoch": 2.93, + "learning_rate": 4.1044054536406025e-07, + "loss": 1.4194, + "step": 37229 + }, + { + "epoch": 2.93, + "learning_rate": 4.0952734880738694e-07, + "loss": 1.4727, + "step": 37230 + }, + { + "epoch": 2.93, + "learning_rate": 4.0861516788747163e-07, + "loss": 1.4687, + "step": 37231 + }, + { + "epoch": 2.93, + "learning_rate": 4.077040026105094e-07, + "loss": 1.4144, + "step": 37232 + }, + { + "epoch": 2.93, + "learning_rate": 4.0679385298267866e-07, + "loss": 1.4423, + "step": 37233 + }, + { + "epoch": 2.93, + "learning_rate": 4.058847190101744e-07, + "loss": 1.4576, + "step": 37234 + }, + { + "epoch": 2.93, + "learning_rate": 4.0497660069917505e-07, + "loss": 1.4478, + "step": 37235 + }, + { + "epoch": 2.93, + "learning_rate": 4.04069498055809e-07, + "loss": 1.4251, + "step": 37236 + }, + { + "epoch": 2.93, + "learning_rate": 4.031634110862547e-07, + "loss": 1.4677, + "step": 37237 + }, + { + "epoch": 2.93, + "learning_rate": 4.022583397966739e-07, + "loss": 1.4543, + "step": 37238 + }, + { + "epoch": 2.93, + "learning_rate": 4.013542841932116e-07, + "loss": 1.4707, + "step": 37239 + }, + { + "epoch": 2.93, + "learning_rate": 4.004512442819796e-07, + "loss": 1.4627, + "step": 37240 + }, + { + "epoch": 2.93, + "learning_rate": 3.995492200691397e-07, + "loss": 1.4609, + "step": 37241 + }, + { + "epoch": 2.93, + "learning_rate": 3.9864821156082026e-07, + "loss": 1.428, + "step": 37242 + }, + { + "epoch": 2.93, + "learning_rate": 3.9774821876309984e-07, + "loss": 1.4563, + "step": 37243 + }, + { + "epoch": 2.93, + "learning_rate": 3.968492416821234e-07, + "loss": 1.4583, + "step": 37244 + }, + { + "epoch": 2.93, + "learning_rate": 3.959512803239695e-07, + "loss": 1.4215, + "step": 37245 + }, + { + "epoch": 2.93, + "learning_rate": 3.950543346947499e-07, + "loss": 1.4582, + "step": 37246 + }, + { + "epoch": 2.93, + "learning_rate": 3.941584048005597e-07, + "loss": 1.4176, + "step": 37247 + }, + { + "epoch": 2.93, + "learning_rate": 3.932634906474774e-07, + "loss": 1.4238, + "step": 37248 + }, + { + "epoch": 2.93, + "learning_rate": 3.923695922415815e-07, + "loss": 1.3941, + "step": 37249 + }, + { + "epoch": 2.93, + "learning_rate": 3.9147670958891706e-07, + "loss": 1.4525, + "step": 37250 + }, + { + "epoch": 2.93, + "learning_rate": 3.905848426955793e-07, + "loss": 1.3849, + "step": 37251 + }, + { + "epoch": 2.93, + "learning_rate": 3.8969399156761336e-07, + "loss": 1.4508, + "step": 37252 + }, + { + "epoch": 2.93, + "learning_rate": 3.8880415621104776e-07, + "loss": 1.4119, + "step": 37253 + }, + { + "epoch": 2.93, + "learning_rate": 3.879153366319443e-07, + "loss": 1.4133, + "step": 37254 + }, + { + "epoch": 2.93, + "learning_rate": 3.8702753283633147e-07, + "loss": 1.4335, + "step": 37255 + }, + { + "epoch": 2.93, + "learning_rate": 3.861407448302545e-07, + "loss": 1.5, + "step": 37256 + }, + { + "epoch": 2.93, + "learning_rate": 3.8525497261969187e-07, + "loss": 1.4712, + "step": 37257 + }, + { + "epoch": 2.93, + "learning_rate": 3.843702162107054e-07, + "loss": 1.4124, + "step": 37258 + }, + { + "epoch": 2.93, + "learning_rate": 3.834864756092737e-07, + "loss": 1.4538, + "step": 37259 + }, + { + "epoch": 2.93, + "learning_rate": 3.8260375082139193e-07, + "loss": 1.5048, + "step": 37260 + }, + { + "epoch": 2.93, + "learning_rate": 3.8172204185308865e-07, + "loss": 1.3976, + "step": 37261 + }, + { + "epoch": 2.93, + "learning_rate": 3.80841348710309e-07, + "loss": 1.4549, + "step": 37262 + }, + { + "epoch": 2.93, + "learning_rate": 3.7996167139904833e-07, + "loss": 1.4656, + "step": 37263 + }, + { + "epoch": 2.93, + "learning_rate": 3.7908300992530174e-07, + "loss": 1.4238, + "step": 37264 + }, + { + "epoch": 2.93, + "learning_rate": 3.782053642949978e-07, + "loss": 1.4509, + "step": 37265 + }, + { + "epoch": 2.93, + "learning_rate": 3.773287345140985e-07, + "loss": 1.4515, + "step": 37266 + }, + { + "epoch": 2.93, + "learning_rate": 3.7645312058858234e-07, + "loss": 1.4263, + "step": 37267 + }, + { + "epoch": 2.93, + "learning_rate": 3.7557852252439457e-07, + "loss": 1.4285, + "step": 37268 + }, + { + "epoch": 2.93, + "learning_rate": 3.747049403274471e-07, + "loss": 1.4508, + "step": 37269 + }, + { + "epoch": 2.93, + "learning_rate": 3.738323740036686e-07, + "loss": 1.4589, + "step": 37270 + }, + { + "epoch": 2.93, + "learning_rate": 3.7296082355900426e-07, + "loss": 1.4899, + "step": 37271 + }, + { + "epoch": 2.93, + "learning_rate": 3.7209028899938265e-07, + "loss": 1.4417, + "step": 37272 + }, + { + "epoch": 2.93, + "learning_rate": 3.712207703306824e-07, + "loss": 1.3617, + "step": 37273 + }, + { + "epoch": 2.93, + "learning_rate": 3.7035226755881553e-07, + "loss": 1.451, + "step": 37274 + }, + { + "epoch": 2.93, + "learning_rate": 3.694847806896939e-07, + "loss": 1.4395, + "step": 37275 + }, + { + "epoch": 2.93, + "learning_rate": 3.6861830972919614e-07, + "loss": 1.4541, + "step": 37276 + }, + { + "epoch": 2.93, + "learning_rate": 3.677528546832176e-07, + "loss": 1.428, + "step": 37277 + }, + { + "epoch": 2.93, + "learning_rate": 3.6688841555760353e-07, + "loss": 1.4204, + "step": 37278 + }, + { + "epoch": 2.93, + "learning_rate": 3.6602499235824924e-07, + "loss": 1.3997, + "step": 37279 + }, + { + "epoch": 2.93, + "learning_rate": 3.651625850910167e-07, + "loss": 1.4565, + "step": 37280 + }, + { + "epoch": 2.93, + "learning_rate": 3.643011937617513e-07, + "loss": 1.3966, + "step": 37281 + }, + { + "epoch": 2.93, + "learning_rate": 3.6344081837629823e-07, + "loss": 1.424, + "step": 37282 + }, + { + "epoch": 2.93, + "learning_rate": 3.625814589405196e-07, + "loss": 1.39, + "step": 37283 + }, + { + "epoch": 2.93, + "learning_rate": 3.6172311546022737e-07, + "loss": 1.473, + "step": 37284 + }, + { + "epoch": 2.93, + "learning_rate": 3.6086578794126684e-07, + "loss": 1.4305, + "step": 37285 + }, + { + "epoch": 2.93, + "learning_rate": 3.6000947638943347e-07, + "loss": 1.4625, + "step": 37286 + }, + { + "epoch": 2.93, + "learning_rate": 3.591541808105558e-07, + "loss": 1.4044, + "step": 37287 + }, + { + "epoch": 2.93, + "learning_rate": 3.582999012104626e-07, + "loss": 1.4579, + "step": 37288 + }, + { + "epoch": 2.93, + "learning_rate": 3.5744663759491586e-07, + "loss": 1.4914, + "step": 37289 + }, + { + "epoch": 2.93, + "learning_rate": 3.5659438996974434e-07, + "loss": 1.4681, + "step": 37290 + }, + { + "epoch": 2.93, + "learning_rate": 3.5574315834071e-07, + "loss": 1.4817, + "step": 37291 + }, + { + "epoch": 2.93, + "learning_rate": 3.548929427135916e-07, + "loss": 1.4407, + "step": 37292 + }, + { + "epoch": 2.93, + "learning_rate": 3.540437430941678e-07, + "loss": 1.441, + "step": 37293 + }, + { + "epoch": 2.93, + "learning_rate": 3.5319555948821745e-07, + "loss": 1.4626, + "step": 37294 + }, + { + "epoch": 2.93, + "learning_rate": 3.5234839190148577e-07, + "loss": 1.398, + "step": 37295 + }, + { + "epoch": 2.93, + "learning_rate": 3.515022403397183e-07, + "loss": 1.4629, + "step": 37296 + }, + { + "epoch": 2.93, + "learning_rate": 3.5065710480867704e-07, + "loss": 1.4695, + "step": 37297 + }, + { + "epoch": 2.93, + "learning_rate": 3.498129853140741e-07, + "loss": 1.4604, + "step": 37298 + }, + { + "epoch": 2.93, + "learning_rate": 3.489698818616715e-07, + "loss": 1.4729, + "step": 37299 + }, + { + "epoch": 2.93, + "learning_rate": 3.481277944571814e-07, + "loss": 1.4923, + "step": 37300 + }, + { + "epoch": 2.93, + "learning_rate": 3.472867231063159e-07, + "loss": 1.4314, + "step": 37301 + }, + { + "epoch": 2.93, + "learning_rate": 3.4644666781478705e-07, + "loss": 1.4817, + "step": 37302 + }, + { + "epoch": 2.94, + "learning_rate": 3.456076285882903e-07, + "loss": 1.4097, + "step": 37303 + }, + { + "epoch": 2.94, + "learning_rate": 3.447696054325377e-07, + "loss": 1.4018, + "step": 37304 + }, + { + "epoch": 2.94, + "learning_rate": 3.4393259835322485e-07, + "loss": 1.427, + "step": 37305 + }, + { + "epoch": 2.94, + "learning_rate": 3.4309660735601374e-07, + "loss": 1.4767, + "step": 37306 + }, + { + "epoch": 2.94, + "learning_rate": 3.4226163244658323e-07, + "loss": 1.4864, + "step": 37307 + }, + { + "epoch": 2.94, + "learning_rate": 3.414276736306121e-07, + "loss": 1.4556, + "step": 37308 + }, + { + "epoch": 2.94, + "learning_rate": 3.4059473091376243e-07, + "loss": 1.4413, + "step": 37309 + }, + { + "epoch": 2.94, + "learning_rate": 3.397628043016798e-07, + "loss": 1.3895, + "step": 37310 + }, + { + "epoch": 2.94, + "learning_rate": 3.389318938000263e-07, + "loss": 1.463, + "step": 37311 + }, + { + "epoch": 2.94, + "learning_rate": 3.381019994144307e-07, + "loss": 1.4357, + "step": 37312 + }, + { + "epoch": 2.94, + "learning_rate": 3.37273121150522e-07, + "loss": 1.3704, + "step": 37313 + }, + { + "epoch": 2.94, + "learning_rate": 3.364452590139455e-07, + "loss": 1.4502, + "step": 37314 + }, + { + "epoch": 2.94, + "learning_rate": 3.356184130103301e-07, + "loss": 1.5115, + "step": 37315 + }, + { + "epoch": 2.94, + "learning_rate": 3.347925831452547e-07, + "loss": 1.4662, + "step": 37316 + }, + { + "epoch": 2.94, + "learning_rate": 3.3396776942434813e-07, + "loss": 1.4141, + "step": 37317 + }, + { + "epoch": 2.94, + "learning_rate": 3.331439718532225e-07, + "loss": 1.5025, + "step": 37318 + }, + { + "epoch": 2.94, + "learning_rate": 3.323211904374401e-07, + "loss": 1.4572, + "step": 37319 + }, + { + "epoch": 2.94, + "learning_rate": 3.3149942518261305e-07, + "loss": 1.4081, + "step": 37320 + }, + { + "epoch": 2.94, + "learning_rate": 3.3067867609430363e-07, + "loss": 1.4517, + "step": 37321 + }, + { + "epoch": 2.94, + "learning_rate": 3.298589431780907e-07, + "loss": 1.5046, + "step": 37322 + }, + { + "epoch": 2.94, + "learning_rate": 3.290402264395531e-07, + "loss": 1.4393, + "step": 37323 + }, + { + "epoch": 2.94, + "learning_rate": 3.282225258842197e-07, + "loss": 1.4451, + "step": 37324 + }, + { + "epoch": 2.94, + "learning_rate": 3.2740584151766947e-07, + "loss": 1.4396, + "step": 37325 + }, + { + "epoch": 2.94, + "learning_rate": 3.265901733454479e-07, + "loss": 1.4464, + "step": 37326 + }, + { + "epoch": 2.94, + "learning_rate": 3.257755213730673e-07, + "loss": 1.4093, + "step": 37327 + }, + { + "epoch": 2.94, + "learning_rate": 3.2496188560607317e-07, + "loss": 1.4501, + "step": 37328 + }, + { + "epoch": 2.94, + "learning_rate": 3.2414926604999446e-07, + "loss": 1.488, + "step": 37329 + }, + { + "epoch": 2.94, + "learning_rate": 3.2333766271034345e-07, + "loss": 1.4263, + "step": 37330 + }, + { + "epoch": 2.94, + "learning_rate": 3.2252707559263237e-07, + "loss": 1.4527, + "step": 37331 + }, + { + "epoch": 2.94, + "learning_rate": 3.2171750470237343e-07, + "loss": 1.492, + "step": 37332 + }, + { + "epoch": 2.94, + "learning_rate": 3.2090895004504567e-07, + "loss": 1.4574, + "step": 37333 + }, + { + "epoch": 2.94, + "learning_rate": 3.2010141162614465e-07, + "loss": 1.4508, + "step": 37334 + }, + { + "epoch": 2.94, + "learning_rate": 3.1929488945114933e-07, + "loss": 1.4543, + "step": 37335 + }, + { + "epoch": 2.94, + "learning_rate": 3.1848938352553865e-07, + "loss": 1.4397, + "step": 37336 + }, + { + "epoch": 2.94, + "learning_rate": 3.1768489385479154e-07, + "loss": 1.428, + "step": 37337 + }, + { + "epoch": 2.94, + "learning_rate": 3.1688142044437035e-07, + "loss": 1.4226, + "step": 37338 + }, + { + "epoch": 2.94, + "learning_rate": 3.160789632997207e-07, + "loss": 1.4188, + "step": 37339 + }, + { + "epoch": 2.94, + "learning_rate": 3.1527752242628824e-07, + "loss": 1.4026, + "step": 37340 + }, + { + "epoch": 2.94, + "learning_rate": 3.144770978295019e-07, + "loss": 1.4878, + "step": 37341 + }, + { + "epoch": 2.94, + "learning_rate": 3.1367768951484073e-07, + "loss": 1.4021, + "step": 37342 + }, + { + "epoch": 2.94, + "learning_rate": 3.128792974876837e-07, + "loss": 1.4217, + "step": 37343 + }, + { + "epoch": 2.94, + "learning_rate": 3.1208192175347647e-07, + "loss": 1.4511, + "step": 37344 + }, + { + "epoch": 2.94, + "learning_rate": 3.1128556231763134e-07, + "loss": 1.4397, + "step": 37345 + }, + { + "epoch": 2.94, + "learning_rate": 3.104902191855607e-07, + "loss": 1.4243, + "step": 37346 + }, + { + "epoch": 2.94, + "learning_rate": 3.096958923626436e-07, + "loss": 1.4893, + "step": 37347 + }, + { + "epoch": 2.94, + "learning_rate": 3.089025818542923e-07, + "loss": 1.4416, + "step": 37348 + }, + { + "epoch": 2.94, + "learning_rate": 3.0811028766588585e-07, + "loss": 1.4512, + "step": 37349 + }, + { + "epoch": 2.94, + "learning_rate": 3.073190098027867e-07, + "loss": 1.4862, + "step": 37350 + }, + { + "epoch": 2.94, + "learning_rate": 3.0652874827040705e-07, + "loss": 1.4501, + "step": 37351 + }, + { + "epoch": 2.94, + "learning_rate": 3.0573950307407614e-07, + "loss": 1.4205, + "step": 37352 + }, + { + "epoch": 2.94, + "learning_rate": 3.0495127421917285e-07, + "loss": 1.5091, + "step": 37353 + }, + { + "epoch": 2.94, + "learning_rate": 3.0416406171104303e-07, + "loss": 1.4897, + "step": 37354 + }, + { + "epoch": 2.94, + "learning_rate": 3.033778655550323e-07, + "loss": 1.4575, + "step": 37355 + }, + { + "epoch": 2.94, + "learning_rate": 3.025926857564698e-07, + "loss": 1.5006, + "step": 37356 + }, + { + "epoch": 2.94, + "learning_rate": 3.018085223206845e-07, + "loss": 1.3943, + "step": 37357 + }, + { + "epoch": 2.94, + "learning_rate": 3.010253752530223e-07, + "loss": 1.4588, + "step": 37358 + }, + { + "epoch": 2.94, + "learning_rate": 3.002432445587788e-07, + "loss": 1.4743, + "step": 37359 + }, + { + "epoch": 2.94, + "learning_rate": 2.994621302432831e-07, + "loss": 1.47, + "step": 37360 + }, + { + "epoch": 2.94, + "learning_rate": 2.986820323118311e-07, + "loss": 1.4332, + "step": 37361 + }, + { + "epoch": 2.94, + "learning_rate": 2.9790295076970175e-07, + "loss": 1.4056, + "step": 37362 + }, + { + "epoch": 2.94, + "learning_rate": 2.9712488562220747e-07, + "loss": 1.4811, + "step": 37363 + }, + { + "epoch": 2.94, + "learning_rate": 2.963478368746108e-07, + "loss": 1.4382, + "step": 37364 + }, + { + "epoch": 2.94, + "learning_rate": 2.955718045322075e-07, + "loss": 1.4338, + "step": 37365 + }, + { + "epoch": 2.94, + "learning_rate": 2.9479678860026e-07, + "loss": 1.4269, + "step": 37366 + }, + { + "epoch": 2.94, + "learning_rate": 2.9402278908403074e-07, + "loss": 1.4388, + "step": 37367 + }, + { + "epoch": 2.94, + "learning_rate": 2.932498059887656e-07, + "loss": 1.3933, + "step": 37368 + }, + { + "epoch": 2.94, + "learning_rate": 2.924778393197269e-07, + "loss": 1.4438, + "step": 37369 + }, + { + "epoch": 2.94, + "learning_rate": 2.917068890821439e-07, + "loss": 1.4701, + "step": 37370 + }, + { + "epoch": 2.94, + "learning_rate": 2.909369552812457e-07, + "loss": 1.4494, + "step": 37371 + }, + { + "epoch": 2.94, + "learning_rate": 2.9016803792227815e-07, + "loss": 1.4151, + "step": 37372 + }, + { + "epoch": 2.94, + "learning_rate": 2.894001370104537e-07, + "loss": 1.477, + "step": 37373 + }, + { + "epoch": 2.94, + "learning_rate": 2.8863325255098493e-07, + "loss": 1.4342, + "step": 37374 + }, + { + "epoch": 2.94, + "learning_rate": 2.8786738454906754e-07, + "loss": 1.4373, + "step": 37375 + }, + { + "epoch": 2.94, + "learning_rate": 2.871025330099308e-07, + "loss": 1.3971, + "step": 37376 + }, + { + "epoch": 2.94, + "learning_rate": 2.8633869793873723e-07, + "loss": 1.3755, + "step": 37377 + }, + { + "epoch": 2.94, + "learning_rate": 2.8557587934069923e-07, + "loss": 1.4173, + "step": 37378 + }, + { + "epoch": 2.94, + "learning_rate": 2.848140772209628e-07, + "loss": 1.4574, + "step": 37379 + }, + { + "epoch": 2.94, + "learning_rate": 2.8405329158474044e-07, + "loss": 1.4627, + "step": 37380 + }, + { + "epoch": 2.94, + "learning_rate": 2.8329352243714466e-07, + "loss": 1.431, + "step": 37381 + }, + { + "epoch": 2.94, + "learning_rate": 2.8253476978338797e-07, + "loss": 1.4331, + "step": 37382 + }, + { + "epoch": 2.94, + "learning_rate": 2.817770336285996e-07, + "loss": 1.4476, + "step": 37383 + }, + { + "epoch": 2.94, + "learning_rate": 2.8102031397792546e-07, + "loss": 1.471, + "step": 37384 + }, + { + "epoch": 2.94, + "learning_rate": 2.802646108364948e-07, + "loss": 1.4476, + "step": 37385 + }, + { + "epoch": 2.94, + "learning_rate": 2.7950992420943677e-07, + "loss": 1.4332, + "step": 37386 + }, + { + "epoch": 2.94, + "learning_rate": 2.787562541018973e-07, + "loss": 1.4458, + "step": 37387 + }, + { + "epoch": 2.94, + "learning_rate": 2.780036005189723e-07, + "loss": 1.4457, + "step": 37388 + }, + { + "epoch": 2.94, + "learning_rate": 2.7725196346579104e-07, + "loss": 1.4549, + "step": 37389 + }, + { + "epoch": 2.94, + "learning_rate": 2.7650134294743273e-07, + "loss": 1.4257, + "step": 37390 + }, + { + "epoch": 2.94, + "learning_rate": 2.7575173896901005e-07, + "loss": 1.4164, + "step": 37391 + }, + { + "epoch": 2.94, + "learning_rate": 2.750031515356188e-07, + "loss": 1.4965, + "step": 37392 + }, + { + "epoch": 2.94, + "learning_rate": 2.7425558065232165e-07, + "loss": 1.4255, + "step": 37393 + }, + { + "epoch": 2.94, + "learning_rate": 2.735090263241979e-07, + "loss": 1.4932, + "step": 37394 + }, + { + "epoch": 2.94, + "learning_rate": 2.727634885563268e-07, + "loss": 1.4696, + "step": 37395 + }, + { + "epoch": 2.94, + "learning_rate": 2.720189673537709e-07, + "loss": 1.5018, + "step": 37396 + }, + { + "epoch": 2.94, + "learning_rate": 2.7127546272155966e-07, + "loss": 1.4669, + "step": 37397 + }, + { + "epoch": 2.94, + "learning_rate": 2.7053297466478885e-07, + "loss": 1.424, + "step": 37398 + }, + { + "epoch": 2.94, + "learning_rate": 2.6979150318845454e-07, + "loss": 1.465, + "step": 37399 + }, + { + "epoch": 2.94, + "learning_rate": 2.6905104829760273e-07, + "loss": 1.4629, + "step": 37400 + }, + { + "epoch": 2.94, + "learning_rate": 2.683116099972793e-07, + "loss": 1.4684, + "step": 37401 + }, + { + "epoch": 2.94, + "learning_rate": 2.675731882924803e-07, + "loss": 1.4786, + "step": 37402 + }, + { + "epoch": 2.94, + "learning_rate": 2.668357831882517e-07, + "loss": 1.4695, + "step": 37403 + }, + { + "epoch": 2.94, + "learning_rate": 2.660993946895562e-07, + "loss": 1.4507, + "step": 37404 + }, + { + "epoch": 2.94, + "learning_rate": 2.653640228014231e-07, + "loss": 1.4401, + "step": 37405 + }, + { + "epoch": 2.94, + "learning_rate": 2.6462966752883175e-07, + "loss": 1.4791, + "step": 37406 + }, + { + "epoch": 2.94, + "learning_rate": 2.6389632887679477e-07, + "loss": 1.4587, + "step": 37407 + }, + { + "epoch": 2.94, + "learning_rate": 2.631640068502583e-07, + "loss": 1.4485, + "step": 37408 + }, + { + "epoch": 2.94, + "learning_rate": 2.6243270145420157e-07, + "loss": 1.4915, + "step": 37409 + }, + { + "epoch": 2.94, + "learning_rate": 2.617024126935874e-07, + "loss": 1.4473, + "step": 37410 + }, + { + "epoch": 2.94, + "learning_rate": 2.6097314057339503e-07, + "loss": 1.4122, + "step": 37411 + }, + { + "epoch": 2.94, + "learning_rate": 2.602448850985539e-07, + "loss": 1.4401, + "step": 37412 + }, + { + "epoch": 2.94, + "learning_rate": 2.595176462740267e-07, + "loss": 1.4694, + "step": 37413 + }, + { + "epoch": 2.94, + "learning_rate": 2.5879142410474286e-07, + "loss": 1.4639, + "step": 37414 + }, + { + "epoch": 2.94, + "learning_rate": 2.5806621859561507e-07, + "loss": 1.4459, + "step": 37415 + }, + { + "epoch": 2.94, + "learning_rate": 2.5734202975158933e-07, + "loss": 1.4815, + "step": 37416 + }, + { + "epoch": 2.94, + "learning_rate": 2.566188575775785e-07, + "loss": 1.4006, + "step": 37417 + }, + { + "epoch": 2.94, + "learning_rate": 2.5589670207849524e-07, + "loss": 1.4035, + "step": 37418 + }, + { + "epoch": 2.94, + "learning_rate": 2.551755632592356e-07, + "loss": 1.4545, + "step": 37419 + }, + { + "epoch": 2.94, + "learning_rate": 2.5445544112469574e-07, + "loss": 1.4076, + "step": 37420 + }, + { + "epoch": 2.94, + "learning_rate": 2.537363356797717e-07, + "loss": 1.4655, + "step": 37421 + }, + { + "epoch": 2.94, + "learning_rate": 2.530182469293429e-07, + "loss": 1.4563, + "step": 37422 + }, + { + "epoch": 2.94, + "learning_rate": 2.523011748782722e-07, + "loss": 1.4806, + "step": 37423 + }, + { + "epoch": 2.94, + "learning_rate": 2.515851195314389e-07, + "loss": 1.4214, + "step": 37424 + }, + { + "epoch": 2.94, + "learning_rate": 2.508700808937059e-07, + "loss": 1.4459, + "step": 37425 + }, + { + "epoch": 2.94, + "learning_rate": 2.5015605896993585e-07, + "loss": 1.4751, + "step": 37426 + }, + { + "epoch": 2.94, + "learning_rate": 2.494430537649583e-07, + "loss": 1.4391, + "step": 37427 + }, + { + "epoch": 2.94, + "learning_rate": 2.4873106528363605e-07, + "loss": 1.4506, + "step": 37428 + }, + { + "epoch": 2.94, + "learning_rate": 2.480200935307819e-07, + "loss": 1.4823, + "step": 37429 + }, + { + "epoch": 2.95, + "learning_rate": 2.473101385112253e-07, + "loss": 1.4716, + "step": 37430 + }, + { + "epoch": 2.95, + "learning_rate": 2.466012002297957e-07, + "loss": 1.4997, + "step": 37431 + }, + { + "epoch": 2.95, + "learning_rate": 2.458932786913059e-07, + "loss": 1.4547, + "step": 37432 + }, + { + "epoch": 2.95, + "learning_rate": 2.4518637390055215e-07, + "loss": 1.4593, + "step": 37433 + }, + { + "epoch": 2.95, + "learning_rate": 2.4448048586234724e-07, + "loss": 1.5219, + "step": 37434 + }, + { + "epoch": 2.95, + "learning_rate": 2.437756145814873e-07, + "loss": 1.4553, + "step": 37435 + }, + { + "epoch": 2.95, + "learning_rate": 2.4307176006273523e-07, + "loss": 1.4523, + "step": 37436 + }, + { + "epoch": 2.95, + "learning_rate": 2.423689223108871e-07, + "loss": 1.4483, + "step": 37437 + }, + { + "epoch": 2.95, + "learning_rate": 2.416671013307059e-07, + "loss": 1.4249, + "step": 37438 + }, + { + "epoch": 2.95, + "learning_rate": 2.40966297126971e-07, + "loss": 1.3747, + "step": 37439 + }, + { + "epoch": 2.95, + "learning_rate": 2.402665097044287e-07, + "loss": 1.4535, + "step": 37440 + }, + { + "epoch": 2.95, + "learning_rate": 2.3956773906784186e-07, + "loss": 1.3786, + "step": 37441 + }, + { + "epoch": 2.95, + "learning_rate": 2.3886998522192334e-07, + "loss": 1.4038, + "step": 37442 + }, + { + "epoch": 2.95, + "learning_rate": 2.3817324817145267e-07, + "loss": 1.4606, + "step": 37443 + }, + { + "epoch": 2.95, + "learning_rate": 2.3747752792112608e-07, + "loss": 1.4485, + "step": 37444 + }, + { + "epoch": 2.95, + "learning_rate": 2.3678282447568974e-07, + "loss": 1.4851, + "step": 37445 + }, + { + "epoch": 2.95, + "learning_rate": 2.3608913783983995e-07, + "loss": 1.4343, + "step": 37446 + }, + { + "epoch": 2.95, + "learning_rate": 2.3539646801830624e-07, + "loss": 1.4261, + "step": 37447 + }, + { + "epoch": 2.95, + "learning_rate": 2.3470481501578486e-07, + "loss": 1.4645, + "step": 37448 + }, + { + "epoch": 2.95, + "learning_rate": 2.3401417883697205e-07, + "loss": 1.4435, + "step": 37449 + }, + { + "epoch": 2.95, + "learning_rate": 2.3332455948656404e-07, + "loss": 1.4413, + "step": 37450 + }, + { + "epoch": 2.95, + "learning_rate": 2.3263595696922377e-07, + "loss": 1.3938, + "step": 37451 + }, + { + "epoch": 2.95, + "learning_rate": 2.3194837128963085e-07, + "loss": 1.4195, + "step": 37452 + }, + { + "epoch": 2.95, + "learning_rate": 2.3126180245246485e-07, + "loss": 1.4114, + "step": 37453 + }, + { + "epoch": 2.95, + "learning_rate": 2.305762504623887e-07, + "loss": 1.4453, + "step": 37454 + }, + { + "epoch": 2.95, + "learning_rate": 2.2989171532403206e-07, + "loss": 1.4995, + "step": 37455 + }, + { + "epoch": 2.95, + "learning_rate": 2.292081970420745e-07, + "loss": 1.405, + "step": 37456 + }, + { + "epoch": 2.95, + "learning_rate": 2.2852569562114564e-07, + "loss": 1.456, + "step": 37457 + }, + { + "epoch": 2.95, + "learning_rate": 2.2784421106587514e-07, + "loss": 1.4058, + "step": 37458 + }, + { + "epoch": 2.95, + "learning_rate": 2.2716374338089261e-07, + "loss": 1.4232, + "step": 37459 + }, + { + "epoch": 2.95, + "learning_rate": 2.26484292570811e-07, + "loss": 1.47, + "step": 37460 + }, + { + "epoch": 2.95, + "learning_rate": 2.2580585864024337e-07, + "loss": 1.3986, + "step": 37461 + }, + { + "epoch": 2.95, + "learning_rate": 2.2512844159380262e-07, + "loss": 1.4062, + "step": 37462 + }, + { + "epoch": 2.95, + "learning_rate": 2.2445204143610174e-07, + "loss": 1.4866, + "step": 37463 + }, + { + "epoch": 2.95, + "learning_rate": 2.2377665817170375e-07, + "loss": 1.4386, + "step": 37464 + }, + { + "epoch": 2.95, + "learning_rate": 2.2310229180522166e-07, + "loss": 1.4953, + "step": 37465 + }, + { + "epoch": 2.95, + "learning_rate": 2.2242894234121845e-07, + "loss": 1.4382, + "step": 37466 + }, + { + "epoch": 2.95, + "learning_rate": 2.2175660978425714e-07, + "loss": 1.427, + "step": 37467 + }, + { + "epoch": 2.95, + "learning_rate": 2.2108529413893405e-07, + "loss": 1.4132, + "step": 37468 + }, + { + "epoch": 2.95, + "learning_rate": 2.2041499540976226e-07, + "loss": 1.4598, + "step": 37469 + }, + { + "epoch": 2.95, + "learning_rate": 2.1974571360133808e-07, + "loss": 1.4309, + "step": 37470 + }, + { + "epoch": 2.95, + "learning_rate": 2.1907744871817457e-07, + "loss": 1.5215, + "step": 37471 + }, + { + "epoch": 2.95, + "learning_rate": 2.1841020076481807e-07, + "loss": 1.3913, + "step": 37472 + }, + { + "epoch": 2.95, + "learning_rate": 2.1774396974581499e-07, + "loss": 1.4406, + "step": 37473 + }, + { + "epoch": 2.95, + "learning_rate": 2.170787556656617e-07, + "loss": 1.4476, + "step": 37474 + }, + { + "epoch": 2.95, + "learning_rate": 2.1641455852888788e-07, + "loss": 1.4589, + "step": 37475 + }, + { + "epoch": 2.95, + "learning_rate": 2.1575137833999e-07, + "loss": 1.4342, + "step": 37476 + }, + { + "epoch": 2.95, + "learning_rate": 2.1508921510349775e-07, + "loss": 1.4184, + "step": 37477 + }, + { + "epoch": 2.95, + "learning_rate": 2.1442806882389084e-07, + "loss": 1.4283, + "step": 37478 + }, + { + "epoch": 2.95, + "learning_rate": 2.1376793950564908e-07, + "loss": 1.4632, + "step": 37479 + }, + { + "epoch": 2.95, + "learning_rate": 2.1310882715326883e-07, + "loss": 1.3676, + "step": 37480 + }, + { + "epoch": 2.95, + "learning_rate": 2.1245073177122986e-07, + "loss": 1.4404, + "step": 37481 + }, + { + "epoch": 2.95, + "learning_rate": 2.117936533639786e-07, + "loss": 1.4406, + "step": 37482 + }, + { + "epoch": 2.95, + "learning_rate": 2.1113759193599477e-07, + "loss": 1.4419, + "step": 37483 + }, + { + "epoch": 2.95, + "learning_rate": 2.1048254749172488e-07, + "loss": 1.426, + "step": 37484 + }, + { + "epoch": 2.95, + "learning_rate": 2.0982852003561535e-07, + "loss": 1.4737, + "step": 37485 + }, + { + "epoch": 2.95, + "learning_rate": 2.091755095721126e-07, + "loss": 1.4511, + "step": 37486 + }, + { + "epoch": 2.95, + "learning_rate": 2.0852351610564644e-07, + "loss": 1.4251, + "step": 37487 + }, + { + "epoch": 2.95, + "learning_rate": 2.0787253964064664e-07, + "loss": 1.4394, + "step": 37488 + }, + { + "epoch": 2.95, + "learning_rate": 2.0722258018152637e-07, + "loss": 1.4607, + "step": 37489 + }, + { + "epoch": 2.95, + "learning_rate": 2.0657363773269876e-07, + "loss": 1.4843, + "step": 37490 + }, + { + "epoch": 2.95, + "learning_rate": 2.0592571229857692e-07, + "loss": 1.4151, + "step": 37491 + }, + { + "epoch": 2.95, + "learning_rate": 2.0527880388355732e-07, + "loss": 1.3983, + "step": 37492 + }, + { + "epoch": 2.95, + "learning_rate": 2.0463291249201984e-07, + "loss": 1.4785, + "step": 37493 + }, + { + "epoch": 2.95, + "learning_rate": 2.039880381283776e-07, + "loss": 1.4071, + "step": 37494 + }, + { + "epoch": 2.95, + "learning_rate": 2.0334418079699378e-07, + "loss": 1.4598, + "step": 37495 + }, + { + "epoch": 2.95, + "learning_rate": 2.0270134050223154e-07, + "loss": 1.4949, + "step": 37496 + }, + { + "epoch": 2.95, + "learning_rate": 2.0205951724845405e-07, + "loss": 1.456, + "step": 37497 + }, + { + "epoch": 2.95, + "learning_rate": 2.014187110400245e-07, + "loss": 1.4683, + "step": 37498 + }, + { + "epoch": 2.95, + "learning_rate": 2.0077892188132273e-07, + "loss": 1.4186, + "step": 37499 + }, + { + "epoch": 2.95, + "learning_rate": 2.0014014977664528e-07, + "loss": 1.4957, + "step": 37500 + }, + { + "epoch": 2.95, + "learning_rate": 1.9950239473035533e-07, + "loss": 1.4108, + "step": 37501 + }, + { + "epoch": 2.95, + "learning_rate": 1.9886565674676614e-07, + "loss": 1.4589, + "step": 37502 + }, + { + "epoch": 2.95, + "learning_rate": 1.9822993583022419e-07, + "loss": 1.4582, + "step": 37503 + }, + { + "epoch": 2.95, + "learning_rate": 1.9759523198502603e-07, + "loss": 1.4194, + "step": 37504 + }, + { + "epoch": 2.95, + "learning_rate": 1.9696154521550157e-07, + "loss": 1.4238, + "step": 37505 + }, + { + "epoch": 2.95, + "learning_rate": 1.9632887552593068e-07, + "loss": 1.4424, + "step": 37506 + }, + { + "epoch": 2.95, + "learning_rate": 1.9569722292060995e-07, + "loss": 1.4343, + "step": 37507 + }, + { + "epoch": 2.95, + "learning_rate": 1.9506658740385262e-07, + "loss": 1.4424, + "step": 37508 + }, + { + "epoch": 2.95, + "learning_rate": 1.9443696897992188e-07, + "loss": 1.4663, + "step": 37509 + }, + { + "epoch": 2.95, + "learning_rate": 1.9380836765308106e-07, + "loss": 1.3837, + "step": 37510 + }, + { + "epoch": 2.95, + "learning_rate": 1.9318078342762667e-07, + "loss": 1.4436, + "step": 37511 + }, + { + "epoch": 2.95, + "learning_rate": 1.9255421630778867e-07, + "loss": 1.4273, + "step": 37512 + }, + { + "epoch": 2.95, + "learning_rate": 1.91928666297847e-07, + "loss": 1.4415, + "step": 37513 + }, + { + "epoch": 2.95, + "learning_rate": 1.913041334020482e-07, + "loss": 1.4213, + "step": 37514 + }, + { + "epoch": 2.95, + "learning_rate": 1.9068061762460561e-07, + "loss": 1.4328, + "step": 37515 + }, + { + "epoch": 2.95, + "learning_rate": 1.9005811896978252e-07, + "loss": 1.4754, + "step": 37516 + }, + { + "epoch": 2.95, + "learning_rate": 1.8943663744179217e-07, + "loss": 1.4916, + "step": 37517 + }, + { + "epoch": 2.95, + "learning_rate": 1.8881617304484786e-07, + "loss": 1.415, + "step": 37518 + }, + { + "epoch": 2.95, + "learning_rate": 1.8819672578316291e-07, + "loss": 1.4325, + "step": 37519 + }, + { + "epoch": 2.95, + "learning_rate": 1.8757829566096728e-07, + "loss": 1.408, + "step": 37520 + }, + { + "epoch": 2.95, + "learning_rate": 1.8696088268242427e-07, + "loss": 1.4897, + "step": 37521 + }, + { + "epoch": 2.95, + "learning_rate": 1.863444868517472e-07, + "loss": 1.5002, + "step": 37522 + }, + { + "epoch": 2.95, + "learning_rate": 1.8572910817311604e-07, + "loss": 1.4895, + "step": 37523 + }, + { + "epoch": 2.95, + "learning_rate": 1.8511474665072746e-07, + "loss": 1.4764, + "step": 37524 + }, + { + "epoch": 2.95, + "learning_rate": 1.8450140228871147e-07, + "loss": 1.4519, + "step": 37525 + }, + { + "epoch": 2.95, + "learning_rate": 1.8388907509126472e-07, + "loss": 1.4576, + "step": 37526 + }, + { + "epoch": 2.95, + "learning_rate": 1.8327776506255055e-07, + "loss": 1.4406, + "step": 37527 + }, + { + "epoch": 2.95, + "learning_rate": 1.826674722066823e-07, + "loss": 1.4291, + "step": 37528 + }, + { + "epoch": 2.95, + "learning_rate": 1.8205819652784004e-07, + "loss": 1.4184, + "step": 37529 + }, + { + "epoch": 2.95, + "learning_rate": 1.8144993803013708e-07, + "loss": 1.4415, + "step": 37530 + }, + { + "epoch": 2.95, + "learning_rate": 1.8084269671772012e-07, + "loss": 1.4293, + "step": 37531 + }, + { + "epoch": 2.95, + "learning_rate": 1.8023647259470254e-07, + "loss": 1.4444, + "step": 37532 + }, + { + "epoch": 2.95, + "learning_rate": 1.796312656651977e-07, + "loss": 1.4376, + "step": 37533 + }, + { + "epoch": 2.95, + "learning_rate": 1.79027075933319e-07, + "loss": 1.4194, + "step": 37534 + }, + { + "epoch": 2.95, + "learning_rate": 1.784239034031798e-07, + "loss": 1.4133, + "step": 37535 + }, + { + "epoch": 2.95, + "learning_rate": 1.7782174807886017e-07, + "loss": 1.4646, + "step": 37536 + }, + { + "epoch": 2.95, + "learning_rate": 1.7722060996444022e-07, + "loss": 1.4582, + "step": 37537 + }, + { + "epoch": 2.95, + "learning_rate": 1.766204890640166e-07, + "loss": 1.4407, + "step": 37538 + }, + { + "epoch": 2.95, + "learning_rate": 1.7602138538166942e-07, + "loss": 1.4699, + "step": 37539 + }, + { + "epoch": 2.95, + "learning_rate": 1.7542329892144547e-07, + "loss": 1.4886, + "step": 37540 + }, + { + "epoch": 2.95, + "learning_rate": 1.7482622968742477e-07, + "loss": 1.4422, + "step": 37541 + }, + { + "epoch": 2.95, + "learning_rate": 1.742301776836541e-07, + "loss": 1.4619, + "step": 37542 + }, + { + "epoch": 2.95, + "learning_rate": 1.7363514291418023e-07, + "loss": 1.4732, + "step": 37543 + }, + { + "epoch": 2.95, + "learning_rate": 1.7304112538303327e-07, + "loss": 1.4602, + "step": 37544 + }, + { + "epoch": 2.95, + "learning_rate": 1.7244812509425998e-07, + "loss": 1.3959, + "step": 37545 + }, + { + "epoch": 2.95, + "learning_rate": 1.7185614205189047e-07, + "loss": 1.4714, + "step": 37546 + }, + { + "epoch": 2.95, + "learning_rate": 1.7126517625993818e-07, + "loss": 1.451, + "step": 37547 + }, + { + "epoch": 2.95, + "learning_rate": 1.7067522772239995e-07, + "loss": 1.44, + "step": 37548 + }, + { + "epoch": 2.95, + "learning_rate": 1.7008629644330586e-07, + "loss": 1.4227, + "step": 37549 + }, + { + "epoch": 2.95, + "learning_rate": 1.6949838242663605e-07, + "loss": 1.3973, + "step": 37550 + }, + { + "epoch": 2.95, + "learning_rate": 1.6891148567638734e-07, + "loss": 1.4607, + "step": 37551 + }, + { + "epoch": 2.95, + "learning_rate": 1.683256061965399e-07, + "loss": 1.4232, + "step": 37552 + }, + { + "epoch": 2.95, + "learning_rate": 1.677407439910905e-07, + "loss": 1.4922, + "step": 37553 + }, + { + "epoch": 2.95, + "learning_rate": 1.6715689906400265e-07, + "loss": 1.4511, + "step": 37554 + }, + { + "epoch": 2.95, + "learning_rate": 1.665740714192232e-07, + "loss": 1.5123, + "step": 37555 + }, + { + "epoch": 2.95, + "learning_rate": 1.659922610607156e-07, + "loss": 1.4787, + "step": 37556 + }, + { + "epoch": 2.96, + "learning_rate": 1.6541146799244344e-07, + "loss": 1.4527, + "step": 37557 + }, + { + "epoch": 2.96, + "learning_rate": 1.648316922183368e-07, + "loss": 1.4966, + "step": 37558 + }, + { + "epoch": 2.96, + "learning_rate": 1.6425293374234262e-07, + "loss": 1.4293, + "step": 37559 + }, + { + "epoch": 2.96, + "learning_rate": 1.63675192568391e-07, + "loss": 1.4052, + "step": 37560 + }, + { + "epoch": 2.96, + "learning_rate": 1.6309846870039556e-07, + "loss": 1.4002, + "step": 37561 + }, + { + "epoch": 2.96, + "learning_rate": 1.6252276214225314e-07, + "loss": 1.4343, + "step": 37562 + }, + { + "epoch": 2.96, + "learning_rate": 1.6194807289791058e-07, + "loss": 1.4325, + "step": 37563 + }, + { + "epoch": 2.96, + "learning_rate": 1.6137440097126475e-07, + "loss": 1.5096, + "step": 37564 + }, + { + "epoch": 2.96, + "learning_rate": 1.6080174636617927e-07, + "loss": 1.4295, + "step": 37565 + }, + { + "epoch": 2.96, + "learning_rate": 1.6023010908656764e-07, + "loss": 1.4361, + "step": 37566 + }, + { + "epoch": 2.96, + "learning_rate": 1.5965948913631011e-07, + "loss": 1.4939, + "step": 37567 + }, + { + "epoch": 2.96, + "learning_rate": 1.5908988651927023e-07, + "loss": 1.4627, + "step": 37568 + }, + { + "epoch": 2.96, + "learning_rate": 1.5852130123932826e-07, + "loss": 1.4854, + "step": 37569 + }, + { + "epoch": 2.96, + "learning_rate": 1.5795373330033112e-07, + "loss": 1.4455, + "step": 37570 + }, + { + "epoch": 2.96, + "learning_rate": 1.5738718270614236e-07, + "loss": 1.4477, + "step": 37571 + }, + { + "epoch": 2.96, + "learning_rate": 1.5682164946060894e-07, + "loss": 1.4399, + "step": 37572 + }, + { + "epoch": 2.96, + "learning_rate": 1.562571335675611e-07, + "loss": 1.4528, + "step": 37573 + }, + { + "epoch": 2.96, + "learning_rate": 1.556936350308291e-07, + "loss": 1.4926, + "step": 37574 + }, + { + "epoch": 2.96, + "learning_rate": 1.551311538542599e-07, + "loss": 1.4228, + "step": 37575 + }, + { + "epoch": 2.96, + "learning_rate": 1.5456969004165044e-07, + "loss": 1.4507, + "step": 37576 + }, + { + "epoch": 2.96, + "learning_rate": 1.5400924359681433e-07, + "loss": 1.418, + "step": 37577 + }, + { + "epoch": 2.96, + "learning_rate": 1.5344981452358185e-07, + "loss": 1.4568, + "step": 37578 + }, + { + "epoch": 2.96, + "learning_rate": 1.5289140282571667e-07, + "loss": 1.4132, + "step": 37579 + }, + { + "epoch": 2.96, + "learning_rate": 1.5233400850703236e-07, + "loss": 1.4155, + "step": 37580 + }, + { + "epoch": 2.96, + "learning_rate": 1.5177763157130928e-07, + "loss": 1.4271, + "step": 37581 + }, + { + "epoch": 2.96, + "learning_rate": 1.5122227202231107e-07, + "loss": 1.433, + "step": 37582 + }, + { + "epoch": 2.96, + "learning_rate": 1.5066792986383468e-07, + "loss": 1.4629, + "step": 37583 + }, + { + "epoch": 2.96, + "learning_rate": 1.5011460509962713e-07, + "loss": 1.4384, + "step": 37584 + }, + { + "epoch": 2.96, + "learning_rate": 1.4956229773345207e-07, + "loss": 1.4426, + "step": 37585 + }, + { + "epoch": 2.96, + "learning_rate": 1.4901100776903986e-07, + "loss": 1.4305, + "step": 37586 + }, + { + "epoch": 2.96, + "learning_rate": 1.484607352101541e-07, + "loss": 1.4574, + "step": 37587 + }, + { + "epoch": 2.96, + "learning_rate": 1.4791148006052522e-07, + "loss": 1.4243, + "step": 37588 + }, + { + "epoch": 2.96, + "learning_rate": 1.4736324232388353e-07, + "loss": 1.4479, + "step": 37589 + }, + { + "epoch": 2.96, + "learning_rate": 1.4681602200395936e-07, + "loss": 1.443, + "step": 37590 + }, + { + "epoch": 2.96, + "learning_rate": 1.4626981910444978e-07, + "loss": 1.3833, + "step": 37591 + }, + { + "epoch": 2.96, + "learning_rate": 1.457246336290685e-07, + "loss": 1.453, + "step": 37592 + }, + { + "epoch": 2.96, + "learning_rate": 1.4518046558152917e-07, + "loss": 1.4158, + "step": 37593 + }, + { + "epoch": 2.96, + "learning_rate": 1.4463731496551224e-07, + "loss": 1.4389, + "step": 37594 + }, + { + "epoch": 2.96, + "learning_rate": 1.4409518178471468e-07, + "loss": 1.4421, + "step": 37595 + }, + { + "epoch": 2.96, + "learning_rate": 1.4355406604280027e-07, + "loss": 1.4493, + "step": 37596 + }, + { + "epoch": 2.96, + "learning_rate": 1.4301396774346607e-07, + "loss": 1.428, + "step": 37597 + }, + { + "epoch": 2.96, + "learning_rate": 1.4247488689037578e-07, + "loss": 1.459, + "step": 37598 + }, + { + "epoch": 2.96, + "learning_rate": 1.419368234871765e-07, + "loss": 1.4475, + "step": 37599 + }, + { + "epoch": 2.96, + "learning_rate": 1.4139977753753195e-07, + "loss": 1.3941, + "step": 37600 + }, + { + "epoch": 2.96, + "learning_rate": 1.4086374904507258e-07, + "loss": 1.4412, + "step": 37601 + }, + { + "epoch": 2.96, + "learning_rate": 1.4032873801346212e-07, + "loss": 1.4601, + "step": 37602 + }, + { + "epoch": 2.96, + "learning_rate": 1.3979474444631433e-07, + "loss": 1.4079, + "step": 37603 + }, + { + "epoch": 2.96, + "learning_rate": 1.3926176834725966e-07, + "loss": 1.431, + "step": 37604 + }, + { + "epoch": 2.96, + "learning_rate": 1.3872980971991188e-07, + "loss": 1.5127, + "step": 37605 + }, + { + "epoch": 2.96, + "learning_rate": 1.3819886856790142e-07, + "loss": 1.4549, + "step": 37606 + }, + { + "epoch": 2.96, + "learning_rate": 1.3766894489480872e-07, + "loss": 1.467, + "step": 37607 + }, + { + "epoch": 2.96, + "learning_rate": 1.3714003870424763e-07, + "loss": 1.4347, + "step": 37608 + }, + { + "epoch": 2.96, + "learning_rate": 1.3661214999981518e-07, + "loss": 1.4252, + "step": 37609 + }, + { + "epoch": 2.96, + "learning_rate": 1.3608527878505858e-07, + "loss": 1.4546, + "step": 37610 + }, + { + "epoch": 2.96, + "learning_rate": 1.355594250636083e-07, + "loss": 1.4271, + "step": 37611 + }, + { + "epoch": 2.96, + "learning_rate": 1.3503458883899477e-07, + "loss": 1.4335, + "step": 37612 + }, + { + "epoch": 2.96, + "learning_rate": 1.345107701147985e-07, + "loss": 1.4523, + "step": 37613 + }, + { + "epoch": 2.96, + "learning_rate": 1.3398796889456665e-07, + "loss": 1.4418, + "step": 37614 + }, + { + "epoch": 2.96, + "learning_rate": 1.3346618518184637e-07, + "loss": 1.4183, + "step": 37615 + }, + { + "epoch": 2.96, + "learning_rate": 1.329454189802015e-07, + "loss": 1.4477, + "step": 37616 + }, + { + "epoch": 2.96, + "learning_rate": 1.324256702931459e-07, + "loss": 1.4165, + "step": 37617 + }, + { + "epoch": 2.96, + "learning_rate": 1.3190693912422668e-07, + "loss": 1.4795, + "step": 37618 + }, + { + "epoch": 2.96, + "learning_rate": 1.3138922547694107e-07, + "loss": 1.4461, + "step": 37619 + }, + { + "epoch": 2.96, + "learning_rate": 1.308725293548196e-07, + "loss": 1.4266, + "step": 37620 + }, + { + "epoch": 2.96, + "learning_rate": 1.3035685076137615e-07, + "loss": 1.4203, + "step": 37621 + }, + { + "epoch": 2.96, + "learning_rate": 1.2984218970010783e-07, + "loss": 1.4411, + "step": 37622 + }, + { + "epoch": 2.96, + "learning_rate": 1.2932854617449527e-07, + "loss": 1.4698, + "step": 37623 + }, + { + "epoch": 2.96, + "learning_rate": 1.288159201880523e-07, + "loss": 1.4595, + "step": 37624 + }, + { + "epoch": 2.96, + "learning_rate": 1.2830431174422617e-07, + "loss": 1.4951, + "step": 37625 + }, + { + "epoch": 2.96, + "learning_rate": 1.2779372084651406e-07, + "loss": 1.395, + "step": 37626 + }, + { + "epoch": 2.96, + "learning_rate": 1.2728414749837989e-07, + "loss": 1.4579, + "step": 37627 + }, + { + "epoch": 2.96, + "learning_rate": 1.2677559170327088e-07, + "loss": 1.4509, + "step": 37628 + }, + { + "epoch": 2.96, + "learning_rate": 1.2626805346466762e-07, + "loss": 1.4553, + "step": 37629 + }, + { + "epoch": 2.96, + "learning_rate": 1.25761532785984e-07, + "loss": 1.4513, + "step": 37630 + }, + { + "epoch": 2.96, + "learning_rate": 1.2525602967066729e-07, + "loss": 1.5002, + "step": 37631 + }, + { + "epoch": 2.96, + "learning_rate": 1.247515441221647e-07, + "loss": 1.4626, + "step": 37632 + }, + { + "epoch": 2.96, + "learning_rate": 1.2424807614387355e-07, + "loss": 1.3921, + "step": 37633 + }, + { + "epoch": 2.96, + "learning_rate": 1.2374562573924106e-07, + "loss": 1.4885, + "step": 37634 + }, + { + "epoch": 2.96, + "learning_rate": 1.232441929116812e-07, + "loss": 1.4849, + "step": 37635 + }, + { + "epoch": 2.96, + "learning_rate": 1.227437776645579e-07, + "loss": 1.4307, + "step": 37636 + }, + { + "epoch": 2.96, + "learning_rate": 1.2224438000131843e-07, + "loss": 1.4242, + "step": 37637 + }, + { + "epoch": 2.96, + "learning_rate": 1.217459999253101e-07, + "loss": 1.4335, + "step": 37638 + }, + { + "epoch": 2.96, + "learning_rate": 1.2124863743996348e-07, + "loss": 1.47, + "step": 37639 + }, + { + "epoch": 2.96, + "learning_rate": 1.2075229254860929e-07, + "loss": 1.4474, + "step": 37640 + }, + { + "epoch": 2.96, + "learning_rate": 1.2025696525462813e-07, + "loss": 1.4106, + "step": 37641 + }, + { + "epoch": 2.96, + "learning_rate": 1.1976265556141728e-07, + "loss": 1.4656, + "step": 37642 + }, + { + "epoch": 2.96, + "learning_rate": 1.1926936347229078e-07, + "loss": 1.3565, + "step": 37643 + }, + { + "epoch": 2.96, + "learning_rate": 1.1877708899061256e-07, + "loss": 1.3927, + "step": 37644 + }, + { + "epoch": 2.96, + "learning_rate": 1.1828583211972998e-07, + "loss": 1.5004, + "step": 37645 + }, + { + "epoch": 2.96, + "learning_rate": 1.1779559286297369e-07, + "loss": 1.4453, + "step": 37646 + }, + { + "epoch": 2.96, + "learning_rate": 1.1730637122367436e-07, + "loss": 1.4699, + "step": 37647 + }, + { + "epoch": 2.96, + "learning_rate": 1.1681816720516269e-07, + "loss": 1.5039, + "step": 37648 + }, + { + "epoch": 2.96, + "learning_rate": 1.16330980810736e-07, + "loss": 1.4713, + "step": 37649 + }, + { + "epoch": 2.96, + "learning_rate": 1.1584481204370833e-07, + "loss": 1.4366, + "step": 37650 + }, + { + "epoch": 2.96, + "learning_rate": 1.1535966090737702e-07, + "loss": 1.4159, + "step": 37651 + }, + { + "epoch": 2.96, + "learning_rate": 1.1487552740503946e-07, + "loss": 1.4056, + "step": 37652 + }, + { + "epoch": 2.96, + "learning_rate": 1.1439241153999301e-07, + "loss": 1.4253, + "step": 37653 + }, + { + "epoch": 2.96, + "learning_rate": 1.1391031331550171e-07, + "loss": 1.444, + "step": 37654 + }, + { + "epoch": 2.96, + "learning_rate": 1.1342923273484628e-07, + "loss": 1.5204, + "step": 37655 + }, + { + "epoch": 2.96, + "learning_rate": 1.1294916980129076e-07, + "loss": 1.4966, + "step": 37656 + }, + { + "epoch": 2.96, + "learning_rate": 1.1247012451809923e-07, + "loss": 1.4241, + "step": 37657 + }, + { + "epoch": 2.96, + "learning_rate": 1.1199209688851906e-07, + "loss": 1.4014, + "step": 37658 + }, + { + "epoch": 2.96, + "learning_rate": 1.1151508691581435e-07, + "loss": 1.4524, + "step": 37659 + }, + { + "epoch": 2.96, + "learning_rate": 1.110390946031825e-07, + "loss": 1.4831, + "step": 37660 + }, + { + "epoch": 2.96, + "learning_rate": 1.1056411995388759e-07, + "loss": 1.3916, + "step": 37661 + }, + { + "epoch": 2.96, + "learning_rate": 1.100901629711437e-07, + "loss": 1.4525, + "step": 37662 + }, + { + "epoch": 2.96, + "learning_rate": 1.096172236581816e-07, + "loss": 1.432, + "step": 37663 + }, + { + "epoch": 2.96, + "learning_rate": 1.0914530201819871e-07, + "loss": 1.4153, + "step": 37664 + }, + { + "epoch": 2.96, + "learning_rate": 1.0867439805439248e-07, + "loss": 1.3847, + "step": 37665 + }, + { + "epoch": 2.96, + "learning_rate": 1.0820451176997702e-07, + "loss": 1.4648, + "step": 37666 + }, + { + "epoch": 2.96, + "learning_rate": 1.077356431681331e-07, + "loss": 1.4804, + "step": 37667 + }, + { + "epoch": 2.96, + "learning_rate": 1.0726779225205818e-07, + "loss": 1.405, + "step": 37668 + }, + { + "epoch": 2.96, + "learning_rate": 1.0680095902489971e-07, + "loss": 1.4483, + "step": 37669 + }, + { + "epoch": 2.96, + "learning_rate": 1.0633514348985516e-07, + "loss": 1.4364, + "step": 37670 + }, + { + "epoch": 2.96, + "learning_rate": 1.0587034565008867e-07, + "loss": 1.3979, + "step": 37671 + }, + { + "epoch": 2.96, + "learning_rate": 1.0540656550873105e-07, + "loss": 1.4196, + "step": 37672 + }, + { + "epoch": 2.96, + "learning_rate": 1.0494380306894645e-07, + "loss": 1.4178, + "step": 37673 + }, + { + "epoch": 2.96, + "learning_rate": 1.0448205833386569e-07, + "loss": 1.4115, + "step": 37674 + }, + { + "epoch": 2.96, + "learning_rate": 1.0402133130663626e-07, + "loss": 1.4283, + "step": 37675 + }, + { + "epoch": 2.96, + "learning_rate": 1.0356162199038897e-07, + "loss": 1.4617, + "step": 37676 + }, + { + "epoch": 2.96, + "learning_rate": 1.0310293038823802e-07, + "loss": 1.3731, + "step": 37677 + }, + { + "epoch": 2.96, + "learning_rate": 1.0264525650329757e-07, + "loss": 1.4455, + "step": 37678 + }, + { + "epoch": 2.96, + "learning_rate": 1.0218860033866517e-07, + "loss": 1.3884, + "step": 37679 + }, + { + "epoch": 2.96, + "learning_rate": 1.0173296189745495e-07, + "loss": 1.4651, + "step": 37680 + }, + { + "epoch": 2.96, + "learning_rate": 1.0127834118276445e-07, + "loss": 1.4585, + "step": 37681 + }, + { + "epoch": 2.96, + "learning_rate": 1.0082473819767456e-07, + "loss": 1.4522, + "step": 37682 + }, + { + "epoch": 2.96, + "learning_rate": 1.0037215294526613e-07, + "loss": 1.4596, + "step": 37683 + }, + { + "epoch": 2.97, + "learning_rate": 9.992058542858672e-08, + "loss": 1.4408, + "step": 37684 + }, + { + "epoch": 2.97, + "learning_rate": 9.947003565075052e-08, + "loss": 1.486, + "step": 37685 + }, + { + "epoch": 2.97, + "learning_rate": 9.902050361478842e-08, + "loss": 1.4455, + "step": 37686 + }, + { + "epoch": 2.97, + "learning_rate": 9.857198932374799e-08, + "loss": 1.4115, + "step": 37687 + }, + { + "epoch": 2.97, + "learning_rate": 9.81244927806768e-08, + "loss": 1.4268, + "step": 37688 + }, + { + "epoch": 2.97, + "learning_rate": 9.767801398862241e-08, + "loss": 1.4318, + "step": 37689 + }, + { + "epoch": 2.97, + "learning_rate": 9.723255295061572e-08, + "loss": 1.4596, + "step": 37690 + }, + { + "epoch": 2.97, + "learning_rate": 9.678810966965434e-08, + "loss": 1.4035, + "step": 37691 + }, + { + "epoch": 2.97, + "learning_rate": 9.634468414880247e-08, + "loss": 1.505, + "step": 37692 + }, + { + "epoch": 2.97, + "learning_rate": 9.590227639104109e-08, + "loss": 1.4522, + "step": 37693 + }, + { + "epoch": 2.97, + "learning_rate": 9.546088639938443e-08, + "loss": 1.4365, + "step": 37694 + }, + { + "epoch": 2.97, + "learning_rate": 9.502051417681344e-08, + "loss": 1.4028, + "step": 37695 + }, + { + "epoch": 2.97, + "learning_rate": 9.458115972632574e-08, + "loss": 1.4424, + "step": 37696 + }, + { + "epoch": 2.97, + "learning_rate": 9.414282305091891e-08, + "loss": 1.4885, + "step": 37697 + }, + { + "epoch": 2.97, + "learning_rate": 9.370550415355726e-08, + "loss": 1.4109, + "step": 37698 + }, + { + "epoch": 2.97, + "learning_rate": 9.326920303720508e-08, + "loss": 1.4333, + "step": 37699 + }, + { + "epoch": 2.97, + "learning_rate": 9.283391970482667e-08, + "loss": 1.3784, + "step": 37700 + }, + { + "epoch": 2.97, + "learning_rate": 9.239965415938633e-08, + "loss": 1.4523, + "step": 37701 + }, + { + "epoch": 2.97, + "learning_rate": 9.196640640383169e-08, + "loss": 1.4274, + "step": 37702 + }, + { + "epoch": 2.97, + "learning_rate": 9.153417644109374e-08, + "loss": 1.3814, + "step": 37703 + }, + { + "epoch": 2.97, + "learning_rate": 9.110296427410347e-08, + "loss": 1.4323, + "step": 37704 + }, + { + "epoch": 2.97, + "learning_rate": 9.067276990580851e-08, + "loss": 1.4823, + "step": 37705 + }, + { + "epoch": 2.97, + "learning_rate": 9.024359333910657e-08, + "loss": 1.4748, + "step": 37706 + }, + { + "epoch": 2.97, + "learning_rate": 8.981543457692863e-08, + "loss": 1.4338, + "step": 37707 + }, + { + "epoch": 2.97, + "learning_rate": 8.938829362218903e-08, + "loss": 1.4635, + "step": 37708 + }, + { + "epoch": 2.97, + "learning_rate": 8.896217047776877e-08, + "loss": 1.4656, + "step": 37709 + }, + { + "epoch": 2.97, + "learning_rate": 8.853706514656556e-08, + "loss": 1.4653, + "step": 37710 + }, + { + "epoch": 2.97, + "learning_rate": 8.811297763146041e-08, + "loss": 1.4876, + "step": 37711 + }, + { + "epoch": 2.97, + "learning_rate": 8.768990793535103e-08, + "loss": 1.4516, + "step": 37712 + }, + { + "epoch": 2.97, + "learning_rate": 8.726785606108511e-08, + "loss": 1.348, + "step": 37713 + }, + { + "epoch": 2.97, + "learning_rate": 8.684682201156034e-08, + "loss": 1.4463, + "step": 37714 + }, + { + "epoch": 2.97, + "learning_rate": 8.642680578960781e-08, + "loss": 1.4533, + "step": 37715 + }, + { + "epoch": 2.97, + "learning_rate": 8.600780739807523e-08, + "loss": 1.4329, + "step": 37716 + }, + { + "epoch": 2.97, + "learning_rate": 8.558982683984361e-08, + "loss": 1.459, + "step": 37717 + }, + { + "epoch": 2.97, + "learning_rate": 8.517286411771074e-08, + "loss": 1.4414, + "step": 37718 + }, + { + "epoch": 2.97, + "learning_rate": 8.475691923452432e-08, + "loss": 1.4863, + "step": 37719 + }, + { + "epoch": 2.97, + "learning_rate": 8.434199219311544e-08, + "loss": 1.4375, + "step": 37720 + }, + { + "epoch": 2.97, + "learning_rate": 8.39280829962985e-08, + "loss": 1.4234, + "step": 37721 + }, + { + "epoch": 2.97, + "learning_rate": 8.351519164687126e-08, + "loss": 1.4499, + "step": 37722 + }, + { + "epoch": 2.97, + "learning_rate": 8.310331814764814e-08, + "loss": 1.4397, + "step": 37723 + }, + { + "epoch": 2.97, + "learning_rate": 8.269246250142691e-08, + "loss": 1.449, + "step": 37724 + }, + { + "epoch": 2.97, + "learning_rate": 8.228262471098868e-08, + "loss": 1.4447, + "step": 37725 + }, + { + "epoch": 2.97, + "learning_rate": 8.187380477911454e-08, + "loss": 1.4801, + "step": 37726 + }, + { + "epoch": 2.97, + "learning_rate": 8.146600270858561e-08, + "loss": 1.4415, + "step": 37727 + }, + { + "epoch": 2.97, + "learning_rate": 8.1059218502183e-08, + "loss": 1.4557, + "step": 37728 + }, + { + "epoch": 2.97, + "learning_rate": 8.065345216263786e-08, + "loss": 1.4529, + "step": 37729 + }, + { + "epoch": 2.97, + "learning_rate": 8.024870369274793e-08, + "loss": 1.4393, + "step": 37730 + }, + { + "epoch": 2.97, + "learning_rate": 7.98449730952111e-08, + "loss": 1.4943, + "step": 37731 + }, + { + "epoch": 2.97, + "learning_rate": 7.944226037280843e-08, + "loss": 1.4111, + "step": 37732 + }, + { + "epoch": 2.97, + "learning_rate": 7.904056552825444e-08, + "loss": 1.4167, + "step": 37733 + }, + { + "epoch": 2.97, + "learning_rate": 7.863988856429692e-08, + "loss": 1.4579, + "step": 37734 + }, + { + "epoch": 2.97, + "learning_rate": 7.824022948361708e-08, + "loss": 1.4711, + "step": 37735 + }, + { + "epoch": 2.97, + "learning_rate": 7.78415882889627e-08, + "loss": 1.4029, + "step": 37736 + }, + { + "epoch": 2.97, + "learning_rate": 7.744396498303162e-08, + "loss": 1.4563, + "step": 37737 + }, + { + "epoch": 2.97, + "learning_rate": 7.70473595685217e-08, + "loss": 1.4244, + "step": 37738 + }, + { + "epoch": 2.97, + "learning_rate": 7.665177204813078e-08, + "loss": 1.4646, + "step": 37739 + }, + { + "epoch": 2.97, + "learning_rate": 7.625720242454003e-08, + "loss": 1.4246, + "step": 37740 + }, + { + "epoch": 2.97, + "learning_rate": 7.5863650700414e-08, + "loss": 1.4354, + "step": 37741 + }, + { + "epoch": 2.97, + "learning_rate": 7.547111687845054e-08, + "loss": 1.4011, + "step": 37742 + }, + { + "epoch": 2.97, + "learning_rate": 7.50796009612975e-08, + "loss": 1.4615, + "step": 37743 + }, + { + "epoch": 2.97, + "learning_rate": 7.468910295161945e-08, + "loss": 1.4545, + "step": 37744 + }, + { + "epoch": 2.97, + "learning_rate": 7.429962285206426e-08, + "loss": 1.4191, + "step": 37745 + }, + { + "epoch": 2.97, + "learning_rate": 7.391116066529646e-08, + "loss": 1.446, + "step": 37746 + }, + { + "epoch": 2.97, + "learning_rate": 7.352371639391396e-08, + "loss": 1.4539, + "step": 37747 + }, + { + "epoch": 2.97, + "learning_rate": 7.313729004058133e-08, + "loss": 1.4399, + "step": 37748 + }, + { + "epoch": 2.97, + "learning_rate": 7.275188160789647e-08, + "loss": 1.4286, + "step": 37749 + }, + { + "epoch": 2.97, + "learning_rate": 7.236749109850725e-08, + "loss": 1.3982, + "step": 37750 + }, + { + "epoch": 2.97, + "learning_rate": 7.198411851499497e-08, + "loss": 1.4587, + "step": 37751 + }, + { + "epoch": 2.97, + "learning_rate": 7.160176385997418e-08, + "loss": 1.4157, + "step": 37752 + }, + { + "epoch": 2.97, + "learning_rate": 7.122042713604281e-08, + "loss": 1.4729, + "step": 37753 + }, + { + "epoch": 2.97, + "learning_rate": 7.084010834579879e-08, + "loss": 1.452, + "step": 37754 + }, + { + "epoch": 2.97, + "learning_rate": 7.046080749179006e-08, + "loss": 1.4499, + "step": 37755 + }, + { + "epoch": 2.97, + "learning_rate": 7.008252457663122e-08, + "loss": 1.4328, + "step": 37756 + }, + { + "epoch": 2.97, + "learning_rate": 6.970525960287021e-08, + "loss": 1.5185, + "step": 37757 + }, + { + "epoch": 2.97, + "learning_rate": 6.932901257305501e-08, + "loss": 1.4076, + "step": 37758 + }, + { + "epoch": 2.97, + "learning_rate": 6.895378348978353e-08, + "loss": 1.4241, + "step": 37759 + }, + { + "epoch": 2.97, + "learning_rate": 6.857957235555378e-08, + "loss": 1.453, + "step": 37760 + }, + { + "epoch": 2.97, + "learning_rate": 6.820637917294702e-08, + "loss": 1.4481, + "step": 37761 + }, + { + "epoch": 2.97, + "learning_rate": 6.783420394447791e-08, + "loss": 1.4712, + "step": 37762 + }, + { + "epoch": 2.97, + "learning_rate": 6.746304667266111e-08, + "loss": 1.3746, + "step": 37763 + }, + { + "epoch": 2.97, + "learning_rate": 6.709290736004457e-08, + "loss": 1.4336, + "step": 37764 + }, + { + "epoch": 2.97, + "learning_rate": 6.672378600912632e-08, + "loss": 1.4664, + "step": 37765 + }, + { + "epoch": 2.97, + "learning_rate": 6.635568262240431e-08, + "loss": 1.4169, + "step": 37766 + }, + { + "epoch": 2.97, + "learning_rate": 6.598859720239325e-08, + "loss": 1.3887, + "step": 37767 + }, + { + "epoch": 2.97, + "learning_rate": 6.56225297515911e-08, + "loss": 1.4542, + "step": 37768 + }, + { + "epoch": 2.97, + "learning_rate": 6.525748027244593e-08, + "loss": 1.4289, + "step": 37769 + }, + { + "epoch": 2.97, + "learning_rate": 6.489344876748903e-08, + "loss": 1.4469, + "step": 37770 + }, + { + "epoch": 2.97, + "learning_rate": 6.45304352391518e-08, + "loss": 1.4631, + "step": 37771 + }, + { + "epoch": 2.97, + "learning_rate": 6.416843968989893e-08, + "loss": 1.4561, + "step": 37772 + }, + { + "epoch": 2.97, + "learning_rate": 6.380746212221177e-08, + "loss": 1.4797, + "step": 37773 + }, + { + "epoch": 2.97, + "learning_rate": 6.344750253853837e-08, + "loss": 1.452, + "step": 37774 + }, + { + "epoch": 2.97, + "learning_rate": 6.308856094131009e-08, + "loss": 1.436, + "step": 37775 + }, + { + "epoch": 2.97, + "learning_rate": 6.273063733295836e-08, + "loss": 1.4552, + "step": 37776 + }, + { + "epoch": 2.97, + "learning_rate": 6.237373171593119e-08, + "loss": 1.4412, + "step": 37777 + }, + { + "epoch": 2.97, + "learning_rate": 6.201784409264333e-08, + "loss": 1.3912, + "step": 37778 + }, + { + "epoch": 2.97, + "learning_rate": 6.16629744655095e-08, + "loss": 1.4261, + "step": 37779 + }, + { + "epoch": 2.97, + "learning_rate": 6.130912283694444e-08, + "loss": 1.4497, + "step": 37780 + }, + { + "epoch": 2.97, + "learning_rate": 6.095628920934625e-08, + "loss": 1.4524, + "step": 37781 + }, + { + "epoch": 2.97, + "learning_rate": 6.0604473585113e-08, + "loss": 1.4349, + "step": 37782 + }, + { + "epoch": 2.97, + "learning_rate": 6.025367596664276e-08, + "loss": 1.4474, + "step": 37783 + }, + { + "epoch": 2.97, + "learning_rate": 5.990389635628368e-08, + "loss": 1.5089, + "step": 37784 + }, + { + "epoch": 2.97, + "learning_rate": 5.955513475645046e-08, + "loss": 1.4657, + "step": 37785 + }, + { + "epoch": 2.97, + "learning_rate": 5.9207391169491244e-08, + "loss": 1.4431, + "step": 37786 + }, + { + "epoch": 2.97, + "learning_rate": 5.886066559775415e-08, + "loss": 1.3905, + "step": 37787 + }, + { + "epoch": 2.97, + "learning_rate": 5.8514958043620607e-08, + "loss": 1.4023, + "step": 37788 + }, + { + "epoch": 2.97, + "learning_rate": 5.817026850943873e-08, + "loss": 1.434, + "step": 37789 + }, + { + "epoch": 2.97, + "learning_rate": 5.782659699752334e-08, + "loss": 1.4183, + "step": 37790 + }, + { + "epoch": 2.97, + "learning_rate": 5.7483943510222563e-08, + "loss": 1.4594, + "step": 37791 + }, + { + "epoch": 2.97, + "learning_rate": 5.7142308049851206e-08, + "loss": 1.4297, + "step": 37792 + }, + { + "epoch": 2.97, + "learning_rate": 5.6801690618740735e-08, + "loss": 1.3873, + "step": 37793 + }, + { + "epoch": 2.97, + "learning_rate": 5.646209121920597e-08, + "loss": 1.4629, + "step": 37794 + }, + { + "epoch": 2.97, + "learning_rate": 5.612350985356173e-08, + "loss": 1.453, + "step": 37795 + }, + { + "epoch": 2.97, + "learning_rate": 5.578594652407287e-08, + "loss": 1.4209, + "step": 37796 + }, + { + "epoch": 2.97, + "learning_rate": 5.5449401233054195e-08, + "loss": 1.4761, + "step": 37797 + }, + { + "epoch": 2.97, + "learning_rate": 5.511387398278722e-08, + "loss": 1.4493, + "step": 37798 + }, + { + "epoch": 2.97, + "learning_rate": 5.47793647755701e-08, + "loss": 1.4411, + "step": 37799 + }, + { + "epoch": 2.97, + "learning_rate": 5.4445873613634394e-08, + "loss": 1.4469, + "step": 37800 + }, + { + "epoch": 2.97, + "learning_rate": 5.4113400499261605e-08, + "loss": 1.4152, + "step": 37801 + }, + { + "epoch": 2.97, + "learning_rate": 5.3781945434733245e-08, + "loss": 1.4492, + "step": 37802 + }, + { + "epoch": 2.97, + "learning_rate": 5.345150842224755e-08, + "loss": 1.4586, + "step": 37803 + }, + { + "epoch": 2.97, + "learning_rate": 5.312208946410268e-08, + "loss": 1.439, + "step": 37804 + }, + { + "epoch": 2.97, + "learning_rate": 5.279368856251354e-08, + "loss": 1.4399, + "step": 37805 + }, + { + "epoch": 2.97, + "learning_rate": 5.246630571969501e-08, + "loss": 1.4541, + "step": 37806 + }, + { + "epoch": 2.97, + "learning_rate": 5.2139940937878657e-08, + "loss": 1.3772, + "step": 37807 + }, + { + "epoch": 2.97, + "learning_rate": 5.181459421929601e-08, + "loss": 1.4984, + "step": 37808 + }, + { + "epoch": 2.97, + "learning_rate": 5.149026556614533e-08, + "loss": 1.4598, + "step": 37809 + }, + { + "epoch": 2.97, + "learning_rate": 5.1166954980608186e-08, + "loss": 1.4423, + "step": 37810 + }, + { + "epoch": 2.98, + "learning_rate": 5.084466246491614e-08, + "loss": 1.4699, + "step": 37811 + }, + { + "epoch": 2.98, + "learning_rate": 5.052338802123412e-08, + "loss": 1.4324, + "step": 37812 + }, + { + "epoch": 2.98, + "learning_rate": 5.0203131651760375e-08, + "loss": 1.4351, + "step": 37813 + }, + { + "epoch": 2.98, + "learning_rate": 4.988389335864318e-08, + "loss": 1.3565, + "step": 37814 + }, + { + "epoch": 2.98, + "learning_rate": 4.9565673144064125e-08, + "loss": 1.4158, + "step": 37815 + }, + { + "epoch": 2.98, + "learning_rate": 4.9248471010204795e-08, + "loss": 1.4662, + "step": 37816 + }, + { + "epoch": 2.98, + "learning_rate": 4.8932286959180165e-08, + "loss": 1.4833, + "step": 37817 + }, + { + "epoch": 2.98, + "learning_rate": 4.861712099315518e-08, + "loss": 1.4266, + "step": 37818 + }, + { + "epoch": 2.98, + "learning_rate": 4.830297311427811e-08, + "loss": 1.4373, + "step": 37819 + }, + { + "epoch": 2.98, + "learning_rate": 4.798984332466393e-08, + "loss": 1.4239, + "step": 37820 + }, + { + "epoch": 2.98, + "learning_rate": 4.767773162646094e-08, + "loss": 1.4588, + "step": 37821 + }, + { + "epoch": 2.98, + "learning_rate": 4.736663802176744e-08, + "loss": 1.3971, + "step": 37822 + }, + { + "epoch": 2.98, + "learning_rate": 4.705656251271506e-08, + "loss": 1.4958, + "step": 37823 + }, + { + "epoch": 2.98, + "learning_rate": 4.674750510138548e-08, + "loss": 1.4435, + "step": 37824 + }, + { + "epoch": 2.98, + "learning_rate": 4.643946578989366e-08, + "loss": 1.4687, + "step": 37825 + }, + { + "epoch": 2.98, + "learning_rate": 4.613244458032128e-08, + "loss": 1.3965, + "step": 37826 + }, + { + "epoch": 2.98, + "learning_rate": 4.582644147476666e-08, + "loss": 1.4661, + "step": 37827 + }, + { + "epoch": 2.98, + "learning_rate": 4.552145647529482e-08, + "loss": 1.4604, + "step": 37828 + }, + { + "epoch": 2.98, + "learning_rate": 4.521748958397076e-08, + "loss": 1.4265, + "step": 37829 + }, + { + "epoch": 2.98, + "learning_rate": 4.4914540802892804e-08, + "loss": 1.4036, + "step": 37830 + }, + { + "epoch": 2.98, + "learning_rate": 4.461261013407602e-08, + "loss": 1.4727, + "step": 37831 + }, + { + "epoch": 2.98, + "learning_rate": 4.431169757958542e-08, + "loss": 1.4327, + "step": 37832 + }, + { + "epoch": 2.98, + "learning_rate": 4.401180314146935e-08, + "loss": 1.4551, + "step": 37833 + }, + { + "epoch": 2.98, + "learning_rate": 4.371292682175953e-08, + "loss": 1.4411, + "step": 37834 + }, + { + "epoch": 2.98, + "learning_rate": 4.3415068622487667e-08, + "loss": 1.4566, + "step": 37835 + }, + { + "epoch": 2.98, + "learning_rate": 4.3118228545685474e-08, + "loss": 1.4516, + "step": 37836 + }, + { + "epoch": 2.98, + "learning_rate": 4.282240659333469e-08, + "loss": 1.4046, + "step": 37837 + }, + { + "epoch": 2.98, + "learning_rate": 4.2527602767483683e-08, + "loss": 1.4644, + "step": 37838 + }, + { + "epoch": 2.98, + "learning_rate": 4.2233817070114195e-08, + "loss": 1.3998, + "step": 37839 + }, + { + "epoch": 2.98, + "learning_rate": 4.1941049503224634e-08, + "loss": 1.511, + "step": 37840 + }, + { + "epoch": 2.98, + "learning_rate": 4.1649300068796745e-08, + "loss": 1.4367, + "step": 37841 + }, + { + "epoch": 2.98, + "learning_rate": 4.1358568768812275e-08, + "loss": 1.3848, + "step": 37842 + }, + { + "epoch": 2.98, + "learning_rate": 4.106885560525297e-08, + "loss": 1.4081, + "step": 37843 + }, + { + "epoch": 2.98, + "learning_rate": 4.078016058008393e-08, + "loss": 1.386, + "step": 37844 + }, + { + "epoch": 2.98, + "learning_rate": 4.049248369527025e-08, + "loss": 1.4411, + "step": 37845 + }, + { + "epoch": 2.98, + "learning_rate": 4.020582495274372e-08, + "loss": 1.4533, + "step": 37846 + }, + { + "epoch": 2.98, + "learning_rate": 3.992018435446942e-08, + "loss": 1.4474, + "step": 37847 + }, + { + "epoch": 2.98, + "learning_rate": 3.963556190239581e-08, + "loss": 1.4579, + "step": 37848 + }, + { + "epoch": 2.98, + "learning_rate": 3.9351957598421356e-08, + "loss": 1.4605, + "step": 37849 + }, + { + "epoch": 2.98, + "learning_rate": 3.9069371444511164e-08, + "loss": 1.4499, + "step": 37850 + }, + { + "epoch": 2.98, + "learning_rate": 3.8787803442547064e-08, + "loss": 1.4977, + "step": 37851 + }, + { + "epoch": 2.98, + "learning_rate": 3.850725359446083e-08, + "loss": 1.412, + "step": 37852 + }, + { + "epoch": 2.98, + "learning_rate": 3.822772190216761e-08, + "loss": 1.4566, + "step": 37853 + }, + { + "epoch": 2.98, + "learning_rate": 3.794920836754922e-08, + "loss": 1.4429, + "step": 37854 + }, + { + "epoch": 2.98, + "learning_rate": 3.76717129924875e-08, + "loss": 1.4368, + "step": 37855 + }, + { + "epoch": 2.98, + "learning_rate": 3.739523577889758e-08, + "loss": 1.3997, + "step": 37856 + }, + { + "epoch": 2.98, + "learning_rate": 3.7119776728627984e-08, + "loss": 1.4176, + "step": 37857 + }, + { + "epoch": 2.98, + "learning_rate": 3.684533584354388e-08, + "loss": 1.4173, + "step": 37858 + }, + { + "epoch": 2.98, + "learning_rate": 3.657191312554375e-08, + "loss": 1.4873, + "step": 37859 + }, + { + "epoch": 2.98, + "learning_rate": 3.6299508576459465e-08, + "loss": 1.5565, + "step": 37860 + }, + { + "epoch": 2.98, + "learning_rate": 3.602812219813955e-08, + "loss": 1.4664, + "step": 37861 + }, + { + "epoch": 2.98, + "learning_rate": 3.5757753992432524e-08, + "loss": 1.4097, + "step": 37862 + }, + { + "epoch": 2.98, + "learning_rate": 3.548840396118691e-08, + "loss": 1.4998, + "step": 37863 + }, + { + "epoch": 2.98, + "learning_rate": 3.522007210620126e-08, + "loss": 1.4422, + "step": 37864 + }, + { + "epoch": 2.98, + "learning_rate": 3.49527584293241e-08, + "loss": 1.472, + "step": 37865 + }, + { + "epoch": 2.98, + "learning_rate": 3.4686462932354e-08, + "loss": 1.4483, + "step": 37866 + }, + { + "epoch": 2.98, + "learning_rate": 3.442118561710616e-08, + "loss": 1.4437, + "step": 37867 + }, + { + "epoch": 2.98, + "learning_rate": 3.4156926485379157e-08, + "loss": 1.4401, + "step": 37868 + }, + { + "epoch": 2.98, + "learning_rate": 3.389368553897154e-08, + "loss": 1.4507, + "step": 37869 + }, + { + "epoch": 2.98, + "learning_rate": 3.363146277966522e-08, + "loss": 1.4686, + "step": 37870 + }, + { + "epoch": 2.98, + "learning_rate": 3.337025820924211e-08, + "loss": 1.4719, + "step": 37871 + }, + { + "epoch": 2.98, + "learning_rate": 3.311007182946745e-08, + "loss": 1.4569, + "step": 37872 + }, + { + "epoch": 2.98, + "learning_rate": 3.2850903642139826e-08, + "loss": 1.3915, + "step": 37873 + }, + { + "epoch": 2.98, + "learning_rate": 3.259275364897451e-08, + "loss": 1.4642, + "step": 37874 + }, + { + "epoch": 2.98, + "learning_rate": 3.233562185175342e-08, + "loss": 1.4674, + "step": 37875 + }, + { + "epoch": 2.98, + "learning_rate": 3.207950825222516e-08, + "loss": 1.4692, + "step": 37876 + }, + { + "epoch": 2.98, + "learning_rate": 3.182441285210502e-08, + "loss": 1.4146, + "step": 37877 + }, + { + "epoch": 2.98, + "learning_rate": 3.15703356531416e-08, + "loss": 1.4473, + "step": 37878 + }, + { + "epoch": 2.98, + "learning_rate": 3.13172766570502e-08, + "loss": 1.4337, + "step": 37879 + }, + { + "epoch": 2.98, + "learning_rate": 3.106523586556275e-08, + "loss": 1.4501, + "step": 37880 + }, + { + "epoch": 2.98, + "learning_rate": 3.0814213280377917e-08, + "loss": 1.4118, + "step": 37881 + }, + { + "epoch": 2.98, + "learning_rate": 3.0564208903210986e-08, + "loss": 1.4938, + "step": 37882 + }, + { + "epoch": 2.98, + "learning_rate": 3.031522273576059e-08, + "loss": 1.4491, + "step": 37883 + }, + { + "epoch": 2.98, + "learning_rate": 3.0067254779692076e-08, + "loss": 1.4348, + "step": 37884 + }, + { + "epoch": 2.98, + "learning_rate": 2.9820305036720724e-08, + "loss": 1.4882, + "step": 37885 + }, + { + "epoch": 2.98, + "learning_rate": 2.957437350849523e-08, + "loss": 1.4376, + "step": 37886 + }, + { + "epoch": 2.98, + "learning_rate": 2.9329460196697573e-08, + "loss": 1.4646, + "step": 37887 + }, + { + "epoch": 2.98, + "learning_rate": 2.9085565103009745e-08, + "loss": 1.4507, + "step": 37888 + }, + { + "epoch": 2.98, + "learning_rate": 2.884268822906377e-08, + "loss": 1.4251, + "step": 37889 + }, + { + "epoch": 2.98, + "learning_rate": 2.8600829576508333e-08, + "loss": 1.435, + "step": 37890 + }, + { + "epoch": 2.98, + "learning_rate": 2.8359989146992113e-08, + "loss": 1.4713, + "step": 37891 + }, + { + "epoch": 2.98, + "learning_rate": 2.812016694216379e-08, + "loss": 1.4392, + "step": 37892 + }, + { + "epoch": 2.98, + "learning_rate": 2.788136296362209e-08, + "loss": 1.4019, + "step": 37893 + }, + { + "epoch": 2.98, + "learning_rate": 2.7643577213015687e-08, + "loss": 1.4459, + "step": 37894 + }, + { + "epoch": 2.98, + "learning_rate": 2.740680969194331e-08, + "loss": 1.4746, + "step": 37895 + }, + { + "epoch": 2.98, + "learning_rate": 2.7171060402003675e-08, + "loss": 1.399, + "step": 37896 + }, + { + "epoch": 2.98, + "learning_rate": 2.693632934482881e-08, + "loss": 1.4152, + "step": 37897 + }, + { + "epoch": 2.98, + "learning_rate": 2.6702616521984134e-08, + "loss": 1.4483, + "step": 37898 + }, + { + "epoch": 2.98, + "learning_rate": 2.6469921935085016e-08, + "loss": 1.4942, + "step": 37899 + }, + { + "epoch": 2.98, + "learning_rate": 2.623824558568022e-08, + "loss": 1.4488, + "step": 37900 + }, + { + "epoch": 2.98, + "learning_rate": 2.600758747535181e-08, + "loss": 1.4497, + "step": 37901 + }, + { + "epoch": 2.98, + "learning_rate": 2.5777947605665205e-08, + "loss": 1.4387, + "step": 37902 + }, + { + "epoch": 2.98, + "learning_rate": 2.554932597818582e-08, + "loss": 1.4012, + "step": 37903 + }, + { + "epoch": 2.98, + "learning_rate": 2.5321722594479067e-08, + "loss": 1.4961, + "step": 37904 + }, + { + "epoch": 2.98, + "learning_rate": 2.50951374560604e-08, + "loss": 1.424, + "step": 37905 + }, + { + "epoch": 2.98, + "learning_rate": 2.4869570564495233e-08, + "loss": 1.4283, + "step": 37906 + }, + { + "epoch": 2.98, + "learning_rate": 2.464502192128237e-08, + "loss": 1.4328, + "step": 37907 + }, + { + "epoch": 2.98, + "learning_rate": 2.4421491527987226e-08, + "loss": 1.4066, + "step": 37908 + }, + { + "epoch": 2.98, + "learning_rate": 2.4198979386091945e-08, + "loss": 1.461, + "step": 37909 + }, + { + "epoch": 2.98, + "learning_rate": 2.3977485497128636e-08, + "loss": 1.4443, + "step": 37910 + }, + { + "epoch": 2.98, + "learning_rate": 2.37570098625961e-08, + "loss": 1.437, + "step": 37911 + }, + { + "epoch": 2.98, + "learning_rate": 2.353755248399314e-08, + "loss": 1.4287, + "step": 37912 + }, + { + "epoch": 2.98, + "learning_rate": 2.33191133628019e-08, + "loss": 1.4432, + "step": 37913 + }, + { + "epoch": 2.98, + "learning_rate": 2.310169250050453e-08, + "loss": 1.4788, + "step": 37914 + }, + { + "epoch": 2.98, + "learning_rate": 2.2885289898583183e-08, + "loss": 1.4898, + "step": 37915 + }, + { + "epoch": 2.98, + "learning_rate": 2.2669905558503343e-08, + "loss": 1.3773, + "step": 37916 + }, + { + "epoch": 2.98, + "learning_rate": 2.2455539481747164e-08, + "loss": 1.4354, + "step": 37917 + }, + { + "epoch": 2.98, + "learning_rate": 2.2242191669746833e-08, + "loss": 1.4718, + "step": 37918 + }, + { + "epoch": 2.98, + "learning_rate": 2.2029862123951193e-08, + "loss": 1.4605, + "step": 37919 + }, + { + "epoch": 2.98, + "learning_rate": 2.181855084580908e-08, + "loss": 1.4477, + "step": 37920 + }, + { + "epoch": 2.98, + "learning_rate": 2.1608257836752684e-08, + "loss": 1.4668, + "step": 37921 + }, + { + "epoch": 2.98, + "learning_rate": 2.1398983098214195e-08, + "loss": 1.3788, + "step": 37922 + }, + { + "epoch": 2.98, + "learning_rate": 2.1190726631609145e-08, + "loss": 1.4801, + "step": 37923 + }, + { + "epoch": 2.98, + "learning_rate": 2.0983488438369723e-08, + "loss": 1.4893, + "step": 37924 + }, + { + "epoch": 2.98, + "learning_rate": 2.07772685198615e-08, + "loss": 1.3803, + "step": 37925 + }, + { + "epoch": 2.98, + "learning_rate": 2.057206687753332e-08, + "loss": 1.472, + "step": 37926 + }, + { + "epoch": 2.98, + "learning_rate": 2.036788351275076e-08, + "loss": 1.4632, + "step": 37927 + }, + { + "epoch": 2.98, + "learning_rate": 2.0164718426896044e-08, + "loss": 1.4827, + "step": 37928 + }, + { + "epoch": 2.98, + "learning_rate": 1.9962571621351398e-08, + "loss": 1.4198, + "step": 37929 + }, + { + "epoch": 2.98, + "learning_rate": 1.9761443097515707e-08, + "loss": 1.4412, + "step": 37930 + }, + { + "epoch": 2.98, + "learning_rate": 1.9561332856721236e-08, + "loss": 1.3954, + "step": 37931 + }, + { + "epoch": 2.98, + "learning_rate": 1.936224090033356e-08, + "loss": 1.4513, + "step": 37932 + }, + { + "epoch": 2.98, + "learning_rate": 1.9164167229718253e-08, + "loss": 1.4307, + "step": 37933 + }, + { + "epoch": 2.98, + "learning_rate": 1.8967111846207582e-08, + "loss": 1.4847, + "step": 37934 + }, + { + "epoch": 2.98, + "learning_rate": 1.8771074751150472e-08, + "loss": 1.5143, + "step": 37935 + }, + { + "epoch": 2.98, + "learning_rate": 1.8576055945862533e-08, + "loss": 1.4997, + "step": 37936 + }, + { + "epoch": 2.98, + "learning_rate": 1.8382055431692687e-08, + "loss": 1.4458, + "step": 37937 + }, + { + "epoch": 2.99, + "learning_rate": 1.8189073209923244e-08, + "loss": 1.4213, + "step": 37938 + }, + { + "epoch": 2.99, + "learning_rate": 1.7997109281886467e-08, + "loss": 1.4659, + "step": 37939 + }, + { + "epoch": 2.99, + "learning_rate": 1.7806163648897975e-08, + "loss": 1.445, + "step": 37940 + }, + { + "epoch": 2.99, + "learning_rate": 1.761623631222342e-08, + "loss": 1.423, + "step": 37941 + }, + { + "epoch": 2.99, + "learning_rate": 1.7427327273161762e-08, + "loss": 1.3874, + "step": 37942 + }, + { + "epoch": 2.99, + "learning_rate": 1.7239436533011963e-08, + "loss": 1.4502, + "step": 37943 + }, + { + "epoch": 2.99, + "learning_rate": 1.7052564093039678e-08, + "loss": 1.4494, + "step": 37944 + }, + { + "epoch": 2.99, + "learning_rate": 1.686670995451056e-08, + "loss": 1.5077, + "step": 37945 + }, + { + "epoch": 2.99, + "learning_rate": 1.6681874118690263e-08, + "loss": 1.4187, + "step": 37946 + }, + { + "epoch": 2.99, + "learning_rate": 1.6498056586844445e-08, + "loss": 1.4348, + "step": 37947 + }, + { + "epoch": 2.99, + "learning_rate": 1.6315257360188793e-08, + "loss": 1.4656, + "step": 37948 + }, + { + "epoch": 2.99, + "learning_rate": 1.6133476439988967e-08, + "loss": 1.4393, + "step": 37949 + }, + { + "epoch": 2.99, + "learning_rate": 1.5952713827477314e-08, + "loss": 1.4082, + "step": 37950 + }, + { + "epoch": 2.99, + "learning_rate": 1.577296952388618e-08, + "loss": 1.4331, + "step": 37951 + }, + { + "epoch": 2.99, + "learning_rate": 1.5594243530414608e-08, + "loss": 1.4907, + "step": 37952 + }, + { + "epoch": 2.99, + "learning_rate": 1.5416535848311595e-08, + "loss": 1.4214, + "step": 37953 + }, + { + "epoch": 2.99, + "learning_rate": 1.523984647874288e-08, + "loss": 1.4156, + "step": 37954 + }, + { + "epoch": 2.99, + "learning_rate": 1.506417542292415e-08, + "loss": 1.4866, + "step": 37955 + }, + { + "epoch": 2.99, + "learning_rate": 1.4889522682071108e-08, + "loss": 1.4543, + "step": 37956 + }, + { + "epoch": 2.99, + "learning_rate": 1.4715888257332831e-08, + "loss": 1.4028, + "step": 37957 + }, + { + "epoch": 2.99, + "learning_rate": 1.4543272149908358e-08, + "loss": 1.4373, + "step": 37958 + }, + { + "epoch": 2.99, + "learning_rate": 1.4371674360963426e-08, + "loss": 1.3944, + "step": 37959 + }, + { + "epoch": 2.99, + "learning_rate": 1.420109489168042e-08, + "loss": 1.461, + "step": 37960 + }, + { + "epoch": 2.99, + "learning_rate": 1.403153374319177e-08, + "loss": 1.4466, + "step": 37961 + }, + { + "epoch": 2.99, + "learning_rate": 1.3862990916646555e-08, + "loss": 1.4301, + "step": 37962 + }, + { + "epoch": 2.99, + "learning_rate": 1.3695466413227163e-08, + "loss": 1.5027, + "step": 37963 + }, + { + "epoch": 2.99, + "learning_rate": 1.3528960234032716e-08, + "loss": 1.436, + "step": 37964 + }, + { + "epoch": 2.99, + "learning_rate": 1.3363472380212292e-08, + "loss": 1.4582, + "step": 37965 + }, + { + "epoch": 2.99, + "learning_rate": 1.3199002852881669e-08, + "loss": 1.4109, + "step": 37966 + }, + { + "epoch": 2.99, + "learning_rate": 1.3035551653156617e-08, + "loss": 1.4031, + "step": 37967 + }, + { + "epoch": 2.99, + "learning_rate": 1.2873118782152914e-08, + "loss": 1.411, + "step": 37968 + }, + { + "epoch": 2.99, + "learning_rate": 1.2711704240986331e-08, + "loss": 1.491, + "step": 37969 + }, + { + "epoch": 2.99, + "learning_rate": 1.2551308030722684e-08, + "loss": 1.4548, + "step": 37970 + }, + { + "epoch": 2.99, + "learning_rate": 1.2391930152461093e-08, + "loss": 1.4543, + "step": 37971 + }, + { + "epoch": 2.99, + "learning_rate": 1.223357060730068e-08, + "loss": 1.5027, + "step": 37972 + }, + { + "epoch": 2.99, + "learning_rate": 1.2076229396290605e-08, + "loss": 1.4319, + "step": 37973 + }, + { + "epoch": 2.99, + "learning_rate": 1.1919906520513333e-08, + "loss": 1.442, + "step": 37974 + }, + { + "epoch": 2.99, + "learning_rate": 1.1764601981051336e-08, + "loss": 1.4177, + "step": 37975 + }, + { + "epoch": 2.99, + "learning_rate": 1.1610315778920464e-08, + "loss": 1.4563, + "step": 37976 + }, + { + "epoch": 2.99, + "learning_rate": 1.1457047915186535e-08, + "loss": 1.4334, + "step": 37977 + }, + { + "epoch": 2.99, + "learning_rate": 1.1304798390882052e-08, + "loss": 1.4156, + "step": 37978 + }, + { + "epoch": 2.99, + "learning_rate": 1.115356720705618e-08, + "loss": 1.4608, + "step": 37979 + }, + { + "epoch": 2.99, + "learning_rate": 1.100335436472477e-08, + "loss": 1.4209, + "step": 37980 + }, + { + "epoch": 2.99, + "learning_rate": 1.0854159864903678e-08, + "loss": 1.4855, + "step": 37981 + }, + { + "epoch": 2.99, + "learning_rate": 1.0705983708625409e-08, + "loss": 1.3926, + "step": 37982 + }, + { + "epoch": 2.99, + "learning_rate": 1.0558825896872514e-08, + "loss": 1.4074, + "step": 37983 + }, + { + "epoch": 2.99, + "learning_rate": 1.0412686430660844e-08, + "loss": 1.4612, + "step": 37984 + }, + { + "epoch": 2.99, + "learning_rate": 1.0267565310972948e-08, + "loss": 1.4523, + "step": 37985 + }, + { + "epoch": 2.99, + "learning_rate": 1.0123462538791372e-08, + "loss": 1.4596, + "step": 37986 + }, + { + "epoch": 2.99, + "learning_rate": 9.980378115115317e-09, + "loss": 1.4833, + "step": 37987 + }, + { + "epoch": 2.99, + "learning_rate": 9.838312040894025e-09, + "loss": 1.4459, + "step": 37988 + }, + { + "epoch": 2.99, + "learning_rate": 9.69726431709339e-09, + "loss": 1.4929, + "step": 37989 + }, + { + "epoch": 2.99, + "learning_rate": 9.557234944679303e-09, + "loss": 1.4778, + "step": 37990 + }, + { + "epoch": 2.99, + "learning_rate": 9.418223924601009e-09, + "loss": 1.4439, + "step": 37991 + }, + { + "epoch": 2.99, + "learning_rate": 9.280231257791093e-09, + "loss": 1.4462, + "step": 37992 + }, + { + "epoch": 2.99, + "learning_rate": 9.14325694521545e-09, + "loss": 1.4235, + "step": 37993 + }, + { + "epoch": 2.99, + "learning_rate": 9.007300987773358e-09, + "loss": 1.4243, + "step": 37994 + }, + { + "epoch": 2.99, + "learning_rate": 8.872363386397407e-09, + "loss": 1.4101, + "step": 37995 + }, + { + "epoch": 2.99, + "learning_rate": 8.738444142020184e-09, + "loss": 1.4576, + "step": 37996 + }, + { + "epoch": 2.99, + "learning_rate": 8.605543255524316e-09, + "loss": 1.4726, + "step": 37997 + }, + { + "epoch": 2.99, + "learning_rate": 8.473660727825737e-09, + "loss": 1.4671, + "step": 37998 + }, + { + "epoch": 2.99, + "learning_rate": 8.342796559823727e-09, + "loss": 1.4382, + "step": 37999 + }, + { + "epoch": 2.99, + "learning_rate": 8.212950752400915e-09, + "loss": 1.4031, + "step": 38000 + }, + { + "epoch": 2.99, + "learning_rate": 8.084123306439926e-09, + "loss": 1.4139, + "step": 38001 + }, + { + "epoch": 2.99, + "learning_rate": 7.956314222806737e-09, + "loss": 1.4402, + "step": 38002 + }, + { + "epoch": 2.99, + "learning_rate": 7.829523502383973e-09, + "loss": 1.4882, + "step": 38003 + }, + { + "epoch": 2.99, + "learning_rate": 7.703751146037606e-09, + "loss": 1.4801, + "step": 38004 + }, + { + "epoch": 2.99, + "learning_rate": 7.578997154600308e-09, + "loss": 1.3937, + "step": 38005 + }, + { + "epoch": 2.99, + "learning_rate": 7.455261528921398e-09, + "loss": 1.4379, + "step": 38006 + }, + { + "epoch": 2.99, + "learning_rate": 7.3325442698668465e-09, + "loss": 1.426, + "step": 38007 + }, + { + "epoch": 2.99, + "learning_rate": 7.210845378236019e-09, + "loss": 1.421, + "step": 38008 + }, + { + "epoch": 2.99, + "learning_rate": 7.090164854878233e-09, + "loss": 1.4281, + "step": 38009 + }, + { + "epoch": 2.99, + "learning_rate": 6.9705027005928506e-09, + "loss": 1.4262, + "step": 38010 + }, + { + "epoch": 2.99, + "learning_rate": 6.851858916212538e-09, + "loss": 1.4594, + "step": 38011 + }, + { + "epoch": 2.99, + "learning_rate": 6.734233502536657e-09, + "loss": 1.4774, + "step": 38012 + }, + { + "epoch": 2.99, + "learning_rate": 6.617626460364567e-09, + "loss": 1.4472, + "step": 38013 + }, + { + "epoch": 2.99, + "learning_rate": 6.502037790495629e-09, + "loss": 1.4285, + "step": 38014 + }, + { + "epoch": 2.99, + "learning_rate": 6.387467493679244e-09, + "loss": 1.4472, + "step": 38015 + }, + { + "epoch": 2.99, + "learning_rate": 6.273915570731425e-09, + "loss": 1.4322, + "step": 38016 + }, + { + "epoch": 2.99, + "learning_rate": 6.1613820224182265e-09, + "loss": 1.4273, + "step": 38017 + }, + { + "epoch": 2.99, + "learning_rate": 6.049866849489049e-09, + "loss": 1.3849, + "step": 38018 + }, + { + "epoch": 2.99, + "learning_rate": 5.939370052709946e-09, + "loss": 1.4195, + "step": 38019 + }, + { + "epoch": 2.99, + "learning_rate": 5.829891632813666e-09, + "loss": 1.4458, + "step": 38020 + }, + { + "epoch": 2.99, + "learning_rate": 5.721431590582914e-09, + "loss": 1.4901, + "step": 38021 + }, + { + "epoch": 2.99, + "learning_rate": 5.613989926717133e-09, + "loss": 1.4249, + "step": 38022 + }, + { + "epoch": 2.99, + "learning_rate": 5.507566641949068e-09, + "loss": 1.3829, + "step": 38023 + }, + { + "epoch": 2.99, + "learning_rate": 5.402161737028121e-09, + "loss": 1.3889, + "step": 38024 + }, + { + "epoch": 2.99, + "learning_rate": 5.297775212637079e-09, + "loss": 1.5098, + "step": 38025 + }, + { + "epoch": 2.99, + "learning_rate": 5.194407069508688e-09, + "loss": 1.4516, + "step": 38026 + }, + { + "epoch": 2.99, + "learning_rate": 5.09205730834239e-09, + "loss": 1.4932, + "step": 38027 + }, + { + "epoch": 2.99, + "learning_rate": 4.990725929820971e-09, + "loss": 1.452, + "step": 38028 + }, + { + "epoch": 2.99, + "learning_rate": 4.890412934643873e-09, + "loss": 1.4619, + "step": 38029 + }, + { + "epoch": 2.99, + "learning_rate": 4.791118323477228e-09, + "loss": 1.4159, + "step": 38030 + }, + { + "epoch": 2.99, + "learning_rate": 4.692842097003824e-09, + "loss": 1.463, + "step": 38031 + }, + { + "epoch": 2.99, + "learning_rate": 4.5955842559064485e-09, + "loss": 1.3856, + "step": 38032 + }, + { + "epoch": 2.99, + "learning_rate": 4.499344800817928e-09, + "loss": 1.485, + "step": 38033 + }, + { + "epoch": 2.99, + "learning_rate": 4.404123732404397e-09, + "loss": 1.4056, + "step": 38034 + }, + { + "epoch": 2.99, + "learning_rate": 4.3099210513153345e-09, + "loss": 1.4465, + "step": 38035 + }, + { + "epoch": 2.99, + "learning_rate": 4.216736758200223e-09, + "loss": 1.4484, + "step": 38036 + }, + { + "epoch": 2.99, + "learning_rate": 4.124570853658582e-09, + "loss": 1.4459, + "step": 38037 + }, + { + "epoch": 2.99, + "learning_rate": 4.0334233383398914e-09, + "loss": 1.4482, + "step": 38038 + }, + { + "epoch": 2.99, + "learning_rate": 3.94329421287698e-09, + "loss": 1.4513, + "step": 38039 + }, + { + "epoch": 2.99, + "learning_rate": 3.854183477836059e-09, + "loss": 1.4061, + "step": 38040 + }, + { + "epoch": 2.99, + "learning_rate": 3.766091133866611e-09, + "loss": 1.4005, + "step": 38041 + }, + { + "epoch": 2.99, + "learning_rate": 3.6790171815515024e-09, + "loss": 1.3993, + "step": 38042 + }, + { + "epoch": 2.99, + "learning_rate": 3.5929616214902533e-09, + "loss": 1.4311, + "step": 38043 + }, + { + "epoch": 2.99, + "learning_rate": 3.507924454249078e-09, + "loss": 1.4015, + "step": 38044 + }, + { + "epoch": 2.99, + "learning_rate": 3.4239056804108435e-09, + "loss": 1.4475, + "step": 38045 + }, + { + "epoch": 2.99, + "learning_rate": 3.340905300541763e-09, + "loss": 1.4553, + "step": 38046 + }, + { + "epoch": 2.99, + "learning_rate": 3.258923315224704e-09, + "loss": 1.4472, + "step": 38047 + }, + { + "epoch": 2.99, + "learning_rate": 3.177959725009227e-09, + "loss": 1.4285, + "step": 38048 + }, + { + "epoch": 2.99, + "learning_rate": 3.0980145304282387e-09, + "loss": 1.4256, + "step": 38049 + }, + { + "epoch": 2.99, + "learning_rate": 3.0190877320479534e-09, + "loss": 1.4341, + "step": 38050 + }, + { + "epoch": 2.99, + "learning_rate": 2.941179330384624e-09, + "loss": 1.3726, + "step": 38051 + }, + { + "epoch": 2.99, + "learning_rate": 2.8642893259711585e-09, + "loss": 1.4355, + "step": 38052 + }, + { + "epoch": 2.99, + "learning_rate": 2.788417719340463e-09, + "loss": 1.4111, + "step": 38053 + }, + { + "epoch": 2.99, + "learning_rate": 2.713564511008792e-09, + "loss": 1.4348, + "step": 38054 + }, + { + "epoch": 2.99, + "learning_rate": 2.6397297014590923e-09, + "loss": 1.4392, + "step": 38055 + }, + { + "epoch": 2.99, + "learning_rate": 2.566913291224271e-09, + "loss": 1.481, + "step": 38056 + }, + { + "epoch": 2.99, + "learning_rate": 2.495115280770621e-09, + "loss": 1.447, + "step": 38057 + }, + { + "epoch": 2.99, + "learning_rate": 2.424335670614397e-09, + "loss": 1.4176, + "step": 38058 + }, + { + "epoch": 2.99, + "learning_rate": 2.354574461221892e-09, + "loss": 1.4493, + "step": 38059 + }, + { + "epoch": 2.99, + "learning_rate": 2.2858316530594e-09, + "loss": 1.476, + "step": 38060 + }, + { + "epoch": 2.99, + "learning_rate": 2.2181072465932147e-09, + "loss": 1.4594, + "step": 38061 + }, + { + "epoch": 2.99, + "learning_rate": 2.1514012423062833e-09, + "loss": 1.4045, + "step": 38062 + }, + { + "epoch": 2.99, + "learning_rate": 2.085713640631592e-09, + "loss": 1.4645, + "step": 38063 + }, + { + "epoch": 2.99, + "learning_rate": 2.021044442018782e-09, + "loss": 1.4029, + "step": 38064 + }, + { + "epoch": 3.0, + "learning_rate": 1.95739364690084e-09, + "loss": 1.422, + "step": 38065 + }, + { + "epoch": 3.0, + "learning_rate": 1.894761255710753e-09, + "loss": 1.3974, + "step": 38066 + }, + { + "epoch": 3.0, + "learning_rate": 1.8331472688981607e-09, + "loss": 1.4811, + "step": 38067 + }, + { + "epoch": 3.0, + "learning_rate": 1.772551686846091e-09, + "loss": 1.4983, + "step": 38068 + }, + { + "epoch": 3.0, + "learning_rate": 1.7129745099875302e-09, + "loss": 1.4089, + "step": 38069 + }, + { + "epoch": 3.0, + "learning_rate": 1.6544157387388124e-09, + "loss": 1.4513, + "step": 38070 + }, + { + "epoch": 3.0, + "learning_rate": 1.5968753734496575e-09, + "loss": 1.4888, + "step": 38071 + }, + { + "epoch": 3.0, + "learning_rate": 1.540353414569706e-09, + "loss": 1.4227, + "step": 38072 + }, + { + "epoch": 3.0, + "learning_rate": 1.4848498624320248e-09, + "loss": 1.4201, + "step": 38073 + }, + { + "epoch": 3.0, + "learning_rate": 1.4303647174529475e-09, + "loss": 1.4273, + "step": 38074 + }, + { + "epoch": 3.0, + "learning_rate": 1.3768979799821945e-09, + "loss": 1.3795, + "step": 38075 + }, + { + "epoch": 3.0, + "learning_rate": 1.324449650386139e-09, + "loss": 1.4576, + "step": 38076 + }, + { + "epoch": 3.0, + "learning_rate": 1.2730197290145016e-09, + "loss": 1.4191, + "step": 38077 + }, + { + "epoch": 3.0, + "learning_rate": 1.222608216233656e-09, + "loss": 1.4711, + "step": 38078 + }, + { + "epoch": 3.0, + "learning_rate": 1.1732151123600153e-09, + "loss": 1.4533, + "step": 38079 + }, + { + "epoch": 3.0, + "learning_rate": 1.1248404177599536e-09, + "loss": 1.4689, + "step": 38080 + }, + { + "epoch": 3.0, + "learning_rate": 1.0774841327332306e-09, + "loss": 1.4377, + "step": 38081 + }, + { + "epoch": 3.0, + "learning_rate": 1.0311462576295671e-09, + "loss": 1.4845, + "step": 38082 + }, + { + "epoch": 3.0, + "learning_rate": 9.858267927320695e-10, + "loss": 1.4464, + "step": 38083 + }, + { + "epoch": 3.0, + "learning_rate": 9.41525738373805e-10, + "loss": 1.3995, + "step": 38084 + }, + { + "epoch": 3.0, + "learning_rate": 8.982430948378805e-10, + "loss": 1.4929, + "step": 38085 + }, + { + "epoch": 3.0, + "learning_rate": 8.559788624407094e-10, + "loss": 1.4295, + "step": 38086 + }, + { + "epoch": 3.0, + "learning_rate": 8.147330414320918e-10, + "loss": 1.4512, + "step": 38087 + }, + { + "epoch": 3.0, + "learning_rate": 7.745056321450948e-10, + "loss": 1.4853, + "step": 38088 + }, + { + "epoch": 3.0, + "learning_rate": 7.352966347962119e-10, + "loss": 1.4643, + "step": 38089 + }, + { + "epoch": 3.0, + "learning_rate": 6.971060496852033e-10, + "loss": 1.4783, + "step": 38090 + }, + { + "epoch": 3.0, + "learning_rate": 6.599338770785223e-10, + "loss": 1.4419, + "step": 38091 + }, + { + "epoch": 3.0, + "learning_rate": 6.237801171926626e-10, + "loss": 1.4038, + "step": 38092 + }, + { + "epoch": 3.0, + "learning_rate": 5.886447703107311e-10, + "loss": 1.4419, + "step": 38093 + }, + { + "epoch": 3.0, + "learning_rate": 5.545278366492211e-10, + "loss": 1.4464, + "step": 38094 + }, + { + "epoch": 3.0, + "learning_rate": 5.214293164579331e-10, + "loss": 1.4558, + "step": 38095 + }, + { + "epoch": 3.0, + "learning_rate": 4.893492099367069e-10, + "loss": 1.3968, + "step": 38096 + }, + { + "epoch": 3.0, + "learning_rate": 4.582875173186895e-10, + "loss": 1.4312, + "step": 38097 + }, + { + "epoch": 3.0, + "learning_rate": 4.2824423880372104e-10, + "loss": 1.3819, + "step": 38098 + }, + { + "epoch": 3.0, + "learning_rate": 3.9921937462494835e-10, + "loss": 1.4538, + "step": 38099 + }, + { + "epoch": 3.0, + "learning_rate": 3.7121292493225153e-10, + "loss": 1.5402, + "step": 38100 + }, + { + "epoch": 3.0, + "learning_rate": 3.442248899587774e-10, + "loss": 1.4314, + "step": 38101 + }, + { + "epoch": 3.0, + "learning_rate": 3.182552698710594e-10, + "loss": 1.4789, + "step": 38102 + }, + { + "epoch": 3.0, + "learning_rate": 2.9330406485228444e-10, + "loss": 1.4952, + "step": 38103 + }, + { + "epoch": 3.0, + "learning_rate": 2.693712750523325e-10, + "loss": 1.4511, + "step": 38104 + }, + { + "epoch": 3.0, + "learning_rate": 2.464569006543904e-10, + "loss": 1.4643, + "step": 38105 + }, + { + "epoch": 3.0, + "learning_rate": 2.2456094180833828e-10, + "loss": 1.4974, + "step": 38106 + }, + { + "epoch": 3.0, + "learning_rate": 2.036833986474029e-10, + "loss": 1.425, + "step": 38107 + }, + { + "epoch": 3.0, + "learning_rate": 1.8382427133811773e-10, + "loss": 1.4331, + "step": 38108 + }, + { + "epoch": 3.0, + "learning_rate": 1.6498355999705614e-10, + "loss": 1.4042, + "step": 38109 + }, + { + "epoch": 3.0, + "learning_rate": 1.4716126477409828e-10, + "loss": 1.4844, + "step": 38110 + }, + { + "epoch": 3.0, + "learning_rate": 1.3035738575251088e-10, + "loss": 1.4571, + "step": 38111 + }, + { + "epoch": 3.0, + "learning_rate": 1.14571923082174e-10, + "loss": 1.4909, + "step": 38112 + }, + { + "epoch": 3.0, + "learning_rate": 9.980487686300776e-11, + "loss": 1.4658, + "step": 38113 + }, + { + "epoch": 3.0, + "learning_rate": 8.605624717827886e-11, + "loss": 1.4182, + "step": 38114 + }, + { + "epoch": 3.0, + "learning_rate": 7.332603412790738e-11, + "loss": 1.4711, + "step": 38115 + }, + { + "epoch": 3.0, + "learning_rate": 6.161423781181341e-11, + "loss": 1.4193, + "step": 38116 + }, + { + "epoch": 3.0, + "learning_rate": 5.0920858313263645e-11, + "loss": 1.4367, + "step": 38117 + }, + { + "epoch": 3.0, + "learning_rate": 4.12458956655648e-11, + "loss": 1.4355, + "step": 38118 + }, + { + "epoch": 3.0, + "learning_rate": 3.258934998529028e-11, + "loss": 1.482, + "step": 38119 + }, + { + "epoch": 3.0, + "learning_rate": 2.495122128909344e-11, + "loss": 1.4803, + "step": 38120 + }, + { + "epoch": 3.0, + "learning_rate": 1.8331509660240994e-11, + "loss": 1.4884, + "step": 38121 + }, + { + "epoch": 3.0, + "learning_rate": 1.27302151153863e-11, + "loss": 1.4714, + "step": 38122 + }, + { + "epoch": 3.0, + "learning_rate": 8.147337721142733e-12, + "loss": 1.3664, + "step": 38123 + }, + { + "epoch": 3.0, + "learning_rate": 4.582877477510294e-12, + "loss": 1.4175, + "step": 38124 + }, + { + "epoch": 3.0, + "learning_rate": 2.036834451102365e-12, + "loss": 1.4506, + "step": 38125 + }, + { + "epoch": 3.0, + "learning_rate": 5.092086086122549e-13, + "loss": 1.424, + "step": 38126 + }, + { + "epoch": 3.0, + "learning_rate": 0.0, + "loss": 1.4081, + "step": 38127 + }, + { + "epoch": 3.0, + "step": 38127, + "total_flos": 2.6896453959942144e+16, + "train_loss": 1.6263817286927247, + "train_runtime": 649257.4466, + "train_samples_per_second": 60.135, + "train_steps_per_second": 0.059 + } + ], + "logging_steps": 1.0, + "max_steps": 38127, + "num_input_tokens_seen": 0, + "num_train_epochs": 3, + "save_steps": 500, + "total_flos": 2.6896453959942144e+16, + "train_batch_size": 64, + "trial_name": null, + "trial_params": null +}