{ "best_metric": null, "best_model_checkpoint": null, "epoch": 4.999872737916466, "eval_steps": 500, "global_step": 24555, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0, "learning_rate": 1.2195121951219512e-06, "loss": 0.8901, "step": 1 }, { "epoch": 0.0, "learning_rate": 2.4390243902439023e-06, "loss": 0.8157, "step": 2 }, { "epoch": 0.0, "learning_rate": 3.6585365853658533e-06, "loss": 0.8273, "step": 3 }, { "epoch": 0.0, "learning_rate": 4.878048780487805e-06, "loss": 0.8642, "step": 4 }, { "epoch": 0.0, "learning_rate": 6.097560975609756e-06, "loss": 0.9531, "step": 5 }, { "epoch": 0.0, "learning_rate": 7.3170731707317065e-06, "loss": 0.7688, "step": 6 }, { "epoch": 0.0, "learning_rate": 8.536585365853657e-06, "loss": 0.9389, "step": 7 }, { "epoch": 0.0, "learning_rate": 9.75609756097561e-06, "loss": 0.8463, "step": 8 }, { "epoch": 0.0, "learning_rate": 1.0975609756097559e-05, "loss": 0.8358, "step": 9 }, { "epoch": 0.0, "learning_rate": 1.2195121951219511e-05, "loss": 0.7671, "step": 10 }, { "epoch": 0.0, "learning_rate": 1.3414634146341462e-05, "loss": 0.7806, "step": 11 }, { "epoch": 0.0, "learning_rate": 1.4634146341463413e-05, "loss": 0.8797, "step": 12 }, { "epoch": 0.0, "learning_rate": 1.5853658536585366e-05, "loss": 0.6765, "step": 13 }, { "epoch": 0.0, "learning_rate": 1.7073170731707313e-05, "loss": 0.8248, "step": 14 }, { "epoch": 0.0, "learning_rate": 1.8292682926829268e-05, "loss": 0.7479, "step": 15 }, { "epoch": 0.0, "learning_rate": 1.951219512195122e-05, "loss": 0.9234, "step": 16 }, { "epoch": 0.0, "learning_rate": 2.073170731707317e-05, "loss": 0.743, "step": 17 }, { "epoch": 0.0, "learning_rate": 2.1951219512195117e-05, "loss": 0.7324, "step": 18 }, { "epoch": 0.0, "learning_rate": 2.317073170731707e-05, "loss": 0.6685, "step": 19 }, { "epoch": 0.0, "learning_rate": 2.4390243902439022e-05, "loss": 0.6609, "step": 20 }, { "epoch": 0.0, "learning_rate": 2.5609756097560977e-05, "loss": 0.5058, "step": 21 }, { "epoch": 0.0, "learning_rate": 2.6829268292682924e-05, "loss": 0.5153, "step": 22 }, { "epoch": 0.0, "learning_rate": 2.8048780487804875e-05, "loss": 0.511, "step": 23 }, { "epoch": 0.0, "learning_rate": 2.9268292682926826e-05, "loss": 0.4987, "step": 24 }, { "epoch": 0.01, "learning_rate": 3.0487804878048777e-05, "loss": 0.4468, "step": 25 }, { "epoch": 0.01, "learning_rate": 3.170731707317073e-05, "loss": 0.4207, "step": 26 }, { "epoch": 0.01, "learning_rate": 3.292682926829268e-05, "loss": 0.3482, "step": 27 }, { "epoch": 0.01, "learning_rate": 3.4146341463414627e-05, "loss": 0.2525, "step": 28 }, { "epoch": 0.01, "learning_rate": 3.5365853658536584e-05, "loss": 0.2636, "step": 29 }, { "epoch": 0.01, "learning_rate": 3.6585365853658535e-05, "loss": 0.2023, "step": 30 }, { "epoch": 0.01, "learning_rate": 3.780487804878048e-05, "loss": 0.2962, "step": 31 }, { "epoch": 0.01, "learning_rate": 3.902439024390244e-05, "loss": 0.2923, "step": 32 }, { "epoch": 0.01, "learning_rate": 4.024390243902439e-05, "loss": 0.2076, "step": 33 }, { "epoch": 0.01, "learning_rate": 4.146341463414634e-05, "loss": 0.2102, "step": 34 }, { "epoch": 0.01, "learning_rate": 4.268292682926829e-05, "loss": 0.1848, "step": 35 }, { "epoch": 0.01, "learning_rate": 4.3902439024390234e-05, "loss": 0.2199, "step": 36 }, { "epoch": 0.01, "learning_rate": 4.512195121951219e-05, "loss": 0.1717, "step": 37 }, { "epoch": 0.01, "learning_rate": 4.634146341463414e-05, "loss": 0.2331, "step": 38 }, { "epoch": 0.01, "learning_rate": 4.7560975609756094e-05, "loss": 0.2204, "step": 39 }, { "epoch": 0.01, "learning_rate": 4.8780487804878045e-05, "loss": 0.137, "step": 40 }, { "epoch": 0.01, "learning_rate": 4.9999999999999996e-05, "loss": 0.1524, "step": 41 }, { "epoch": 0.01, "learning_rate": 5.121951219512195e-05, "loss": 0.1477, "step": 42 }, { "epoch": 0.01, "learning_rate": 5.24390243902439e-05, "loss": 0.2392, "step": 43 }, { "epoch": 0.01, "learning_rate": 5.365853658536585e-05, "loss": 0.1178, "step": 44 }, { "epoch": 0.01, "learning_rate": 5.48780487804878e-05, "loss": 0.172, "step": 45 }, { "epoch": 0.01, "learning_rate": 5.609756097560975e-05, "loss": 0.1596, "step": 46 }, { "epoch": 0.01, "learning_rate": 5.731707317073171e-05, "loss": 0.1053, "step": 47 }, { "epoch": 0.01, "learning_rate": 5.853658536585365e-05, "loss": 0.181, "step": 48 }, { "epoch": 0.01, "learning_rate": 5.97560975609756e-05, "loss": 0.1285, "step": 49 }, { "epoch": 0.01, "learning_rate": 6.0975609756097554e-05, "loss": 0.2609, "step": 50 }, { "epoch": 0.01, "learning_rate": 6.21951219512195e-05, "loss": 0.0859, "step": 51 }, { "epoch": 0.01, "learning_rate": 6.341463414634146e-05, "loss": 0.1277, "step": 52 }, { "epoch": 0.01, "learning_rate": 6.463414634146341e-05, "loss": 0.0935, "step": 53 }, { "epoch": 0.01, "learning_rate": 6.585365853658536e-05, "loss": 0.148, "step": 54 }, { "epoch": 0.01, "learning_rate": 6.707317073170731e-05, "loss": 0.0975, "step": 55 }, { "epoch": 0.01, "learning_rate": 6.829268292682925e-05, "loss": 0.1179, "step": 56 }, { "epoch": 0.01, "learning_rate": 6.951219512195121e-05, "loss": 0.0992, "step": 57 }, { "epoch": 0.01, "learning_rate": 7.073170731707317e-05, "loss": 0.1607, "step": 58 }, { "epoch": 0.01, "learning_rate": 7.195121951219511e-05, "loss": 0.1898, "step": 59 }, { "epoch": 0.01, "learning_rate": 7.317073170731707e-05, "loss": 0.0832, "step": 60 }, { "epoch": 0.01, "learning_rate": 7.439024390243901e-05, "loss": 0.1476, "step": 61 }, { "epoch": 0.01, "learning_rate": 7.560975609756096e-05, "loss": 0.1459, "step": 62 }, { "epoch": 0.01, "learning_rate": 7.682926829268292e-05, "loss": 0.1631, "step": 63 }, { "epoch": 0.01, "learning_rate": 7.804878048780487e-05, "loss": 0.1454, "step": 64 }, { "epoch": 0.01, "learning_rate": 7.926829268292682e-05, "loss": 0.1268, "step": 65 }, { "epoch": 0.01, "learning_rate": 8.048780487804878e-05, "loss": 0.1435, "step": 66 }, { "epoch": 0.01, "learning_rate": 8.170731707317072e-05, "loss": 0.1703, "step": 67 }, { "epoch": 0.01, "learning_rate": 8.292682926829268e-05, "loss": 0.1395, "step": 68 }, { "epoch": 0.01, "learning_rate": 8.414634146341464e-05, "loss": 0.1493, "step": 69 }, { "epoch": 0.01, "learning_rate": 8.536585365853658e-05, "loss": 0.0931, "step": 70 }, { "epoch": 0.01, "learning_rate": 8.658536585365854e-05, "loss": 0.1304, "step": 71 }, { "epoch": 0.01, "learning_rate": 8.780487804878047e-05, "loss": 0.0573, "step": 72 }, { "epoch": 0.01, "learning_rate": 8.902439024390243e-05, "loss": 0.1005, "step": 73 }, { "epoch": 0.02, "learning_rate": 9.024390243902438e-05, "loss": 0.1031, "step": 74 }, { "epoch": 0.02, "learning_rate": 9.146341463414633e-05, "loss": 0.1224, "step": 75 }, { "epoch": 0.02, "learning_rate": 9.268292682926829e-05, "loss": 0.1241, "step": 76 }, { "epoch": 0.02, "learning_rate": 9.390243902439023e-05, "loss": 0.1499, "step": 77 }, { "epoch": 0.02, "learning_rate": 9.512195121951219e-05, "loss": 0.065, "step": 78 }, { "epoch": 0.02, "learning_rate": 9.634146341463415e-05, "loss": 0.0461, "step": 79 }, { "epoch": 0.02, "learning_rate": 9.756097560975609e-05, "loss": 0.1377, "step": 80 }, { "epoch": 0.02, "learning_rate": 9.878048780487805e-05, "loss": 0.0652, "step": 81 }, { "epoch": 0.02, "learning_rate": 9.999999999999999e-05, "loss": 0.0434, "step": 82 }, { "epoch": 0.02, "learning_rate": 0.00010121951219512195, "loss": 0.0873, "step": 83 }, { "epoch": 0.02, "learning_rate": 0.0001024390243902439, "loss": 0.057, "step": 84 }, { "epoch": 0.02, "learning_rate": 0.00010365853658536584, "loss": 0.1902, "step": 85 }, { "epoch": 0.02, "learning_rate": 0.0001048780487804878, "loss": 0.1914, "step": 86 }, { "epoch": 0.02, "learning_rate": 0.00010609756097560974, "loss": 0.1099, "step": 87 }, { "epoch": 0.02, "learning_rate": 0.0001073170731707317, "loss": 0.1579, "step": 88 }, { "epoch": 0.02, "learning_rate": 0.00010853658536585365, "loss": 0.1448, "step": 89 }, { "epoch": 0.02, "learning_rate": 0.0001097560975609756, "loss": 0.1048, "step": 90 }, { "epoch": 0.02, "learning_rate": 0.00011097560975609756, "loss": 0.0703, "step": 91 }, { "epoch": 0.02, "learning_rate": 0.0001121951219512195, "loss": 0.0778, "step": 92 }, { "epoch": 0.02, "learning_rate": 0.00011341463414634146, "loss": 0.2221, "step": 93 }, { "epoch": 0.02, "learning_rate": 0.00011463414634146342, "loss": 0.1015, "step": 94 }, { "epoch": 0.02, "learning_rate": 0.00011585365853658535, "loss": 0.1234, "step": 95 }, { "epoch": 0.02, "learning_rate": 0.0001170731707317073, "loss": 0.0951, "step": 96 }, { "epoch": 0.02, "learning_rate": 0.00011829268292682925, "loss": 0.0773, "step": 97 }, { "epoch": 0.02, "learning_rate": 0.0001195121951219512, "loss": 0.1571, "step": 98 }, { "epoch": 0.02, "learning_rate": 0.00012073170731707316, "loss": 0.0873, "step": 99 }, { "epoch": 0.02, "learning_rate": 0.00012195121951219511, "loss": 0.0332, "step": 100 }, { "epoch": 0.02, "learning_rate": 0.00012317073170731708, "loss": 0.0526, "step": 101 }, { "epoch": 0.02, "learning_rate": 0.000124390243902439, "loss": 0.0885, "step": 102 }, { "epoch": 0.02, "learning_rate": 0.00012560975609756097, "loss": 0.1175, "step": 103 }, { "epoch": 0.02, "learning_rate": 0.00012682926829268293, "loss": 0.1182, "step": 104 }, { "epoch": 0.02, "learning_rate": 0.00012804878048780486, "loss": 0.0798, "step": 105 }, { "epoch": 0.02, "learning_rate": 0.00012926829268292681, "loss": 0.0659, "step": 106 }, { "epoch": 0.02, "learning_rate": 0.00013048780487804877, "loss": 0.0878, "step": 107 }, { "epoch": 0.02, "learning_rate": 0.00013170731707317073, "loss": 0.1082, "step": 108 }, { "epoch": 0.02, "learning_rate": 0.0001329268292682927, "loss": 0.1111, "step": 109 }, { "epoch": 0.02, "learning_rate": 0.00013414634146341462, "loss": 0.0777, "step": 110 }, { "epoch": 0.02, "learning_rate": 0.00013536585365853658, "loss": 0.0633, "step": 111 }, { "epoch": 0.02, "learning_rate": 0.0001365853658536585, "loss": 0.07, "step": 112 }, { "epoch": 0.02, "learning_rate": 0.00013780487804878046, "loss": 0.1092, "step": 113 }, { "epoch": 0.02, "learning_rate": 0.00013902439024390242, "loss": 0.0514, "step": 114 }, { "epoch": 0.02, "learning_rate": 0.00014024390243902438, "loss": 0.095, "step": 115 }, { "epoch": 0.02, "learning_rate": 0.00014146341463414634, "loss": 0.0424, "step": 116 }, { "epoch": 0.02, "learning_rate": 0.00014268292682926827, "loss": 0.037, "step": 117 }, { "epoch": 0.02, "learning_rate": 0.00014390243902439023, "loss": 0.0788, "step": 118 }, { "epoch": 0.02, "learning_rate": 0.00014512195121951218, "loss": 0.0757, "step": 119 }, { "epoch": 0.02, "learning_rate": 0.00014634146341463414, "loss": 0.0382, "step": 120 }, { "epoch": 0.02, "learning_rate": 0.0001475609756097561, "loss": 0.0711, "step": 121 }, { "epoch": 0.02, "learning_rate": 0.00014878048780487803, "loss": 0.038, "step": 122 }, { "epoch": 0.03, "learning_rate": 0.00015, "loss": 0.0515, "step": 123 }, { "epoch": 0.03, "learning_rate": 0.00015121951219512192, "loss": 0.049, "step": 124 }, { "epoch": 0.03, "learning_rate": 0.0001524390243902439, "loss": 0.0646, "step": 125 }, { "epoch": 0.03, "learning_rate": 0.00015365853658536583, "loss": 0.1073, "step": 126 }, { "epoch": 0.03, "learning_rate": 0.0001548780487804878, "loss": 0.0996, "step": 127 }, { "epoch": 0.03, "learning_rate": 0.00015609756097560975, "loss": 0.1134, "step": 128 }, { "epoch": 0.03, "learning_rate": 0.0001573170731707317, "loss": 0.1024, "step": 129 }, { "epoch": 0.03, "learning_rate": 0.00015853658536585364, "loss": 0.0958, "step": 130 }, { "epoch": 0.03, "learning_rate": 0.0001597560975609756, "loss": 0.0443, "step": 131 }, { "epoch": 0.03, "learning_rate": 0.00016097560975609755, "loss": 0.1178, "step": 132 }, { "epoch": 0.03, "learning_rate": 0.0001621951219512195, "loss": 0.082, "step": 133 }, { "epoch": 0.03, "learning_rate": 0.00016341463414634144, "loss": 0.0791, "step": 134 }, { "epoch": 0.03, "learning_rate": 0.00016463414634146343, "loss": 0.079, "step": 135 }, { "epoch": 0.03, "learning_rate": 0.00016585365853658536, "loss": 0.0666, "step": 136 }, { "epoch": 0.03, "learning_rate": 0.0001670731707317073, "loss": 0.0789, "step": 137 }, { "epoch": 0.03, "learning_rate": 0.00016829268292682927, "loss": 0.065, "step": 138 }, { "epoch": 0.03, "learning_rate": 0.0001695121951219512, "loss": 0.0548, "step": 139 }, { "epoch": 0.03, "learning_rate": 0.00017073170731707316, "loss": 0.0742, "step": 140 }, { "epoch": 0.03, "learning_rate": 0.0001719512195121951, "loss": 0.0796, "step": 141 }, { "epoch": 0.03, "learning_rate": 0.00017317073170731708, "loss": 0.1732, "step": 142 }, { "epoch": 0.03, "learning_rate": 0.000174390243902439, "loss": 0.0393, "step": 143 }, { "epoch": 0.03, "learning_rate": 0.00017560975609756094, "loss": 0.0439, "step": 144 }, { "epoch": 0.03, "learning_rate": 0.00017682926829268292, "loss": 0.1158, "step": 145 }, { "epoch": 0.03, "learning_rate": 0.00017804878048780485, "loss": 0.0425, "step": 146 }, { "epoch": 0.03, "learning_rate": 0.0001792682926829268, "loss": 0.061, "step": 147 }, { "epoch": 0.03, "learning_rate": 0.00018048780487804877, "loss": 0.0722, "step": 148 }, { "epoch": 0.03, "learning_rate": 0.00018170731707317073, "loss": 0.0714, "step": 149 }, { "epoch": 0.03, "learning_rate": 0.00018292682926829266, "loss": 0.0603, "step": 150 }, { "epoch": 0.03, "learning_rate": 0.0001841463414634146, "loss": 0.0475, "step": 151 }, { "epoch": 0.03, "learning_rate": 0.00018536585365853657, "loss": 0.0675, "step": 152 }, { "epoch": 0.03, "learning_rate": 0.00018658536585365853, "loss": 0.0315, "step": 153 }, { "epoch": 0.03, "learning_rate": 0.00018780487804878046, "loss": 0.0354, "step": 154 }, { "epoch": 0.03, "learning_rate": 0.00018902439024390244, "loss": 0.0566, "step": 155 }, { "epoch": 0.03, "learning_rate": 0.00019024390243902437, "loss": 0.0679, "step": 156 }, { "epoch": 0.03, "learning_rate": 0.0001914634146341463, "loss": 0.1309, "step": 157 }, { "epoch": 0.03, "learning_rate": 0.0001926829268292683, "loss": 0.1161, "step": 158 }, { "epoch": 0.03, "learning_rate": 0.00019390243902439022, "loss": 0.0409, "step": 159 }, { "epoch": 0.03, "learning_rate": 0.00019512195121951218, "loss": 0.0717, "step": 160 }, { "epoch": 0.03, "learning_rate": 0.0001963414634146341, "loss": 0.0329, "step": 161 }, { "epoch": 0.03, "learning_rate": 0.0001975609756097561, "loss": 0.0549, "step": 162 }, { "epoch": 0.03, "learning_rate": 0.00019878048780487802, "loss": 0.0514, "step": 163 }, { "epoch": 0.03, "learning_rate": 0.00019999999999999998, "loss": 0.0611, "step": 164 }, { "epoch": 0.03, "learning_rate": 0.00020121951219512194, "loss": 0.057, "step": 165 }, { "epoch": 0.03, "learning_rate": 0.0002024390243902439, "loss": 0.0812, "step": 166 }, { "epoch": 0.03, "learning_rate": 0.00020365853658536583, "loss": 0.0629, "step": 167 }, { "epoch": 0.03, "learning_rate": 0.0002048780487804878, "loss": 0.0566, "step": 168 }, { "epoch": 0.03, "learning_rate": 0.00020609756097560974, "loss": 0.0521, "step": 169 }, { "epoch": 0.03, "learning_rate": 0.00020731707317073167, "loss": 0.0665, "step": 170 }, { "epoch": 0.03, "learning_rate": 0.00020853658536585363, "loss": 0.033, "step": 171 }, { "epoch": 0.04, "learning_rate": 0.0002097560975609756, "loss": 0.0132, "step": 172 }, { "epoch": 0.04, "learning_rate": 0.00021097560975609755, "loss": 0.0796, "step": 173 }, { "epoch": 0.04, "learning_rate": 0.00021219512195121948, "loss": 0.0408, "step": 174 }, { "epoch": 0.04, "learning_rate": 0.00021341463414634146, "loss": 0.0795, "step": 175 }, { "epoch": 0.04, "learning_rate": 0.0002146341463414634, "loss": 0.1066, "step": 176 }, { "epoch": 0.04, "learning_rate": 0.00021585365853658535, "loss": 0.0334, "step": 177 }, { "epoch": 0.04, "learning_rate": 0.0002170731707317073, "loss": 0.0482, "step": 178 }, { "epoch": 0.04, "learning_rate": 0.00021829268292682927, "loss": 0.0386, "step": 179 }, { "epoch": 0.04, "learning_rate": 0.0002195121951219512, "loss": 0.0833, "step": 180 }, { "epoch": 0.04, "learning_rate": 0.00022073170731707313, "loss": 0.0337, "step": 181 }, { "epoch": 0.04, "learning_rate": 0.0002219512195121951, "loss": 0.0388, "step": 182 }, { "epoch": 0.04, "learning_rate": 0.00022317073170731704, "loss": 0.0646, "step": 183 }, { "epoch": 0.04, "learning_rate": 0.000224390243902439, "loss": 0.0507, "step": 184 }, { "epoch": 0.04, "learning_rate": 0.00022560975609756096, "loss": 0.0264, "step": 185 }, { "epoch": 0.04, "learning_rate": 0.00022682926829268292, "loss": 0.0459, "step": 186 }, { "epoch": 0.04, "learning_rate": 0.00022804878048780485, "loss": 0.0394, "step": 187 }, { "epoch": 0.04, "learning_rate": 0.00022926829268292683, "loss": 0.0814, "step": 188 }, { "epoch": 0.04, "learning_rate": 0.00023048780487804876, "loss": 0.0205, "step": 189 }, { "epoch": 0.04, "learning_rate": 0.0002317073170731707, "loss": 0.0395, "step": 190 }, { "epoch": 0.04, "learning_rate": 0.00023292682926829265, "loss": 0.0781, "step": 191 }, { "epoch": 0.04, "learning_rate": 0.0002341463414634146, "loss": 0.0435, "step": 192 }, { "epoch": 0.04, "learning_rate": 0.00023536585365853657, "loss": 0.0715, "step": 193 }, { "epoch": 0.04, "learning_rate": 0.0002365853658536585, "loss": 0.0657, "step": 194 }, { "epoch": 0.04, "learning_rate": 0.00023780487804878048, "loss": 0.0321, "step": 195 }, { "epoch": 0.04, "learning_rate": 0.0002390243902439024, "loss": 0.0472, "step": 196 }, { "epoch": 0.04, "learning_rate": 0.00024024390243902437, "loss": 0.0425, "step": 197 }, { "epoch": 0.04, "learning_rate": 0.00024146341463414633, "loss": 0.0681, "step": 198 }, { "epoch": 0.04, "learning_rate": 0.00024268292682926829, "loss": 0.0902, "step": 199 }, { "epoch": 0.04, "learning_rate": 0.00024390243902439022, "loss": 0.054, "step": 200 }, { "epoch": 0.04, "learning_rate": 0.0002451219512195122, "loss": 0.0395, "step": 201 }, { "epoch": 0.04, "learning_rate": 0.00024634146341463416, "loss": 0.0823, "step": 202 }, { "epoch": 0.04, "learning_rate": 0.0002475609756097561, "loss": 0.0908, "step": 203 }, { "epoch": 0.04, "learning_rate": 0.000248780487804878, "loss": 0.0745, "step": 204 }, { "epoch": 0.04, "learning_rate": 0.00025, "loss": 0.0415, "step": 205 }, { "epoch": 0.04, "learning_rate": 0.00025121951219512194, "loss": 0.0727, "step": 206 }, { "epoch": 0.04, "learning_rate": 0.00025243902439024387, "loss": 0.053, "step": 207 }, { "epoch": 0.04, "learning_rate": 0.00025365853658536585, "loss": 0.0292, "step": 208 }, { "epoch": 0.04, "learning_rate": 0.0002548780487804878, "loss": 0.0401, "step": 209 }, { "epoch": 0.04, "learning_rate": 0.0002560975609756097, "loss": 0.0338, "step": 210 }, { "epoch": 0.04, "learning_rate": 0.00025731707317073164, "loss": 0.0563, "step": 211 }, { "epoch": 0.04, "learning_rate": 0.00025853658536585363, "loss": 0.0173, "step": 212 }, { "epoch": 0.04, "learning_rate": 0.00025975609756097556, "loss": 0.0943, "step": 213 }, { "epoch": 0.04, "learning_rate": 0.00026097560975609754, "loss": 0.0493, "step": 214 }, { "epoch": 0.04, "learning_rate": 0.0002621951219512195, "loss": 0.0565, "step": 215 }, { "epoch": 0.04, "learning_rate": 0.00026341463414634146, "loss": 0.0507, "step": 216 }, { "epoch": 0.04, "learning_rate": 0.0002646341463414634, "loss": 0.0389, "step": 217 }, { "epoch": 0.04, "learning_rate": 0.0002658536585365854, "loss": 0.1022, "step": 218 }, { "epoch": 0.04, "learning_rate": 0.0002670731707317073, "loss": 0.0296, "step": 219 }, { "epoch": 0.04, "learning_rate": 0.00026829268292682924, "loss": 0.1012, "step": 220 }, { "epoch": 0.04, "learning_rate": 0.00026951219512195117, "loss": 0.0203, "step": 221 }, { "epoch": 0.05, "learning_rate": 0.00027073170731707315, "loss": 0.048, "step": 222 }, { "epoch": 0.05, "learning_rate": 0.0002719512195121951, "loss": 0.0479, "step": 223 }, { "epoch": 0.05, "learning_rate": 0.000273170731707317, "loss": 0.0735, "step": 224 }, { "epoch": 0.05, "learning_rate": 0.000274390243902439, "loss": 0.0365, "step": 225 }, { "epoch": 0.05, "learning_rate": 0.00027560975609756093, "loss": 0.0195, "step": 226 }, { "epoch": 0.05, "learning_rate": 0.0002768292682926829, "loss": 0.0254, "step": 227 }, { "epoch": 0.05, "learning_rate": 0.00027804878048780484, "loss": 0.0298, "step": 228 }, { "epoch": 0.05, "learning_rate": 0.00027926829268292683, "loss": 0.0459, "step": 229 }, { "epoch": 0.05, "learning_rate": 0.00028048780487804876, "loss": 0.0155, "step": 230 }, { "epoch": 0.05, "learning_rate": 0.0002817073170731707, "loss": 0.0237, "step": 231 }, { "epoch": 0.05, "learning_rate": 0.0002829268292682927, "loss": 0.0715, "step": 232 }, { "epoch": 0.05, "learning_rate": 0.0002841463414634146, "loss": 0.0456, "step": 233 }, { "epoch": 0.05, "learning_rate": 0.00028536585365853654, "loss": 0.077, "step": 234 }, { "epoch": 0.05, "learning_rate": 0.0002865853658536585, "loss": 0.0776, "step": 235 }, { "epoch": 0.05, "learning_rate": 0.00028780487804878045, "loss": 0.0948, "step": 236 }, { "epoch": 0.05, "learning_rate": 0.0002890243902439024, "loss": 0.1215, "step": 237 }, { "epoch": 0.05, "learning_rate": 0.00029024390243902437, "loss": 0.0517, "step": 238 }, { "epoch": 0.05, "learning_rate": 0.0002914634146341463, "loss": 0.0695, "step": 239 }, { "epoch": 0.05, "learning_rate": 0.0002926829268292683, "loss": 0.0677, "step": 240 }, { "epoch": 0.05, "learning_rate": 0.0002939024390243902, "loss": 0.0551, "step": 241 }, { "epoch": 0.05, "learning_rate": 0.0002951219512195122, "loss": 0.0429, "step": 242 }, { "epoch": 0.05, "learning_rate": 0.00029634146341463413, "loss": 0.0761, "step": 243 }, { "epoch": 0.05, "learning_rate": 0.00029756097560975606, "loss": 0.0387, "step": 244 }, { "epoch": 0.05, "learning_rate": 0.00029878048780487804, "loss": 0.0343, "step": 245 }, { "epoch": 0.05, "learning_rate": 0.0003, "loss": 0.0775, "step": 246 }, { "epoch": 0.05, "learning_rate": 0.0002999999987473584, "loss": 0.0449, "step": 247 }, { "epoch": 0.05, "learning_rate": 0.00029999999498943374, "loss": 0.0312, "step": 248 }, { "epoch": 0.05, "learning_rate": 0.0002999999887262259, "loss": 0.0471, "step": 249 }, { "epoch": 0.05, "learning_rate": 0.00029999997995773525, "loss": 0.066, "step": 250 }, { "epoch": 0.05, "learning_rate": 0.0002999999686839617, "loss": 0.0703, "step": 251 }, { "epoch": 0.05, "learning_rate": 0.0002999999549049056, "loss": 0.0565, "step": 252 }, { "epoch": 0.05, "learning_rate": 0.000299999938620567, "loss": 0.0257, "step": 253 }, { "epoch": 0.05, "learning_rate": 0.0002999999198309464, "loss": 0.0553, "step": 254 }, { "epoch": 0.05, "learning_rate": 0.0002999998985360439, "loss": 0.0673, "step": 255 }, { "epoch": 0.05, "learning_rate": 0.00029999987473586, "loss": 0.0649, "step": 256 }, { "epoch": 0.05, "learning_rate": 0.000299999848430395, "loss": 0.0242, "step": 257 }, { "epoch": 0.05, "learning_rate": 0.00029999981961964945, "loss": 0.0248, "step": 258 }, { "epoch": 0.05, "learning_rate": 0.0002999997883036237, "loss": 0.0472, "step": 259 }, { "epoch": 0.05, "learning_rate": 0.0002999997544823184, "loss": 0.0406, "step": 260 }, { "epoch": 0.05, "learning_rate": 0.00029999971815573406, "loss": 0.0873, "step": 261 }, { "epoch": 0.05, "learning_rate": 0.0002999996793238712, "loss": 0.0659, "step": 262 }, { "epoch": 0.05, "learning_rate": 0.0002999996379867306, "loss": 0.0276, "step": 263 }, { "epoch": 0.05, "learning_rate": 0.0002999995941443129, "loss": 0.0365, "step": 264 }, { "epoch": 0.05, "learning_rate": 0.00029999954779661884, "loss": 0.0623, "step": 265 }, { "epoch": 0.05, "learning_rate": 0.0002999994989436492, "loss": 0.0676, "step": 266 }, { "epoch": 0.05, "learning_rate": 0.0002999994475854048, "loss": 0.0449, "step": 267 }, { "epoch": 0.05, "learning_rate": 0.0002999993937218865, "loss": 0.0699, "step": 268 }, { "epoch": 0.05, "learning_rate": 0.00029999933735309507, "loss": 0.044, "step": 269 }, { "epoch": 0.05, "learning_rate": 0.0002999992784790316, "loss": 0.0237, "step": 270 }, { "epoch": 0.06, "learning_rate": 0.00029999921709969706, "loss": 0.1078, "step": 271 }, { "epoch": 0.06, "learning_rate": 0.0002999991532150925, "loss": 0.0534, "step": 272 }, { "epoch": 0.06, "learning_rate": 0.00029999908682521885, "loss": 0.0618, "step": 273 }, { "epoch": 0.06, "learning_rate": 0.0002999990179300774, "loss": 0.0366, "step": 274 }, { "epoch": 0.06, "learning_rate": 0.00029999894652966915, "loss": 0.0702, "step": 275 }, { "epoch": 0.06, "learning_rate": 0.0002999988726239953, "loss": 0.0368, "step": 276 }, { "epoch": 0.06, "learning_rate": 0.00029999879621305723, "loss": 0.0335, "step": 277 }, { "epoch": 0.06, "learning_rate": 0.0002999987172968561, "loss": 0.0244, "step": 278 }, { "epoch": 0.06, "learning_rate": 0.0002999986358753932, "loss": 0.0224, "step": 279 }, { "epoch": 0.06, "learning_rate": 0.00029999855194867, "loss": 0.0277, "step": 280 }, { "epoch": 0.06, "learning_rate": 0.00029999846551668775, "loss": 0.0556, "step": 281 }, { "epoch": 0.06, "learning_rate": 0.00029999837657944807, "loss": 0.0783, "step": 282 }, { "epoch": 0.06, "learning_rate": 0.0002999982851369523, "loss": 0.0527, "step": 283 }, { "epoch": 0.06, "learning_rate": 0.00029999819118920205, "loss": 0.0449, "step": 284 }, { "epoch": 0.06, "learning_rate": 0.00029999809473619886, "loss": 0.0479, "step": 285 }, { "epoch": 0.06, "learning_rate": 0.0002999979957779444, "loss": 0.0295, "step": 286 }, { "epoch": 0.06, "learning_rate": 0.0002999978943144402, "loss": 0.0519, "step": 287 }, { "epoch": 0.06, "learning_rate": 0.0002999977903456881, "loss": 0.0255, "step": 288 }, { "epoch": 0.06, "learning_rate": 0.00029999768387168967, "loss": 0.045, "step": 289 }, { "epoch": 0.06, "learning_rate": 0.0002999975748924468, "loss": 0.0483, "step": 290 }, { "epoch": 0.06, "learning_rate": 0.00029999746340796134, "loss": 0.0377, "step": 291 }, { "epoch": 0.06, "learning_rate": 0.00029999734941823505, "loss": 0.0152, "step": 292 }, { "epoch": 0.06, "learning_rate": 0.0002999972329232699, "loss": 0.0926, "step": 293 }, { "epoch": 0.06, "learning_rate": 0.00029999711392306785, "loss": 0.0415, "step": 294 }, { "epoch": 0.06, "learning_rate": 0.00029999699241763084, "loss": 0.0328, "step": 295 }, { "epoch": 0.06, "learning_rate": 0.0002999968684069609, "loss": 0.0475, "step": 296 }, { "epoch": 0.06, "learning_rate": 0.0002999967418910601, "loss": 0.0329, "step": 297 }, { "epoch": 0.06, "learning_rate": 0.0002999966128699306, "loss": 0.0323, "step": 298 }, { "epoch": 0.06, "learning_rate": 0.00029999648134357456, "loss": 0.0461, "step": 299 }, { "epoch": 0.06, "learning_rate": 0.00029999634731199407, "loss": 0.0906, "step": 300 }, { "epoch": 0.06, "learning_rate": 0.0002999962107751915, "loss": 0.0349, "step": 301 }, { "epoch": 0.06, "learning_rate": 0.000299996071733169, "loss": 0.0199, "step": 302 }, { "epoch": 0.06, "learning_rate": 0.00029999593018592905, "loss": 0.0675, "step": 303 }, { "epoch": 0.06, "learning_rate": 0.0002999957861334739, "loss": 0.0388, "step": 304 }, { "epoch": 0.06, "learning_rate": 0.000299995639575806, "loss": 0.0593, "step": 305 }, { "epoch": 0.06, "learning_rate": 0.00029999549051292775, "loss": 0.0317, "step": 306 }, { "epoch": 0.06, "learning_rate": 0.00029999533894484165, "loss": 0.0267, "step": 307 }, { "epoch": 0.06, "learning_rate": 0.0002999951848715503, "loss": 0.0891, "step": 308 }, { "epoch": 0.06, "learning_rate": 0.0002999950282930562, "loss": 0.0234, "step": 309 }, { "epoch": 0.06, "learning_rate": 0.000299994869209362, "loss": 0.0385, "step": 310 }, { "epoch": 0.06, "learning_rate": 0.0002999947076204704, "loss": 0.0474, "step": 311 }, { "epoch": 0.06, "learning_rate": 0.000299994543526384, "loss": 0.0089, "step": 312 }, { "epoch": 0.06, "learning_rate": 0.0002999943769271056, "loss": 0.0439, "step": 313 }, { "epoch": 0.06, "learning_rate": 0.00029999420782263794, "loss": 0.0282, "step": 314 }, { "epoch": 0.06, "learning_rate": 0.0002999940362129839, "loss": 0.0715, "step": 315 }, { "epoch": 0.06, "learning_rate": 0.0002999938620981463, "loss": 0.0594, "step": 316 }, { "epoch": 0.06, "learning_rate": 0.00029999368547812806, "loss": 0.0226, "step": 317 }, { "epoch": 0.06, "learning_rate": 0.00029999350635293216, "loss": 0.0359, "step": 318 }, { "epoch": 0.06, "learning_rate": 0.00029999332472256164, "loss": 0.0433, "step": 319 }, { "epoch": 0.07, "learning_rate": 0.0002999931405870194, "loss": 0.0163, "step": 320 }, { "epoch": 0.07, "learning_rate": 0.00029999295394630857, "loss": 0.1083, "step": 321 }, { "epoch": 0.07, "learning_rate": 0.0002999927648004323, "loss": 0.0328, "step": 322 }, { "epoch": 0.07, "learning_rate": 0.0002999925731493937, "loss": 0.0299, "step": 323 }, { "epoch": 0.07, "learning_rate": 0.000299992378993196, "loss": 0.0094, "step": 324 }, { "epoch": 0.07, "learning_rate": 0.0002999921823318425, "loss": 0.0228, "step": 325 }, { "epoch": 0.07, "learning_rate": 0.0002999919831653363, "loss": 0.0682, "step": 326 }, { "epoch": 0.07, "learning_rate": 0.00029999178149368096, "loss": 0.0442, "step": 327 }, { "epoch": 0.07, "learning_rate": 0.00029999157731687973, "loss": 0.017, "step": 328 }, { "epoch": 0.07, "learning_rate": 0.000299991370634936, "loss": 0.0479, "step": 329 }, { "epoch": 0.07, "learning_rate": 0.0002999911614478533, "loss": 0.1235, "step": 330 }, { "epoch": 0.07, "learning_rate": 0.00029999094975563496, "loss": 0.0237, "step": 331 }, { "epoch": 0.07, "learning_rate": 0.0002999907355582847, "loss": 0.0284, "step": 332 }, { "epoch": 0.07, "learning_rate": 0.0002999905188558061, "loss": 0.0566, "step": 333 }, { "epoch": 0.07, "learning_rate": 0.0002999902996482026, "loss": 0.0413, "step": 334 }, { "epoch": 0.07, "learning_rate": 0.00029999007793547804, "loss": 0.0412, "step": 335 }, { "epoch": 0.07, "learning_rate": 0.00029998985371763604, "loss": 0.0257, "step": 336 }, { "epoch": 0.07, "learning_rate": 0.00029998962699468037, "loss": 0.0218, "step": 337 }, { "epoch": 0.07, "learning_rate": 0.00029998939776661475, "loss": 0.059, "step": 338 }, { "epoch": 0.07, "learning_rate": 0.0002999891660334431, "loss": 0.0482, "step": 339 }, { "epoch": 0.07, "learning_rate": 0.0002999889317951692, "loss": 0.0414, "step": 340 }, { "epoch": 0.07, "learning_rate": 0.0002999886950517971, "loss": 0.0316, "step": 341 }, { "epoch": 0.07, "learning_rate": 0.0002999884558033306, "loss": 0.0361, "step": 342 }, { "epoch": 0.07, "learning_rate": 0.0002999882140497738, "loss": 0.1174, "step": 343 }, { "epoch": 0.07, "learning_rate": 0.0002999879697911307, "loss": 0.0333, "step": 344 }, { "epoch": 0.07, "learning_rate": 0.00029998772302740535, "loss": 0.0255, "step": 345 }, { "epoch": 0.07, "learning_rate": 0.0002999874737586019, "loss": 0.0219, "step": 346 }, { "epoch": 0.07, "learning_rate": 0.00029998722198472453, "loss": 0.0753, "step": 347 }, { "epoch": 0.07, "learning_rate": 0.00029998696770577746, "loss": 0.0571, "step": 348 }, { "epoch": 0.07, "learning_rate": 0.0002999867109217649, "loss": 0.0328, "step": 349 }, { "epoch": 0.07, "learning_rate": 0.0002999864516326912, "loss": 0.0689, "step": 350 }, { "epoch": 0.07, "learning_rate": 0.00029998618983856053, "loss": 0.0738, "step": 351 }, { "epoch": 0.07, "learning_rate": 0.0002999859255393774, "loss": 0.0806, "step": 352 }, { "epoch": 0.07, "learning_rate": 0.00029998565873514625, "loss": 0.0297, "step": 353 }, { "epoch": 0.07, "learning_rate": 0.00029998538942587144, "loss": 0.0424, "step": 354 }, { "epoch": 0.07, "learning_rate": 0.0002999851176115575, "loss": 0.0373, "step": 355 }, { "epoch": 0.07, "learning_rate": 0.000299984843292209, "loss": 0.0167, "step": 356 }, { "epoch": 0.07, "learning_rate": 0.00029998456646783053, "loss": 0.0345, "step": 357 }, { "epoch": 0.07, "learning_rate": 0.00029998428713842664, "loss": 0.0279, "step": 358 }, { "epoch": 0.07, "learning_rate": 0.000299984005304002, "loss": 0.041, "step": 359 }, { "epoch": 0.07, "learning_rate": 0.00029998372096456147, "loss": 0.0473, "step": 360 }, { "epoch": 0.07, "learning_rate": 0.0002999834341201096, "loss": 0.043, "step": 361 }, { "epoch": 0.07, "learning_rate": 0.0002999831447706513, "loss": 0.0319, "step": 362 }, { "epoch": 0.07, "learning_rate": 0.0002999828529161913, "loss": 0.1028, "step": 363 }, { "epoch": 0.07, "learning_rate": 0.0002999825585567347, "loss": 0.0416, "step": 364 }, { "epoch": 0.07, "learning_rate": 0.0002999822616922861, "loss": 0.0234, "step": 365 }, { "epoch": 0.07, "learning_rate": 0.0002999819623228507, "loss": 0.0228, "step": 366 }, { "epoch": 0.07, "learning_rate": 0.0002999816604484334, "loss": 0.0734, "step": 367 }, { "epoch": 0.07, "learning_rate": 0.0002999813560690392, "loss": 0.0243, "step": 368 }, { "epoch": 0.08, "learning_rate": 0.0002999810491846733, "loss": 0.0547, "step": 369 }, { "epoch": 0.08, "learning_rate": 0.00029998073979534086, "loss": 0.0342, "step": 370 }, { "epoch": 0.08, "learning_rate": 0.00029998042790104683, "loss": 0.0385, "step": 371 }, { "epoch": 0.08, "learning_rate": 0.0002999801135017966, "loss": 0.0381, "step": 372 }, { "epoch": 0.08, "learning_rate": 0.0002999797965975953, "loss": 0.0512, "step": 373 }, { "epoch": 0.08, "learning_rate": 0.00029997947718844834, "loss": 0.0407, "step": 374 }, { "epoch": 0.08, "learning_rate": 0.000299979155274361, "loss": 0.0639, "step": 375 }, { "epoch": 0.08, "learning_rate": 0.0002999788308553387, "loss": 0.0492, "step": 376 }, { "epoch": 0.08, "learning_rate": 0.0002999785039313868, "loss": 0.0318, "step": 377 }, { "epoch": 0.08, "learning_rate": 0.00029997817450251076, "loss": 0.0328, "step": 378 }, { "epoch": 0.08, "learning_rate": 0.00029997784256871607, "loss": 0.0309, "step": 379 }, { "epoch": 0.08, "learning_rate": 0.0002999775081300084, "loss": 0.0146, "step": 380 }, { "epoch": 0.08, "learning_rate": 0.0002999771711863932, "loss": 0.0512, "step": 381 }, { "epoch": 0.08, "learning_rate": 0.00029997683173787603, "loss": 0.0163, "step": 382 }, { "epoch": 0.08, "learning_rate": 0.0002999764897844628, "loss": 0.065, "step": 383 }, { "epoch": 0.08, "learning_rate": 0.00029997614532615907, "loss": 0.0522, "step": 384 }, { "epoch": 0.08, "learning_rate": 0.0002999757983629706, "loss": 0.0182, "step": 385 }, { "epoch": 0.08, "learning_rate": 0.0002999754488949032, "loss": 0.0309, "step": 386 }, { "epoch": 0.08, "learning_rate": 0.00029997509692196266, "loss": 0.0864, "step": 387 }, { "epoch": 0.08, "learning_rate": 0.000299974742444155, "loss": 0.05, "step": 388 }, { "epoch": 0.08, "learning_rate": 0.0002999743854614859, "loss": 0.0295, "step": 389 }, { "epoch": 0.08, "learning_rate": 0.0002999740259739616, "loss": 0.0582, "step": 390 }, { "epoch": 0.08, "learning_rate": 0.0002999736639815879, "loss": 0.0497, "step": 391 }, { "epoch": 0.08, "learning_rate": 0.000299973299484371, "loss": 0.0291, "step": 392 }, { "epoch": 0.08, "learning_rate": 0.0002999729324823168, "loss": 0.0294, "step": 393 }, { "epoch": 0.08, "learning_rate": 0.00029997256297543154, "loss": 0.0435, "step": 394 }, { "epoch": 0.08, "learning_rate": 0.0002999721909637214, "loss": 0.0551, "step": 395 }, { "epoch": 0.08, "learning_rate": 0.00029997181644719263, "loss": 0.0795, "step": 396 }, { "epoch": 0.08, "learning_rate": 0.0002999714394258514, "loss": 0.0455, "step": 397 }, { "epoch": 0.08, "learning_rate": 0.00029997105989970407, "loss": 0.066, "step": 398 }, { "epoch": 0.08, "learning_rate": 0.0002999706778687569, "loss": 0.041, "step": 399 }, { "epoch": 0.08, "learning_rate": 0.00029997029333301634, "loss": 0.0422, "step": 400 }, { "epoch": 0.08, "learning_rate": 0.0002999699062924888, "loss": 0.0287, "step": 401 }, { "epoch": 0.08, "learning_rate": 0.00029996951674718077, "loss": 0.0392, "step": 402 }, { "epoch": 0.08, "learning_rate": 0.00029996912469709865, "loss": 0.0752, "step": 403 }, { "epoch": 0.08, "learning_rate": 0.0002999687301422491, "loss": 0.0473, "step": 404 }, { "epoch": 0.08, "learning_rate": 0.00029996833308263863, "loss": 0.0237, "step": 405 }, { "epoch": 0.08, "learning_rate": 0.00029996793351827396, "loss": 0.024, "step": 406 }, { "epoch": 0.08, "learning_rate": 0.0002999675314491617, "loss": 0.0357, "step": 407 }, { "epoch": 0.08, "learning_rate": 0.0002999671268753086, "loss": 0.1922, "step": 408 }, { "epoch": 0.08, "learning_rate": 0.0002999667197967214, "loss": 0.0469, "step": 409 }, { "epoch": 0.08, "learning_rate": 0.00029996631021340686, "loss": 0.0371, "step": 410 }, { "epoch": 0.08, "learning_rate": 0.0002999658981253719, "loss": 0.0494, "step": 411 }, { "epoch": 0.08, "learning_rate": 0.0002999654835326233, "loss": 0.0267, "step": 412 }, { "epoch": 0.08, "learning_rate": 0.0002999650664351681, "loss": 0.0336, "step": 413 }, { "epoch": 0.08, "learning_rate": 0.0002999646468330132, "loss": 0.0438, "step": 414 }, { "epoch": 0.08, "learning_rate": 0.00029996422472616563, "loss": 0.0468, "step": 415 }, { "epoch": 0.08, "learning_rate": 0.00029996380011463236, "loss": 0.0346, "step": 416 }, { "epoch": 0.08, "learning_rate": 0.0002999633729984206, "loss": 0.0458, "step": 417 }, { "epoch": 0.09, "learning_rate": 0.00029996294337753746, "loss": 0.0544, "step": 418 }, { "epoch": 0.09, "learning_rate": 0.00029996251125199004, "loss": 0.0285, "step": 419 }, { "epoch": 0.09, "learning_rate": 0.00029996207662178566, "loss": 0.0359, "step": 420 }, { "epoch": 0.09, "learning_rate": 0.0002999616394869315, "loss": 0.0586, "step": 421 }, { "epoch": 0.09, "learning_rate": 0.00029996119984743494, "loss": 0.0186, "step": 422 }, { "epoch": 0.09, "learning_rate": 0.0002999607577033032, "loss": 0.0878, "step": 423 }, { "epoch": 0.09, "learning_rate": 0.0002999603130545437, "loss": 0.0458, "step": 424 }, { "epoch": 0.09, "learning_rate": 0.000299959865901164, "loss": 0.0275, "step": 425 }, { "epoch": 0.09, "learning_rate": 0.0002999594162431714, "loss": 0.047, "step": 426 }, { "epoch": 0.09, "learning_rate": 0.00029995896408057353, "loss": 0.039, "step": 427 }, { "epoch": 0.09, "learning_rate": 0.0002999585094133779, "loss": 0.0205, "step": 428 }, { "epoch": 0.09, "learning_rate": 0.0002999580522415921, "loss": 0.0461, "step": 429 }, { "epoch": 0.09, "learning_rate": 0.0002999575925652237, "loss": 0.0402, "step": 430 }, { "epoch": 0.09, "learning_rate": 0.00029995713038428047, "loss": 0.0374, "step": 431 }, { "epoch": 0.09, "learning_rate": 0.0002999566656987701, "loss": 0.0364, "step": 432 }, { "epoch": 0.09, "learning_rate": 0.00029995619850870035, "loss": 0.0323, "step": 433 }, { "epoch": 0.09, "learning_rate": 0.00029995572881407904, "loss": 0.019, "step": 434 }, { "epoch": 0.09, "learning_rate": 0.00029995525661491397, "loss": 0.0288, "step": 435 }, { "epoch": 0.09, "learning_rate": 0.00029995478191121303, "loss": 0.0924, "step": 436 }, { "epoch": 0.09, "learning_rate": 0.00029995430470298426, "loss": 0.0281, "step": 437 }, { "epoch": 0.09, "learning_rate": 0.00029995382499023546, "loss": 0.0294, "step": 438 }, { "epoch": 0.09, "learning_rate": 0.0002999533427729747, "loss": 0.0258, "step": 439 }, { "epoch": 0.09, "learning_rate": 0.00029995285805121014, "loss": 0.0251, "step": 440 }, { "epoch": 0.09, "learning_rate": 0.00029995237082494977, "loss": 0.0313, "step": 441 }, { "epoch": 0.09, "learning_rate": 0.00029995188109420174, "loss": 0.0313, "step": 442 }, { "epoch": 0.09, "learning_rate": 0.0002999513888589743, "loss": 0.1238, "step": 443 }, { "epoch": 0.09, "learning_rate": 0.0002999508941192755, "loss": 0.0306, "step": 444 }, { "epoch": 0.09, "learning_rate": 0.0002999503968751138, "loss": 0.0107, "step": 445 }, { "epoch": 0.09, "learning_rate": 0.0002999498971264974, "loss": 0.0273, "step": 446 }, { "epoch": 0.09, "learning_rate": 0.00029994939487343466, "loss": 0.0164, "step": 447 }, { "epoch": 0.09, "learning_rate": 0.000299948890115934, "loss": 0.0267, "step": 448 }, { "epoch": 0.09, "learning_rate": 0.0002999483828540038, "loss": 0.0129, "step": 449 }, { "epoch": 0.09, "learning_rate": 0.0002999478730876526, "loss": 0.0254, "step": 450 }, { "epoch": 0.09, "learning_rate": 0.0002999473608168888, "loss": 0.031, "step": 451 }, { "epoch": 0.09, "learning_rate": 0.00029994684604172105, "loss": 0.0982, "step": 452 }, { "epoch": 0.09, "learning_rate": 0.000299946328762158, "loss": 0.0381, "step": 453 }, { "epoch": 0.09, "learning_rate": 0.00029994580897820813, "loss": 0.0204, "step": 454 }, { "epoch": 0.09, "learning_rate": 0.00029994528668988025, "loss": 0.0847, "step": 455 }, { "epoch": 0.09, "learning_rate": 0.000299944761897183, "loss": 0.0379, "step": 456 }, { "epoch": 0.09, "learning_rate": 0.0002999442346001252, "loss": 0.0463, "step": 457 }, { "epoch": 0.09, "learning_rate": 0.00029994370479871564, "loss": 0.0167, "step": 458 }, { "epoch": 0.09, "learning_rate": 0.00029994317249296327, "loss": 0.0333, "step": 459 }, { "epoch": 0.09, "learning_rate": 0.00029994263768287675, "loss": 0.0304, "step": 460 }, { "epoch": 0.09, "learning_rate": 0.0002999421003684652, "loss": 0.0495, "step": 461 }, { "epoch": 0.09, "learning_rate": 0.00029994156054973756, "loss": 0.0307, "step": 462 }, { "epoch": 0.09, "learning_rate": 0.0002999410182267028, "loss": 0.0239, "step": 463 }, { "epoch": 0.09, "learning_rate": 0.00029994047339936995, "loss": 0.0465, "step": 464 }, { "epoch": 0.09, "learning_rate": 0.00029993992606774825, "loss": 0.0422, "step": 465 }, { "epoch": 0.09, "learning_rate": 0.00029993937623184666, "loss": 0.0216, "step": 466 }, { "epoch": 0.1, "learning_rate": 0.00029993882389167453, "loss": 0.0112, "step": 467 }, { "epoch": 0.1, "learning_rate": 0.000299938269047241, "loss": 0.0537, "step": 468 }, { "epoch": 0.1, "learning_rate": 0.0002999377116985553, "loss": 0.0138, "step": 469 }, { "epoch": 0.1, "learning_rate": 0.00029993715184562685, "loss": 0.0543, "step": 470 }, { "epoch": 0.1, "learning_rate": 0.00029993658948846493, "loss": 0.0188, "step": 471 }, { "epoch": 0.1, "learning_rate": 0.0002999360246270789, "loss": 0.0416, "step": 472 }, { "epoch": 0.1, "learning_rate": 0.0002999354572614783, "loss": 0.0357, "step": 473 }, { "epoch": 0.1, "learning_rate": 0.0002999348873916725, "loss": 0.0678, "step": 474 }, { "epoch": 0.1, "learning_rate": 0.00029993431501767104, "loss": 0.0173, "step": 475 }, { "epoch": 0.1, "learning_rate": 0.0002999337401394835, "loss": 0.0153, "step": 476 }, { "epoch": 0.1, "learning_rate": 0.00029993316275711947, "loss": 0.0297, "step": 477 }, { "epoch": 0.1, "learning_rate": 0.00029993258287058864, "loss": 0.0197, "step": 478 }, { "epoch": 0.1, "learning_rate": 0.00029993200047990067, "loss": 0.0749, "step": 479 }, { "epoch": 0.1, "learning_rate": 0.0002999314155850652, "loss": 0.0162, "step": 480 }, { "epoch": 0.1, "learning_rate": 0.00029993082818609214, "loss": 0.0192, "step": 481 }, { "epoch": 0.1, "learning_rate": 0.0002999302382829912, "loss": 0.0219, "step": 482 }, { "epoch": 0.1, "learning_rate": 0.0002999296458757723, "loss": 0.0655, "step": 483 }, { "epoch": 0.1, "learning_rate": 0.00029992905096444533, "loss": 0.035, "step": 484 }, { "epoch": 0.1, "learning_rate": 0.0002999284535490201, "loss": 0.0394, "step": 485 }, { "epoch": 0.1, "learning_rate": 0.0002999278536295068, "loss": 0.0267, "step": 486 }, { "epoch": 0.1, "learning_rate": 0.00029992725120591524, "loss": 0.1209, "step": 487 }, { "epoch": 0.1, "learning_rate": 0.0002999266462782556, "loss": 0.0161, "step": 488 }, { "epoch": 0.1, "learning_rate": 0.000299926038846538, "loss": 0.052, "step": 489 }, { "epoch": 0.1, "learning_rate": 0.0002999254289107725, "loss": 0.0173, "step": 490 }, { "epoch": 0.1, "learning_rate": 0.00029992481647096936, "loss": 0.0156, "step": 491 }, { "epoch": 0.1, "learning_rate": 0.0002999242015271388, "loss": 0.0196, "step": 492 }, { "epoch": 0.1, "learning_rate": 0.000299923584079291, "loss": 0.0817, "step": 493 }, { "epoch": 0.1, "learning_rate": 0.0002999229641274364, "loss": 0.0555, "step": 494 }, { "epoch": 0.1, "learning_rate": 0.00029992234167158533, "loss": 0.0125, "step": 495 }, { "epoch": 0.1, "learning_rate": 0.0002999217167117481, "loss": 0.0328, "step": 496 }, { "epoch": 0.1, "learning_rate": 0.00029992108924793524, "loss": 0.0158, "step": 497 }, { "epoch": 0.1, "learning_rate": 0.00029992045928015716, "loss": 0.0369, "step": 498 }, { "epoch": 0.1, "learning_rate": 0.00029991982680842446, "loss": 0.0415, "step": 499 }, { "epoch": 0.1, "learning_rate": 0.0002999191918327476, "loss": 0.0427, "step": 500 }, { "epoch": 0.1, "learning_rate": 0.00029991855435313727, "loss": 0.0343, "step": 501 }, { "epoch": 0.1, "learning_rate": 0.0002999179143696041, "loss": 0.038, "step": 502 }, { "epoch": 0.1, "learning_rate": 0.00029991727188215874, "loss": 0.0356, "step": 503 }, { "epoch": 0.1, "learning_rate": 0.000299916626890812, "loss": 0.0559, "step": 504 }, { "epoch": 0.1, "learning_rate": 0.0002999159793955746, "loss": 0.0313, "step": 505 }, { "epoch": 0.1, "learning_rate": 0.0002999153293964573, "loss": 0.042, "step": 506 }, { "epoch": 0.1, "learning_rate": 0.00029991467689347105, "loss": 0.0371, "step": 507 }, { "epoch": 0.1, "learning_rate": 0.0002999140218866267, "loss": 0.0455, "step": 508 }, { "epoch": 0.1, "learning_rate": 0.00029991336437593525, "loss": 0.0172, "step": 509 }, { "epoch": 0.1, "learning_rate": 0.0002999127043614076, "loss": 0.0225, "step": 510 }, { "epoch": 0.1, "learning_rate": 0.00029991204184305473, "loss": 0.078, "step": 511 }, { "epoch": 0.1, "learning_rate": 0.0002999113768208879, "loss": 0.0672, "step": 512 }, { "epoch": 0.1, "learning_rate": 0.00029991070929491807, "loss": 0.0223, "step": 513 }, { "epoch": 0.1, "learning_rate": 0.00029991003926515636, "loss": 0.0547, "step": 514 }, { "epoch": 0.1, "learning_rate": 0.0002999093667316141, "loss": 0.0291, "step": 515 }, { "epoch": 0.11, "learning_rate": 0.0002999086916943024, "loss": 0.0329, "step": 516 }, { "epoch": 0.11, "learning_rate": 0.00029990801415323256, "loss": 0.0163, "step": 517 }, { "epoch": 0.11, "learning_rate": 0.00029990733410841593, "loss": 0.0777, "step": 518 }, { "epoch": 0.11, "learning_rate": 0.00029990665155986385, "loss": 0.0461, "step": 519 }, { "epoch": 0.11, "learning_rate": 0.0002999059665075877, "loss": 0.0131, "step": 520 }, { "epoch": 0.11, "learning_rate": 0.00029990527895159896, "loss": 0.0534, "step": 521 }, { "epoch": 0.11, "learning_rate": 0.0002999045888919091, "loss": 0.0393, "step": 522 }, { "epoch": 0.11, "learning_rate": 0.00029990389632852965, "loss": 0.0131, "step": 523 }, { "epoch": 0.11, "learning_rate": 0.00029990320126147213, "loss": 0.0243, "step": 524 }, { "epoch": 0.11, "learning_rate": 0.00029990250369074824, "loss": 0.0116, "step": 525 }, { "epoch": 0.11, "learning_rate": 0.00029990180361636956, "loss": 0.0492, "step": 526 }, { "epoch": 0.11, "learning_rate": 0.0002999011010383478, "loss": 0.041, "step": 527 }, { "epoch": 0.11, "learning_rate": 0.0002999003959566947, "loss": 0.0407, "step": 528 }, { "epoch": 0.11, "learning_rate": 0.000299899688371422, "loss": 0.2534, "step": 529 }, { "epoch": 0.11, "learning_rate": 0.00029989897828254156, "loss": 0.027, "step": 530 }, { "epoch": 0.11, "learning_rate": 0.00029989826569006527, "loss": 0.0198, "step": 531 }, { "epoch": 0.11, "learning_rate": 0.00029989755059400494, "loss": 0.058, "step": 532 }, { "epoch": 0.11, "learning_rate": 0.00029989683299437255, "loss": 0.0579, "step": 533 }, { "epoch": 0.11, "learning_rate": 0.00029989611289118014, "loss": 0.0291, "step": 534 }, { "epoch": 0.11, "learning_rate": 0.00029989539028443964, "loss": 0.0258, "step": 535 }, { "epoch": 0.11, "learning_rate": 0.00029989466517416324, "loss": 0.073, "step": 536 }, { "epoch": 0.11, "learning_rate": 0.000299893937560363, "loss": 0.0203, "step": 537 }, { "epoch": 0.11, "learning_rate": 0.000299893207443051, "loss": 0.0359, "step": 538 }, { "epoch": 0.11, "learning_rate": 0.0002998924748222395, "loss": 0.0169, "step": 539 }, { "epoch": 0.11, "learning_rate": 0.00029989173969794075, "loss": 0.1368, "step": 540 }, { "epoch": 0.11, "learning_rate": 0.00029989100207016695, "loss": 0.1126, "step": 541 }, { "epoch": 0.11, "learning_rate": 0.00029989026193893054, "loss": 0.0576, "step": 542 }, { "epoch": 0.11, "learning_rate": 0.0002998895193042438, "loss": 0.0325, "step": 543 }, { "epoch": 0.11, "learning_rate": 0.0002998887741661192, "loss": 0.0252, "step": 544 }, { "epoch": 0.11, "learning_rate": 0.00029988802652456905, "loss": 0.0448, "step": 545 }, { "epoch": 0.11, "learning_rate": 0.000299887276379606, "loss": 0.0238, "step": 546 }, { "epoch": 0.11, "learning_rate": 0.0002998865237312424, "loss": 0.0453, "step": 547 }, { "epoch": 0.11, "learning_rate": 0.000299885768579491, "loss": 0.0385, "step": 548 }, { "epoch": 0.11, "learning_rate": 0.0002998850109243643, "loss": 0.0537, "step": 549 }, { "epoch": 0.11, "learning_rate": 0.000299884250765875, "loss": 0.0779, "step": 550 }, { "epoch": 0.11, "learning_rate": 0.0002998834881040358, "loss": 0.0126, "step": 551 }, { "epoch": 0.11, "learning_rate": 0.00029988272293885945, "loss": 0.0237, "step": 552 }, { "epoch": 0.11, "learning_rate": 0.0002998819552703587, "loss": 0.0321, "step": 553 }, { "epoch": 0.11, "learning_rate": 0.0002998811850985463, "loss": 0.0117, "step": 554 }, { "epoch": 0.11, "learning_rate": 0.0002998804124234353, "loss": 0.019, "step": 555 }, { "epoch": 0.11, "learning_rate": 0.0002998796372450384, "loss": 0.0246, "step": 556 }, { "epoch": 0.11, "learning_rate": 0.0002998788595633687, "loss": 0.0217, "step": 557 }, { "epoch": 0.11, "learning_rate": 0.00029987807937843905, "loss": 0.0308, "step": 558 }, { "epoch": 0.11, "learning_rate": 0.00029987729669026257, "loss": 0.0623, "step": 559 }, { "epoch": 0.11, "learning_rate": 0.00029987651149885236, "loss": 0.0433, "step": 560 }, { "epoch": 0.11, "learning_rate": 0.00029987572380422154, "loss": 0.027, "step": 561 }, { "epoch": 0.11, "learning_rate": 0.00029987493360638317, "loss": 0.0382, "step": 562 }, { "epoch": 0.11, "learning_rate": 0.0002998741409053505, "loss": 0.0132, "step": 563 }, { "epoch": 0.11, "learning_rate": 0.00029987334570113675, "loss": 0.0408, "step": 564 }, { "epoch": 0.12, "learning_rate": 0.00029987254799375526, "loss": 0.0428, "step": 565 }, { "epoch": 0.12, "learning_rate": 0.0002998717477832193, "loss": 0.0393, "step": 566 }, { "epoch": 0.12, "learning_rate": 0.00029987094506954225, "loss": 0.0284, "step": 567 }, { "epoch": 0.12, "learning_rate": 0.0002998701398527375, "loss": 0.0497, "step": 568 }, { "epoch": 0.12, "learning_rate": 0.0002998693321328185, "loss": 0.0401, "step": 569 }, { "epoch": 0.12, "learning_rate": 0.0002998685219097988, "loss": 0.0142, "step": 570 }, { "epoch": 0.12, "learning_rate": 0.00029986770918369185, "loss": 0.0416, "step": 571 }, { "epoch": 0.12, "learning_rate": 0.0002998668939545113, "loss": 0.061, "step": 572 }, { "epoch": 0.12, "learning_rate": 0.0002998660762222707, "loss": 0.0388, "step": 573 }, { "epoch": 0.12, "learning_rate": 0.00029986525598698374, "loss": 0.0257, "step": 574 }, { "epoch": 0.12, "learning_rate": 0.00029986443324866416, "loss": 0.0392, "step": 575 }, { "epoch": 0.12, "learning_rate": 0.0002998636080073256, "loss": 0.0168, "step": 576 }, { "epoch": 0.12, "learning_rate": 0.0002998627802629819, "loss": 0.0471, "step": 577 }, { "epoch": 0.12, "learning_rate": 0.00029986195001564694, "loss": 0.0265, "step": 578 }, { "epoch": 0.12, "learning_rate": 0.0002998611172653345, "loss": 0.027, "step": 579 }, { "epoch": 0.12, "learning_rate": 0.0002998602820120585, "loss": 0.0864, "step": 580 }, { "epoch": 0.12, "learning_rate": 0.0002998594442558329, "loss": 0.0415, "step": 581 }, { "epoch": 0.12, "learning_rate": 0.0002998586039966717, "loss": 0.0397, "step": 582 }, { "epoch": 0.12, "learning_rate": 0.000299857761234589, "loss": 0.0205, "step": 583 }, { "epoch": 0.12, "learning_rate": 0.0002998569159695987, "loss": 0.1261, "step": 584 }, { "epoch": 0.12, "learning_rate": 0.0002998560682017151, "loss": 0.0415, "step": 585 }, { "epoch": 0.12, "learning_rate": 0.00029985521793095233, "loss": 0.0407, "step": 586 }, { "epoch": 0.12, "learning_rate": 0.00029985436515732447, "loss": 0.0715, "step": 587 }, { "epoch": 0.12, "learning_rate": 0.00029985350988084587, "loss": 0.0418, "step": 588 }, { "epoch": 0.12, "learning_rate": 0.0002998526521015308, "loss": 0.0415, "step": 589 }, { "epoch": 0.12, "learning_rate": 0.00029985179181939354, "loss": 0.0334, "step": 590 }, { "epoch": 0.12, "learning_rate": 0.0002998509290344485, "loss": 0.0502, "step": 591 }, { "epoch": 0.12, "learning_rate": 0.0002998500637467101, "loss": 0.0339, "step": 592 }, { "epoch": 0.12, "learning_rate": 0.00029984919595619277, "loss": 0.0311, "step": 593 }, { "epoch": 0.12, "learning_rate": 0.000299848325662911, "loss": 0.0446, "step": 594 }, { "epoch": 0.12, "learning_rate": 0.0002998474528668793, "loss": 0.0215, "step": 595 }, { "epoch": 0.12, "learning_rate": 0.00029984657756811236, "loss": 0.1002, "step": 596 }, { "epoch": 0.12, "learning_rate": 0.00029984569976662466, "loss": 0.0143, "step": 597 }, { "epoch": 0.12, "learning_rate": 0.0002998448194624309, "loss": 0.0291, "step": 598 }, { "epoch": 0.12, "learning_rate": 0.00029984393665554587, "loss": 0.0712, "step": 599 }, { "epoch": 0.12, "learning_rate": 0.0002998430513459842, "loss": 0.0251, "step": 600 }, { "epoch": 0.12, "learning_rate": 0.00029984216353376073, "loss": 0.0355, "step": 601 }, { "epoch": 0.12, "learning_rate": 0.0002998412732188903, "loss": 0.0273, "step": 602 }, { "epoch": 0.12, "learning_rate": 0.00029984038040138775, "loss": 0.0589, "step": 603 }, { "epoch": 0.12, "learning_rate": 0.000299839485081268, "loss": 0.0755, "step": 604 }, { "epoch": 0.12, "learning_rate": 0.000299838587258546, "loss": 0.0361, "step": 605 }, { "epoch": 0.12, "learning_rate": 0.0002998376869332368, "loss": 0.0464, "step": 606 }, { "epoch": 0.12, "learning_rate": 0.00029983678410535535, "loss": 0.0323, "step": 607 }, { "epoch": 0.12, "learning_rate": 0.00029983587877491675, "loss": 0.0538, "step": 608 }, { "epoch": 0.12, "learning_rate": 0.0002998349709419362, "loss": 0.0169, "step": 609 }, { "epoch": 0.12, "learning_rate": 0.00029983406060642875, "loss": 0.0379, "step": 610 }, { "epoch": 0.12, "learning_rate": 0.00029983314776840965, "loss": 0.0193, "step": 611 }, { "epoch": 0.12, "learning_rate": 0.0002998322324278942, "loss": 0.0131, "step": 612 }, { "epoch": 0.12, "learning_rate": 0.0002998313145848976, "loss": 0.0596, "step": 613 }, { "epoch": 0.13, "learning_rate": 0.0002998303942394352, "loss": 0.0403, "step": 614 }, { "epoch": 0.13, "learning_rate": 0.00029982947139152243, "loss": 0.0151, "step": 615 }, { "epoch": 0.13, "learning_rate": 0.00029982854604117465, "loss": 0.0403, "step": 616 }, { "epoch": 0.13, "learning_rate": 0.0002998276181884074, "loss": 0.0158, "step": 617 }, { "epoch": 0.13, "learning_rate": 0.000299826687833236, "loss": 0.0276, "step": 618 }, { "epoch": 0.13, "learning_rate": 0.00029982575497567614, "loss": 0.0393, "step": 619 }, { "epoch": 0.13, "learning_rate": 0.00029982481961574335, "loss": 0.0806, "step": 620 }, { "epoch": 0.13, "learning_rate": 0.00029982388175345324, "loss": 0.037, "step": 621 }, { "epoch": 0.13, "learning_rate": 0.00029982294138882154, "loss": 0.0247, "step": 622 }, { "epoch": 0.13, "learning_rate": 0.00029982199852186385, "loss": 0.0458, "step": 623 }, { "epoch": 0.13, "learning_rate": 0.000299821053152596, "loss": 0.0196, "step": 624 }, { "epoch": 0.13, "learning_rate": 0.0002998201052810338, "loss": 0.0942, "step": 625 }, { "epoch": 0.13, "learning_rate": 0.00029981915490719297, "loss": 0.0228, "step": 626 }, { "epoch": 0.13, "learning_rate": 0.0002998182020310895, "loss": 0.0321, "step": 627 }, { "epoch": 0.13, "learning_rate": 0.0002998172466527392, "loss": 0.0358, "step": 628 }, { "epoch": 0.13, "learning_rate": 0.00029981628877215815, "loss": 0.0452, "step": 629 }, { "epoch": 0.13, "learning_rate": 0.00029981532838936224, "loss": 0.0433, "step": 630 }, { "epoch": 0.13, "learning_rate": 0.0002998143655043676, "loss": 0.0464, "step": 631 }, { "epoch": 0.13, "learning_rate": 0.00029981340011719015, "loss": 0.0436, "step": 632 }, { "epoch": 0.13, "learning_rate": 0.0002998124322278462, "loss": 0.0535, "step": 633 }, { "epoch": 0.13, "learning_rate": 0.00029981146183635186, "loss": 0.0148, "step": 634 }, { "epoch": 0.13, "learning_rate": 0.0002998104889427233, "loss": 0.0248, "step": 635 }, { "epoch": 0.13, "learning_rate": 0.00029980951354697676, "loss": 0.0437, "step": 636 }, { "epoch": 0.13, "learning_rate": 0.00029980853564912855, "loss": 0.0598, "step": 637 }, { "epoch": 0.13, "learning_rate": 0.000299807555249195, "loss": 0.0357, "step": 638 }, { "epoch": 0.13, "learning_rate": 0.0002998065723471926, "loss": 0.0447, "step": 639 }, { "epoch": 0.13, "learning_rate": 0.00029980558694313753, "loss": 0.0148, "step": 640 }, { "epoch": 0.13, "learning_rate": 0.00029980459903704645, "loss": 0.0184, "step": 641 }, { "epoch": 0.13, "learning_rate": 0.0002998036086289358, "loss": 0.0552, "step": 642 }, { "epoch": 0.13, "learning_rate": 0.0002998026157188221, "loss": 0.0134, "step": 643 }, { "epoch": 0.13, "learning_rate": 0.00029980162030672193, "loss": 0.0302, "step": 644 }, { "epoch": 0.13, "learning_rate": 0.0002998006223926519, "loss": 0.0338, "step": 645 }, { "epoch": 0.13, "learning_rate": 0.0002997996219766288, "loss": 0.032, "step": 646 }, { "epoch": 0.13, "learning_rate": 0.0002997986190586692, "loss": 0.033, "step": 647 }, { "epoch": 0.13, "learning_rate": 0.0002997976136387899, "loss": 0.0426, "step": 648 }, { "epoch": 0.13, "learning_rate": 0.00029979660571700765, "loss": 0.0174, "step": 649 }, { "epoch": 0.13, "learning_rate": 0.00029979559529333936, "loss": 0.0441, "step": 650 }, { "epoch": 0.13, "learning_rate": 0.00029979458236780186, "loss": 0.0227, "step": 651 }, { "epoch": 0.13, "learning_rate": 0.00029979356694041206, "loss": 0.0296, "step": 652 }, { "epoch": 0.13, "learning_rate": 0.000299792549011187, "loss": 0.0278, "step": 653 }, { "epoch": 0.13, "learning_rate": 0.0002997915285801435, "loss": 0.0283, "step": 654 }, { "epoch": 0.13, "learning_rate": 0.00029979050564729885, "loss": 0.0601, "step": 655 }, { "epoch": 0.13, "learning_rate": 0.00029978948021266993, "loss": 0.0247, "step": 656 }, { "epoch": 0.13, "learning_rate": 0.00029978845227627394, "loss": 0.0216, "step": 657 }, { "epoch": 0.13, "learning_rate": 0.0002997874218381281, "loss": 0.0345, "step": 658 }, { "epoch": 0.13, "learning_rate": 0.00029978638889824956, "loss": 0.0316, "step": 659 }, { "epoch": 0.13, "learning_rate": 0.00029978535345665555, "loss": 0.0124, "step": 660 }, { "epoch": 0.13, "learning_rate": 0.0002997843155133634, "loss": 0.0101, "step": 661 }, { "epoch": 0.13, "learning_rate": 0.0002997832750683905, "loss": 0.0197, "step": 662 }, { "epoch": 0.13, "learning_rate": 0.0002997822321217541, "loss": 0.023, "step": 663 }, { "epoch": 0.14, "learning_rate": 0.00029978118667347176, "loss": 0.0145, "step": 664 }, { "epoch": 0.14, "learning_rate": 0.00029978013872356083, "loss": 0.0282, "step": 665 }, { "epoch": 0.14, "learning_rate": 0.0002997790882720388, "loss": 0.0491, "step": 666 }, { "epoch": 0.14, "learning_rate": 0.00029977803531892335, "loss": 0.0308, "step": 667 }, { "epoch": 0.14, "learning_rate": 0.00029977697986423193, "loss": 0.0098, "step": 668 }, { "epoch": 0.14, "learning_rate": 0.00029977592190798225, "loss": 0.0704, "step": 669 }, { "epoch": 0.14, "learning_rate": 0.000299774861450192, "loss": 0.0212, "step": 670 }, { "epoch": 0.14, "learning_rate": 0.00029977379849087875, "loss": 0.0185, "step": 671 }, { "epoch": 0.14, "learning_rate": 0.0002997727330300604, "loss": 0.0257, "step": 672 }, { "epoch": 0.14, "learning_rate": 0.00029977166506775467, "loss": 0.0259, "step": 673 }, { "epoch": 0.14, "learning_rate": 0.00029977059460397943, "loss": 0.018, "step": 674 }, { "epoch": 0.14, "learning_rate": 0.00029976952163875256, "loss": 0.0249, "step": 675 }, { "epoch": 0.14, "learning_rate": 0.00029976844617209196, "loss": 0.0179, "step": 676 }, { "epoch": 0.14, "learning_rate": 0.0002997673682040156, "loss": 0.0141, "step": 677 }, { "epoch": 0.14, "learning_rate": 0.0002997662877345415, "loss": 0.0367, "step": 678 }, { "epoch": 0.14, "learning_rate": 0.0002997652047636877, "loss": 0.0335, "step": 679 }, { "epoch": 0.14, "learning_rate": 0.0002997641192914722, "loss": 0.0296, "step": 680 }, { "epoch": 0.14, "learning_rate": 0.0002997630313179133, "loss": 0.0328, "step": 681 }, { "epoch": 0.14, "learning_rate": 0.00029976194084302903, "loss": 0.0206, "step": 682 }, { "epoch": 0.14, "learning_rate": 0.00029976084786683766, "loss": 0.0216, "step": 683 }, { "epoch": 0.14, "learning_rate": 0.00029975975238935744, "loss": 0.0287, "step": 684 }, { "epoch": 0.14, "learning_rate": 0.00029975865441060666, "loss": 0.0182, "step": 685 }, { "epoch": 0.14, "learning_rate": 0.00029975755393060364, "loss": 0.03, "step": 686 }, { "epoch": 0.14, "learning_rate": 0.0002997564509493668, "loss": 0.0349, "step": 687 }, { "epoch": 0.14, "learning_rate": 0.0002997553454669146, "loss": 0.043, "step": 688 }, { "epoch": 0.14, "learning_rate": 0.00029975423748326537, "loss": 0.0541, "step": 689 }, { "epoch": 0.14, "learning_rate": 0.00029975312699843774, "loss": 0.0298, "step": 690 }, { "epoch": 0.14, "learning_rate": 0.0002997520140124502, "loss": 0.0168, "step": 691 }, { "epoch": 0.14, "learning_rate": 0.00029975089852532136, "loss": 0.0332, "step": 692 }, { "epoch": 0.14, "learning_rate": 0.0002997497805370698, "loss": 0.027, "step": 693 }, { "epoch": 0.14, "learning_rate": 0.00029974866004771426, "loss": 0.0309, "step": 694 }, { "epoch": 0.14, "learning_rate": 0.0002997475370572734, "loss": 0.0244, "step": 695 }, { "epoch": 0.14, "learning_rate": 0.00029974641156576605, "loss": 0.0195, "step": 696 }, { "epoch": 0.14, "learning_rate": 0.0002997452835732109, "loss": 0.0339, "step": 697 }, { "epoch": 0.14, "learning_rate": 0.0002997441530796269, "loss": 0.0589, "step": 698 }, { "epoch": 0.14, "learning_rate": 0.00029974302008503286, "loss": 0.012, "step": 699 }, { "epoch": 0.14, "learning_rate": 0.0002997418845894477, "loss": 0.0427, "step": 700 }, { "epoch": 0.14, "learning_rate": 0.00029974074659289043, "loss": 0.0414, "step": 701 }, { "epoch": 0.14, "learning_rate": 0.0002997396060953801, "loss": 0.0322, "step": 702 }, { "epoch": 0.14, "learning_rate": 0.0002997384630969356, "loss": 0.01, "step": 703 }, { "epoch": 0.14, "learning_rate": 0.0002997373175975762, "loss": 0.0308, "step": 704 }, { "epoch": 0.14, "learning_rate": 0.0002997361695973209, "loss": 0.0362, "step": 705 }, { "epoch": 0.14, "learning_rate": 0.0002997350190961889, "loss": 0.0655, "step": 706 }, { "epoch": 0.14, "learning_rate": 0.00029973386609419945, "loss": 0.0695, "step": 707 }, { "epoch": 0.14, "learning_rate": 0.0002997327105913718, "loss": 0.0388, "step": 708 }, { "epoch": 0.14, "learning_rate": 0.0002997315525877253, "loss": 0.028, "step": 709 }, { "epoch": 0.14, "learning_rate": 0.0002997303920832791, "loss": 0.0412, "step": 710 }, { "epoch": 0.14, "learning_rate": 0.00029972922907805285, "loss": 0.0295, "step": 711 }, { "epoch": 0.14, "learning_rate": 0.00029972806357206577, "loss": 0.0816, "step": 712 }, { "epoch": 0.15, "learning_rate": 0.0002997268955653374, "loss": 0.0325, "step": 713 }, { "epoch": 0.15, "learning_rate": 0.00029972572505788725, "loss": 0.0783, "step": 714 }, { "epoch": 0.15, "learning_rate": 0.0002997245520497349, "loss": 0.0367, "step": 715 }, { "epoch": 0.15, "learning_rate": 0.00029972337654089986, "loss": 0.0079, "step": 716 }, { "epoch": 0.15, "learning_rate": 0.0002997221985314018, "loss": 0.0603, "step": 717 }, { "epoch": 0.15, "learning_rate": 0.00029972101802126045, "loss": 0.0231, "step": 718 }, { "epoch": 0.15, "learning_rate": 0.0002997198350104954, "loss": 0.0414, "step": 719 }, { "epoch": 0.15, "learning_rate": 0.0002997186494991266, "loss": 0.0447, "step": 720 }, { "epoch": 0.15, "learning_rate": 0.0002997174614871737, "loss": 0.0369, "step": 721 }, { "epoch": 0.15, "learning_rate": 0.00029971627097465656, "loss": 0.0504, "step": 722 }, { "epoch": 0.15, "learning_rate": 0.00029971507796159506, "loss": 0.0127, "step": 723 }, { "epoch": 0.15, "learning_rate": 0.0002997138824480092, "loss": 0.0367, "step": 724 }, { "epoch": 0.15, "learning_rate": 0.0002997126844339189, "loss": 0.0342, "step": 725 }, { "epoch": 0.15, "learning_rate": 0.00029971148391934413, "loss": 0.0391, "step": 726 }, { "epoch": 0.15, "learning_rate": 0.00029971028090430504, "loss": 0.0309, "step": 727 }, { "epoch": 0.15, "learning_rate": 0.0002997090753888216, "loss": 0.0405, "step": 728 }, { "epoch": 0.15, "learning_rate": 0.000299707867372914, "loss": 0.0288, "step": 729 }, { "epoch": 0.15, "learning_rate": 0.0002997066568566025, "loss": 0.011, "step": 730 }, { "epoch": 0.15, "learning_rate": 0.00029970544383990715, "loss": 0.0371, "step": 731 }, { "epoch": 0.15, "learning_rate": 0.00029970422832284834, "loss": 0.024, "step": 732 }, { "epoch": 0.15, "learning_rate": 0.00029970301030544634, "loss": 0.037, "step": 733 }, { "epoch": 0.15, "learning_rate": 0.0002997017897877214, "loss": 0.0245, "step": 734 }, { "epoch": 0.15, "learning_rate": 0.00029970056676969413, "loss": 0.0374, "step": 735 }, { "epoch": 0.15, "learning_rate": 0.00029969934125138474, "loss": 0.0475, "step": 736 }, { "epoch": 0.15, "learning_rate": 0.00029969811323281374, "loss": 0.0259, "step": 737 }, { "epoch": 0.15, "learning_rate": 0.00029969688271400173, "loss": 0.0134, "step": 738 }, { "epoch": 0.15, "learning_rate": 0.00029969564969496915, "loss": 0.0164, "step": 739 }, { "epoch": 0.15, "learning_rate": 0.00029969441417573666, "loss": 0.0053, "step": 740 }, { "epoch": 0.15, "learning_rate": 0.00029969317615632495, "loss": 0.0222, "step": 741 }, { "epoch": 0.15, "learning_rate": 0.0002996919356367546, "loss": 0.0462, "step": 742 }, { "epoch": 0.15, "learning_rate": 0.0002996906926170463, "loss": 0.0293, "step": 743 }, { "epoch": 0.15, "learning_rate": 0.00029968944709722096, "loss": 0.0102, "step": 744 }, { "epoch": 0.15, "learning_rate": 0.00029968819907729924, "loss": 0.0418, "step": 745 }, { "epoch": 0.15, "learning_rate": 0.0002996869485573021, "loss": 0.0567, "step": 746 }, { "epoch": 0.15, "learning_rate": 0.0002996856955372503, "loss": 0.0114, "step": 747 }, { "epoch": 0.15, "learning_rate": 0.0002996844400171649, "loss": 0.0108, "step": 748 }, { "epoch": 0.15, "learning_rate": 0.0002996831819970667, "loss": 0.0354, "step": 749 }, { "epoch": 0.15, "learning_rate": 0.00029968192147697686, "loss": 0.0417, "step": 750 }, { "epoch": 0.15, "learning_rate": 0.0002996806584569164, "loss": 0.051, "step": 751 }, { "epoch": 0.15, "learning_rate": 0.0002996793929369064, "loss": 0.0295, "step": 752 }, { "epoch": 0.15, "learning_rate": 0.00029967812491696805, "loss": 0.0255, "step": 753 }, { "epoch": 0.15, "learning_rate": 0.00029967685439712236, "loss": 0.026, "step": 754 }, { "epoch": 0.15, "learning_rate": 0.00029967558137739073, "loss": 0.0236, "step": 755 }, { "epoch": 0.15, "learning_rate": 0.0002996743058577944, "loss": 0.0405, "step": 756 }, { "epoch": 0.15, "learning_rate": 0.0002996730278383546, "loss": 0.03, "step": 757 }, { "epoch": 0.15, "learning_rate": 0.0002996717473190927, "loss": 0.1239, "step": 758 }, { "epoch": 0.15, "learning_rate": 0.00029967046430003005, "loss": 0.0206, "step": 759 }, { "epoch": 0.15, "learning_rate": 0.00029966917878118817, "loss": 0.0353, "step": 760 }, { "epoch": 0.15, "learning_rate": 0.00029966789076258846, "loss": 0.0369, "step": 761 }, { "epoch": 0.16, "learning_rate": 0.0002996666002442525, "loss": 0.0174, "step": 762 }, { "epoch": 0.16, "learning_rate": 0.0002996653072262018, "loss": 0.0366, "step": 763 }, { "epoch": 0.16, "learning_rate": 0.00029966401170845793, "loss": 0.064, "step": 764 }, { "epoch": 0.16, "learning_rate": 0.00029966271369104254, "loss": 0.0226, "step": 765 }, { "epoch": 0.16, "learning_rate": 0.0002996614131739773, "loss": 0.0349, "step": 766 }, { "epoch": 0.16, "learning_rate": 0.00029966011015728405, "loss": 0.0084, "step": 767 }, { "epoch": 0.16, "learning_rate": 0.0002996588046409844, "loss": 0.0565, "step": 768 }, { "epoch": 0.16, "learning_rate": 0.00029965749662510014, "loss": 0.0095, "step": 769 }, { "epoch": 0.16, "learning_rate": 0.00029965618610965333, "loss": 0.0826, "step": 770 }, { "epoch": 0.16, "learning_rate": 0.0002996548730946656, "loss": 0.0636, "step": 771 }, { "epoch": 0.16, "learning_rate": 0.00029965355758015906, "loss": 0.0113, "step": 772 }, { "epoch": 0.16, "learning_rate": 0.0002996522395661556, "loss": 0.0346, "step": 773 }, { "epoch": 0.16, "learning_rate": 0.0002996509190526772, "loss": 0.0271, "step": 774 }, { "epoch": 0.16, "learning_rate": 0.0002996495960397461, "loss": 0.0381, "step": 775 }, { "epoch": 0.16, "learning_rate": 0.00029964827052738415, "loss": 0.0404, "step": 776 }, { "epoch": 0.16, "learning_rate": 0.0002996469425156136, "loss": 0.0437, "step": 777 }, { "epoch": 0.16, "learning_rate": 0.0002996456120044567, "loss": 0.0462, "step": 778 }, { "epoch": 0.16, "learning_rate": 0.00029964427899393554, "loss": 0.0222, "step": 779 }, { "epoch": 0.16, "learning_rate": 0.0002996429434840725, "loss": 0.0427, "step": 780 }, { "epoch": 0.16, "learning_rate": 0.0002996416054748898, "loss": 0.0245, "step": 781 }, { "epoch": 0.16, "learning_rate": 0.0002996402649664098, "loss": 0.0216, "step": 782 }, { "epoch": 0.16, "learning_rate": 0.0002996389219586549, "loss": 0.03, "step": 783 }, { "epoch": 0.16, "learning_rate": 0.0002996375764516476, "loss": 0.0557, "step": 784 }, { "epoch": 0.16, "learning_rate": 0.00029963622844541026, "loss": 0.0772, "step": 785 }, { "epoch": 0.16, "learning_rate": 0.0002996348779399655, "loss": 0.0487, "step": 786 }, { "epoch": 0.16, "learning_rate": 0.00029963352493533576, "loss": 0.0473, "step": 787 }, { "epoch": 0.16, "learning_rate": 0.00029963216943154375, "loss": 0.0469, "step": 788 }, { "epoch": 0.16, "learning_rate": 0.0002996308114286121, "loss": 0.0508, "step": 789 }, { "epoch": 0.16, "learning_rate": 0.00029962945092656333, "loss": 0.039, "step": 790 }, { "epoch": 0.16, "learning_rate": 0.00029962808792542033, "loss": 0.0405, "step": 791 }, { "epoch": 0.16, "learning_rate": 0.00029962672242520586, "loss": 0.0416, "step": 792 }, { "epoch": 0.16, "learning_rate": 0.0002996253544259426, "loss": 0.0296, "step": 793 }, { "epoch": 0.16, "learning_rate": 0.0002996239839276536, "loss": 0.016, "step": 794 }, { "epoch": 0.16, "learning_rate": 0.00029962261093036157, "loss": 0.0204, "step": 795 }, { "epoch": 0.16, "learning_rate": 0.0002996212354340895, "loss": 0.0325, "step": 796 }, { "epoch": 0.16, "learning_rate": 0.0002996198574388604, "loss": 0.0753, "step": 797 }, { "epoch": 0.16, "learning_rate": 0.00029961847694469725, "loss": 0.0461, "step": 798 }, { "epoch": 0.16, "learning_rate": 0.0002996170939516231, "loss": 0.0342, "step": 799 }, { "epoch": 0.16, "learning_rate": 0.00029961570845966104, "loss": 0.0445, "step": 800 }, { "epoch": 0.16, "learning_rate": 0.00029961432046883427, "loss": 0.0296, "step": 801 }, { "epoch": 0.16, "learning_rate": 0.0002996129299791658, "loss": 0.0125, "step": 802 }, { "epoch": 0.16, "learning_rate": 0.00029961153699067917, "loss": 0.0372, "step": 803 }, { "epoch": 0.16, "learning_rate": 0.00029961014150339734, "loss": 0.0288, "step": 804 }, { "epoch": 0.16, "learning_rate": 0.0002996087435173438, "loss": 0.0355, "step": 805 }, { "epoch": 0.16, "learning_rate": 0.0002996073430325418, "loss": 0.009, "step": 806 }, { "epoch": 0.16, "learning_rate": 0.0002996059400490148, "loss": 0.0416, "step": 807 }, { "epoch": 0.16, "learning_rate": 0.00029960453456678615, "loss": 0.0325, "step": 808 }, { "epoch": 0.16, "learning_rate": 0.00029960312658587943, "loss": 0.0363, "step": 809 }, { "epoch": 0.16, "learning_rate": 0.00029960171610631805, "loss": 0.0403, "step": 810 }, { "epoch": 0.17, "learning_rate": 0.00029960030312812565, "loss": 0.0262, "step": 811 }, { "epoch": 0.17, "learning_rate": 0.0002995988876513258, "loss": 0.037, "step": 812 }, { "epoch": 0.17, "learning_rate": 0.00029959746967594215, "loss": 0.0252, "step": 813 }, { "epoch": 0.17, "learning_rate": 0.00029959604920199833, "loss": 0.016, "step": 814 }, { "epoch": 0.17, "learning_rate": 0.0002995946262295181, "loss": 0.0371, "step": 815 }, { "epoch": 0.17, "learning_rate": 0.0002995932007585252, "loss": 0.0137, "step": 816 }, { "epoch": 0.17, "learning_rate": 0.00029959177278904357, "loss": 0.0085, "step": 817 }, { "epoch": 0.17, "learning_rate": 0.00029959034232109695, "loss": 0.0232, "step": 818 }, { "epoch": 0.17, "learning_rate": 0.0002995889093547092, "loss": 0.0628, "step": 819 }, { "epoch": 0.17, "learning_rate": 0.0002995874738899043, "loss": 0.0109, "step": 820 }, { "epoch": 0.17, "learning_rate": 0.0002995860359267062, "loss": 0.0215, "step": 821 }, { "epoch": 0.17, "learning_rate": 0.000299584595465139, "loss": 0.0364, "step": 822 }, { "epoch": 0.17, "learning_rate": 0.0002995831525052266, "loss": 0.0241, "step": 823 }, { "epoch": 0.17, "learning_rate": 0.00029958170704699326, "loss": 0.0532, "step": 824 }, { "epoch": 0.17, "learning_rate": 0.0002995802590904631, "loss": 0.0646, "step": 825 }, { "epoch": 0.17, "learning_rate": 0.00029957880863566017, "loss": 0.0351, "step": 826 }, { "epoch": 0.17, "learning_rate": 0.00029957735568260884, "loss": 0.0538, "step": 827 }, { "epoch": 0.17, "learning_rate": 0.0002995759002313333, "loss": 0.0193, "step": 828 }, { "epoch": 0.17, "learning_rate": 0.00029957444228185783, "loss": 0.056, "step": 829 }, { "epoch": 0.17, "learning_rate": 0.00029957298183420694, "loss": 0.0151, "step": 830 }, { "epoch": 0.17, "learning_rate": 0.0002995715188884049, "loss": 0.0342, "step": 831 }, { "epoch": 0.17, "learning_rate": 0.0002995700534444761, "loss": 0.0338, "step": 832 }, { "epoch": 0.17, "learning_rate": 0.0002995685855024451, "loss": 0.0215, "step": 833 }, { "epoch": 0.17, "learning_rate": 0.0002995671150623364, "loss": 0.0162, "step": 834 }, { "epoch": 0.17, "learning_rate": 0.0002995656421241745, "loss": 0.0217, "step": 835 }, { "epoch": 0.17, "learning_rate": 0.00029956416668798405, "loss": 0.0401, "step": 836 }, { "epoch": 0.17, "learning_rate": 0.00029956268875378975, "loss": 0.0738, "step": 837 }, { "epoch": 0.17, "learning_rate": 0.0002995612083216162, "loss": 0.0364, "step": 838 }, { "epoch": 0.17, "learning_rate": 0.0002995597253914882, "loss": 0.0432, "step": 839 }, { "epoch": 0.17, "learning_rate": 0.0002995582399634304, "loss": 0.04, "step": 840 }, { "epoch": 0.17, "learning_rate": 0.00029955675203746776, "loss": 0.1019, "step": 841 }, { "epoch": 0.17, "learning_rate": 0.000299555261613625, "loss": 0.0194, "step": 842 }, { "epoch": 0.17, "learning_rate": 0.0002995537686919271, "loss": 0.0304, "step": 843 }, { "epoch": 0.17, "learning_rate": 0.0002995522732723989, "loss": 0.0208, "step": 844 }, { "epoch": 0.17, "learning_rate": 0.00029955077535506546, "loss": 0.0324, "step": 845 }, { "epoch": 0.17, "learning_rate": 0.0002995492749399518, "loss": 0.0547, "step": 846 }, { "epoch": 0.17, "learning_rate": 0.00029954777202708294, "loss": 0.0198, "step": 847 }, { "epoch": 0.17, "learning_rate": 0.000299546266616484, "loss": 0.0215, "step": 848 }, { "epoch": 0.17, "learning_rate": 0.0002995447587081801, "loss": 0.0268, "step": 849 }, { "epoch": 0.17, "learning_rate": 0.0002995432483021965, "loss": 0.0152, "step": 850 }, { "epoch": 0.17, "learning_rate": 0.0002995417353985583, "loss": 0.0227, "step": 851 }, { "epoch": 0.17, "learning_rate": 0.0002995402199972909, "loss": 0.0546, "step": 852 }, { "epoch": 0.17, "learning_rate": 0.00029953870209841946, "loss": 0.0295, "step": 853 }, { "epoch": 0.17, "learning_rate": 0.0002995371817019695, "loss": 0.0514, "step": 854 }, { "epoch": 0.17, "learning_rate": 0.0002995356588079663, "loss": 0.0412, "step": 855 }, { "epoch": 0.17, "learning_rate": 0.00029953413341643535, "loss": 0.0225, "step": 856 }, { "epoch": 0.17, "learning_rate": 0.0002995326055274021, "loss": 0.0123, "step": 857 }, { "epoch": 0.17, "learning_rate": 0.00029953107514089206, "loss": 0.013, "step": 858 }, { "epoch": 0.17, "learning_rate": 0.00029952954225693086, "loss": 0.011, "step": 859 }, { "epoch": 0.18, "learning_rate": 0.000299528006875544, "loss": 0.0108, "step": 860 }, { "epoch": 0.18, "learning_rate": 0.00029952646899675717, "loss": 0.0363, "step": 861 }, { "epoch": 0.18, "learning_rate": 0.00029952492862059607, "loss": 0.0217, "step": 862 }, { "epoch": 0.18, "learning_rate": 0.0002995233857470864, "loss": 0.0409, "step": 863 }, { "epoch": 0.18, "learning_rate": 0.00029952184037625396, "loss": 0.0524, "step": 864 }, { "epoch": 0.18, "learning_rate": 0.0002995202925081245, "loss": 0.0636, "step": 865 }, { "epoch": 0.18, "learning_rate": 0.00029951874214272393, "loss": 0.0259, "step": 866 }, { "epoch": 0.18, "learning_rate": 0.00029951718928007817, "loss": 0.0419, "step": 867 }, { "epoch": 0.18, "learning_rate": 0.0002995156339202131, "loss": 0.0169, "step": 868 }, { "epoch": 0.18, "learning_rate": 0.0002995140760631547, "loss": 0.0421, "step": 869 }, { "epoch": 0.18, "learning_rate": 0.00029951251570892905, "loss": 0.0188, "step": 870 }, { "epoch": 0.18, "learning_rate": 0.00029951095285756207, "loss": 0.027, "step": 871 }, { "epoch": 0.18, "learning_rate": 0.00029950938750908005, "loss": 0.0159, "step": 872 }, { "epoch": 0.18, "learning_rate": 0.00029950781966350896, "loss": 0.0328, "step": 873 }, { "epoch": 0.18, "learning_rate": 0.00029950624932087515, "loss": 0.048, "step": 874 }, { "epoch": 0.18, "learning_rate": 0.0002995046764812047, "loss": 0.0166, "step": 875 }, { "epoch": 0.18, "learning_rate": 0.0002995031011445239, "loss": 0.0297, "step": 876 }, { "epoch": 0.18, "learning_rate": 0.0002995015233108592, "loss": 0.0411, "step": 877 }, { "epoch": 0.18, "learning_rate": 0.0002994999429802368, "loss": 0.0398, "step": 878 }, { "epoch": 0.18, "learning_rate": 0.0002994983601526832, "loss": 0.028, "step": 879 }, { "epoch": 0.18, "learning_rate": 0.00029949677482822475, "loss": 0.0097, "step": 880 }, { "epoch": 0.18, "learning_rate": 0.000299495187006888, "loss": 0.1199, "step": 881 }, { "epoch": 0.18, "learning_rate": 0.0002994935966886994, "loss": 0.0205, "step": 882 }, { "epoch": 0.18, "learning_rate": 0.00029949200387368555, "loss": 0.0107, "step": 883 }, { "epoch": 0.18, "learning_rate": 0.00029949040856187305, "loss": 0.0171, "step": 884 }, { "epoch": 0.18, "learning_rate": 0.0002994888107532885, "loss": 0.0431, "step": 885 }, { "epoch": 0.18, "learning_rate": 0.00029948721044795873, "loss": 0.0396, "step": 886 }, { "epoch": 0.18, "learning_rate": 0.0002994856076459103, "loss": 0.0143, "step": 887 }, { "epoch": 0.18, "learning_rate": 0.0002994840023471701, "loss": 0.0127, "step": 888 }, { "epoch": 0.18, "learning_rate": 0.0002994823945517648, "loss": 0.1093, "step": 889 }, { "epoch": 0.18, "learning_rate": 0.00029948078425972137, "loss": 0.0169, "step": 890 }, { "epoch": 0.18, "learning_rate": 0.00029947917147106674, "loss": 0.0382, "step": 891 }, { "epoch": 0.18, "learning_rate": 0.00029947755618582773, "loss": 0.0352, "step": 892 }, { "epoch": 0.18, "learning_rate": 0.0002994759384040314, "loss": 0.0134, "step": 893 }, { "epoch": 0.18, "learning_rate": 0.00029947431812570475, "loss": 0.0241, "step": 894 }, { "epoch": 0.18, "learning_rate": 0.0002994726953508748, "loss": 0.0276, "step": 895 }, { "epoch": 0.18, "learning_rate": 0.0002994710700795687, "loss": 0.0196, "step": 896 }, { "epoch": 0.18, "learning_rate": 0.0002994694423118136, "loss": 0.0149, "step": 897 }, { "epoch": 0.18, "learning_rate": 0.00029946781204763664, "loss": 0.0427, "step": 898 }, { "epoch": 0.18, "learning_rate": 0.00029946617928706514, "loss": 0.0332, "step": 899 }, { "epoch": 0.18, "learning_rate": 0.0002994645440301262, "loss": 0.0441, "step": 900 }, { "epoch": 0.18, "learning_rate": 0.00029946290627684736, "loss": 0.0209, "step": 901 }, { "epoch": 0.18, "learning_rate": 0.0002994612660272558, "loss": 0.0303, "step": 902 }, { "epoch": 0.18, "learning_rate": 0.00029945962328137895, "loss": 0.0243, "step": 903 }, { "epoch": 0.18, "learning_rate": 0.00029945797803924425, "loss": 0.0141, "step": 904 }, { "epoch": 0.18, "learning_rate": 0.00029945633030087923, "loss": 0.0187, "step": 905 }, { "epoch": 0.18, "learning_rate": 0.00029945468006631137, "loss": 0.0146, "step": 906 }, { "epoch": 0.18, "learning_rate": 0.00029945302733556825, "loss": 0.0421, "step": 907 }, { "epoch": 0.18, "learning_rate": 0.0002994513721086775, "loss": 0.0234, "step": 908 }, { "epoch": 0.19, "learning_rate": 0.00029944971438566664, "loss": 0.0551, "step": 909 }, { "epoch": 0.19, "learning_rate": 0.0002994480541665635, "loss": 0.0537, "step": 910 }, { "epoch": 0.19, "learning_rate": 0.00029944639145139575, "loss": 0.0314, "step": 911 }, { "epoch": 0.19, "learning_rate": 0.00029944472624019114, "loss": 0.0122, "step": 912 }, { "epoch": 0.19, "learning_rate": 0.0002994430585329775, "loss": 0.0172, "step": 913 }, { "epoch": 0.19, "learning_rate": 0.0002994413883297827, "loss": 0.0479, "step": 914 }, { "epoch": 0.19, "learning_rate": 0.00029943971563063464, "loss": 0.0876, "step": 915 }, { "epoch": 0.19, "learning_rate": 0.0002994380404355612, "loss": 0.0365, "step": 916 }, { "epoch": 0.19, "learning_rate": 0.0002994363627445904, "loss": 0.032, "step": 917 }, { "epoch": 0.19, "learning_rate": 0.00029943468255775034, "loss": 0.017, "step": 918 }, { "epoch": 0.19, "learning_rate": 0.00029943299987506895, "loss": 0.0098, "step": 919 }, { "epoch": 0.19, "learning_rate": 0.00029943131469657437, "loss": 0.0201, "step": 920 }, { "epoch": 0.19, "learning_rate": 0.0002994296270222948, "loss": 0.071, "step": 921 }, { "epoch": 0.19, "learning_rate": 0.0002994279368522584, "loss": 0.0509, "step": 922 }, { "epoch": 0.19, "learning_rate": 0.00029942624418649333, "loss": 0.013, "step": 923 }, { "epoch": 0.19, "learning_rate": 0.000299424549025028, "loss": 0.0351, "step": 924 }, { "epoch": 0.19, "learning_rate": 0.00029942285136789055, "loss": 0.0187, "step": 925 }, { "epoch": 0.19, "learning_rate": 0.00029942115121510946, "loss": 0.0498, "step": 926 }, { "epoch": 0.19, "learning_rate": 0.0002994194485667131, "loss": 0.0208, "step": 927 }, { "epoch": 0.19, "learning_rate": 0.0002994177434227299, "loss": 0.0641, "step": 928 }, { "epoch": 0.19, "learning_rate": 0.00029941603578318836, "loss": 0.0428, "step": 929 }, { "epoch": 0.19, "learning_rate": 0.000299414325648117, "loss": 0.0225, "step": 930 }, { "epoch": 0.19, "learning_rate": 0.0002994126130175443, "loss": 0.0417, "step": 931 }, { "epoch": 0.19, "learning_rate": 0.0002994108978914989, "loss": 0.0198, "step": 932 }, { "epoch": 0.19, "learning_rate": 0.0002994091802700096, "loss": 0.0406, "step": 933 }, { "epoch": 0.19, "learning_rate": 0.0002994074601531048, "loss": 0.0073, "step": 934 }, { "epoch": 0.19, "learning_rate": 0.0002994057375408135, "loss": 0.0173, "step": 935 }, { "epoch": 0.19, "learning_rate": 0.0002994040124331644, "loss": 0.0643, "step": 936 }, { "epoch": 0.19, "learning_rate": 0.0002994022848301862, "loss": 0.0251, "step": 937 }, { "epoch": 0.19, "learning_rate": 0.0002994005547319078, "loss": 0.0148, "step": 938 }, { "epoch": 0.19, "learning_rate": 0.00029939882213835813, "loss": 0.0332, "step": 939 }, { "epoch": 0.19, "learning_rate": 0.00029939708704956614, "loss": 0.044, "step": 940 }, { "epoch": 0.19, "learning_rate": 0.0002993953494655608, "loss": 0.0091, "step": 941 }, { "epoch": 0.19, "learning_rate": 0.0002993936093863711, "loss": 0.031, "step": 942 }, { "epoch": 0.19, "learning_rate": 0.00029939186681202616, "loss": 0.1274, "step": 943 }, { "epoch": 0.19, "learning_rate": 0.000299390121742555, "loss": 0.0566, "step": 944 }, { "epoch": 0.19, "learning_rate": 0.0002993883741779868, "loss": 0.0291, "step": 945 }, { "epoch": 0.19, "learning_rate": 0.0002993866241183508, "loss": 0.0287, "step": 946 }, { "epoch": 0.19, "learning_rate": 0.00029938487156367624, "loss": 0.0353, "step": 947 }, { "epoch": 0.19, "learning_rate": 0.00029938311651399226, "loss": 0.0152, "step": 948 }, { "epoch": 0.19, "learning_rate": 0.0002993813589693283, "loss": 0.0099, "step": 949 }, { "epoch": 0.19, "learning_rate": 0.00029937959892971367, "loss": 0.0122, "step": 950 }, { "epoch": 0.19, "learning_rate": 0.0002993778363951777, "loss": 0.022, "step": 951 }, { "epoch": 0.19, "learning_rate": 0.0002993760713657499, "loss": 0.0586, "step": 952 }, { "epoch": 0.19, "learning_rate": 0.0002993743038414598, "loss": 0.0309, "step": 953 }, { "epoch": 0.19, "learning_rate": 0.00029937253382233687, "loss": 0.0688, "step": 954 }, { "epoch": 0.19, "learning_rate": 0.0002993707613084106, "loss": 0.0254, "step": 955 }, { "epoch": 0.19, "learning_rate": 0.0002993689862997107, "loss": 0.0831, "step": 956 }, { "epoch": 0.19, "learning_rate": 0.00029936720879626677, "loss": 0.0339, "step": 957 }, { "epoch": 0.2, "learning_rate": 0.0002993654287981085, "loss": 0.0133, "step": 958 }, { "epoch": 0.2, "learning_rate": 0.0002993636463052656, "loss": 0.0186, "step": 959 }, { "epoch": 0.2, "learning_rate": 0.0002993618613177679, "loss": 0.0345, "step": 960 }, { "epoch": 0.2, "learning_rate": 0.00029936007383564515, "loss": 0.0288, "step": 961 }, { "epoch": 0.2, "learning_rate": 0.00029935828385892725, "loss": 0.0329, "step": 962 }, { "epoch": 0.2, "learning_rate": 0.00029935649138764403, "loss": 0.0164, "step": 963 }, { "epoch": 0.2, "learning_rate": 0.00029935469642182553, "loss": 0.0177, "step": 964 }, { "epoch": 0.2, "learning_rate": 0.0002993528989615016, "loss": 0.018, "step": 965 }, { "epoch": 0.2, "learning_rate": 0.0002993510990067024, "loss": 0.0508, "step": 966 }, { "epoch": 0.2, "learning_rate": 0.0002993492965574579, "loss": 0.0167, "step": 967 }, { "epoch": 0.2, "learning_rate": 0.0002993474916137983, "loss": 0.0174, "step": 968 }, { "epoch": 0.2, "learning_rate": 0.0002993456841757536, "loss": 0.0286, "step": 969 }, { "epoch": 0.2, "learning_rate": 0.00029934387424335407, "loss": 0.0337, "step": 970 }, { "epoch": 0.2, "learning_rate": 0.00029934206181662996, "loss": 0.0391, "step": 971 }, { "epoch": 0.2, "learning_rate": 0.0002993402468956115, "loss": 0.0324, "step": 972 }, { "epoch": 0.2, "learning_rate": 0.000299338429480329, "loss": 0.0938, "step": 973 }, { "epoch": 0.2, "learning_rate": 0.00029933660957081286, "loss": 0.0297, "step": 974 }, { "epoch": 0.2, "learning_rate": 0.00029933478716709345, "loss": 0.0291, "step": 975 }, { "epoch": 0.2, "learning_rate": 0.0002993329622692012, "loss": 0.0125, "step": 976 }, { "epoch": 0.2, "learning_rate": 0.0002993311348771666, "loss": 0.0538, "step": 977 }, { "epoch": 0.2, "learning_rate": 0.0002993293049910201, "loss": 0.0194, "step": 978 }, { "epoch": 0.2, "learning_rate": 0.0002993274726107924, "loss": 0.0325, "step": 979 }, { "epoch": 0.2, "learning_rate": 0.00029932563773651396, "loss": 0.0112, "step": 980 }, { "epoch": 0.2, "learning_rate": 0.0002993238003682156, "loss": 0.0143, "step": 981 }, { "epoch": 0.2, "learning_rate": 0.0002993219605059278, "loss": 0.0374, "step": 982 }, { "epoch": 0.2, "learning_rate": 0.0002993201181496815, "loss": 0.0258, "step": 983 }, { "epoch": 0.2, "learning_rate": 0.00029931827329950723, "loss": 0.0235, "step": 984 }, { "epoch": 0.2, "learning_rate": 0.00029931642595543606, "loss": 0.029, "step": 985 }, { "epoch": 0.2, "learning_rate": 0.00029931457611749867, "loss": 0.0441, "step": 986 }, { "epoch": 0.2, "learning_rate": 0.000299312723785726, "loss": 0.0173, "step": 987 }, { "epoch": 0.2, "learning_rate": 0.00029931086896014907, "loss": 0.0475, "step": 988 }, { "epoch": 0.2, "learning_rate": 0.0002993090116407987, "loss": 0.0489, "step": 989 }, { "epoch": 0.2, "learning_rate": 0.000299307151827706, "loss": 0.0337, "step": 990 }, { "epoch": 0.2, "learning_rate": 0.0002993052895209021, "loss": 0.0263, "step": 991 }, { "epoch": 0.2, "learning_rate": 0.00029930342472041796, "loss": 0.0647, "step": 992 }, { "epoch": 0.2, "learning_rate": 0.0002993015574262848, "loss": 0.0486, "step": 993 }, { "epoch": 0.2, "learning_rate": 0.00029929968763853384, "loss": 0.0253, "step": 994 }, { "epoch": 0.2, "learning_rate": 0.0002992978153571963, "loss": 0.0089, "step": 995 }, { "epoch": 0.2, "learning_rate": 0.00029929594058230333, "loss": 0.0169, "step": 996 }, { "epoch": 0.2, "learning_rate": 0.0002992940633138864, "loss": 0.011, "step": 997 }, { "epoch": 0.2, "learning_rate": 0.0002992921835519767, "loss": 0.0192, "step": 998 }, { "epoch": 0.2, "learning_rate": 0.0002992903012966059, "loss": 0.0343, "step": 999 }, { "epoch": 0.2, "learning_rate": 0.00029928841654780513, "loss": 0.0999, "step": 1000 }, { "epoch": 0.2, "learning_rate": 0.0002992865293056061, "loss": 0.0121, "step": 1001 }, { "epoch": 0.2, "learning_rate": 0.00029928463957004013, "loss": 0.0408, "step": 1002 }, { "epoch": 0.2, "learning_rate": 0.00029928274734113895, "loss": 0.0253, "step": 1003 }, { "epoch": 0.2, "learning_rate": 0.0002992808526189341, "loss": 0.0261, "step": 1004 }, { "epoch": 0.2, "learning_rate": 0.0002992789554034572, "loss": 0.0291, "step": 1005 }, { "epoch": 0.2, "learning_rate": 0.00029927705569473997, "loss": 0.0601, "step": 1006 }, { "epoch": 0.21, "learning_rate": 0.0002992751534928141, "loss": 0.0287, "step": 1007 }, { "epoch": 0.21, "learning_rate": 0.00029927324879771146, "loss": 0.0151, "step": 1008 }, { "epoch": 0.21, "learning_rate": 0.0002992713416094637, "loss": 0.0269, "step": 1009 }, { "epoch": 0.21, "learning_rate": 0.0002992694319281028, "loss": 0.02, "step": 1010 }, { "epoch": 0.21, "learning_rate": 0.00029926751975366066, "loss": 0.047, "step": 1011 }, { "epoch": 0.21, "learning_rate": 0.0002992656050861691, "loss": 0.0362, "step": 1012 }, { "epoch": 0.21, "learning_rate": 0.00029926368792566025, "loss": 0.0204, "step": 1013 }, { "epoch": 0.21, "learning_rate": 0.00029926176827216604, "loss": 0.0788, "step": 1014 }, { "epoch": 0.21, "learning_rate": 0.00029925984612571855, "loss": 0.0261, "step": 1015 }, { "epoch": 0.21, "learning_rate": 0.0002992579214863499, "loss": 0.0421, "step": 1016 }, { "epoch": 0.21, "learning_rate": 0.00029925599435409213, "loss": 0.022, "step": 1017 }, { "epoch": 0.21, "learning_rate": 0.0002992540647289776, "loss": 0.028, "step": 1018 }, { "epoch": 0.21, "learning_rate": 0.00029925213261103843, "loss": 0.0803, "step": 1019 }, { "epoch": 0.21, "learning_rate": 0.00029925019800030694, "loss": 0.0408, "step": 1020 }, { "epoch": 0.21, "learning_rate": 0.0002992482608968154, "loss": 0.0088, "step": 1021 }, { "epoch": 0.21, "learning_rate": 0.00029924632130059613, "loss": 0.0283, "step": 1022 }, { "epoch": 0.21, "learning_rate": 0.0002992443792116816, "loss": 0.0096, "step": 1023 }, { "epoch": 0.21, "learning_rate": 0.0002992424346301042, "loss": 0.0151, "step": 1024 }, { "epoch": 0.21, "learning_rate": 0.00029924048755589647, "loss": 0.0586, "step": 1025 }, { "epoch": 0.21, "learning_rate": 0.00029923853798909084, "loss": 0.0282, "step": 1026 }, { "epoch": 0.21, "learning_rate": 0.0002992365859297199, "loss": 0.0243, "step": 1027 }, { "epoch": 0.21, "learning_rate": 0.0002992346313778164, "loss": 0.0313, "step": 1028 }, { "epoch": 0.21, "learning_rate": 0.0002992326743334127, "loss": 0.0223, "step": 1029 }, { "epoch": 0.21, "learning_rate": 0.0002992307147965418, "loss": 0.033, "step": 1030 }, { "epoch": 0.21, "learning_rate": 0.00029922875276723615, "loss": 0.0164, "step": 1031 }, { "epoch": 0.21, "learning_rate": 0.0002992267882455286, "loss": 0.0289, "step": 1032 }, { "epoch": 0.21, "learning_rate": 0.0002992248212314521, "loss": 0.0206, "step": 1033 }, { "epoch": 0.21, "learning_rate": 0.0002992228517250394, "loss": 0.0388, "step": 1034 }, { "epoch": 0.21, "learning_rate": 0.00029922087972632336, "loss": 0.0074, "step": 1035 }, { "epoch": 0.21, "learning_rate": 0.00029921890523533696, "loss": 0.0461, "step": 1036 }, { "epoch": 0.21, "learning_rate": 0.00029921692825211313, "loss": 0.0137, "step": 1037 }, { "epoch": 0.21, "learning_rate": 0.000299214948776685, "loss": 0.0109, "step": 1038 }, { "epoch": 0.21, "learning_rate": 0.0002992129668090855, "loss": 0.0362, "step": 1039 }, { "epoch": 0.21, "learning_rate": 0.00029921098234934787, "loss": 0.0648, "step": 1040 }, { "epoch": 0.21, "learning_rate": 0.0002992089953975051, "loss": 0.0326, "step": 1041 }, { "epoch": 0.21, "learning_rate": 0.00029920700595359055, "loss": 0.0308, "step": 1042 }, { "epoch": 0.21, "learning_rate": 0.0002992050140176373, "loss": 0.0315, "step": 1043 }, { "epoch": 0.21, "learning_rate": 0.0002992030195896787, "loss": 0.0216, "step": 1044 }, { "epoch": 0.21, "learning_rate": 0.000299201022669748, "loss": 0.0097, "step": 1045 }, { "epoch": 0.21, "learning_rate": 0.0002991990232578786, "loss": 0.0193, "step": 1046 }, { "epoch": 0.21, "learning_rate": 0.0002991970213541039, "loss": 0.082, "step": 1047 }, { "epoch": 0.21, "learning_rate": 0.00029919501695845725, "loss": 0.0219, "step": 1048 }, { "epoch": 0.21, "learning_rate": 0.0002991930100709722, "loss": 0.0216, "step": 1049 }, { "epoch": 0.21, "learning_rate": 0.00029919100069168226, "loss": 0.0394, "step": 1050 }, { "epoch": 0.21, "learning_rate": 0.000299188988820621, "loss": 0.0525, "step": 1051 }, { "epoch": 0.21, "learning_rate": 0.00029918697445782206, "loss": 0.0052, "step": 1052 }, { "epoch": 0.21, "learning_rate": 0.000299184957603319, "loss": 0.0644, "step": 1053 }, { "epoch": 0.21, "learning_rate": 0.00029918293825714553, "loss": 0.05, "step": 1054 }, { "epoch": 0.21, "learning_rate": 0.0002991809164193354, "loss": 0.0306, "step": 1055 }, { "epoch": 0.22, "learning_rate": 0.0002991788920899224, "loss": 0.0426, "step": 1056 }, { "epoch": 0.22, "learning_rate": 0.0002991768652689403, "loss": 0.0056, "step": 1057 }, { "epoch": 0.22, "learning_rate": 0.00029917483595642293, "loss": 0.0134, "step": 1058 }, { "epoch": 0.22, "learning_rate": 0.0002991728041524042, "loss": 0.0369, "step": 1059 }, { "epoch": 0.22, "learning_rate": 0.0002991707698569181, "loss": 0.0306, "step": 1060 }, { "epoch": 0.22, "learning_rate": 0.00029916873306999847, "loss": 0.009, "step": 1061 }, { "epoch": 0.22, "learning_rate": 0.00029916669379167956, "loss": 0.0147, "step": 1062 }, { "epoch": 0.22, "learning_rate": 0.0002991646520219952, "loss": 0.0318, "step": 1063 }, { "epoch": 0.22, "learning_rate": 0.00029916260776097957, "loss": 0.0146, "step": 1064 }, { "epoch": 0.22, "learning_rate": 0.0002991605610086669, "loss": 0.033, "step": 1065 }, { "epoch": 0.22, "learning_rate": 0.00029915851176509124, "loss": 0.0121, "step": 1066 }, { "epoch": 0.22, "learning_rate": 0.0002991564600302869, "loss": 0.0536, "step": 1067 }, { "epoch": 0.22, "learning_rate": 0.0002991544058042881, "loss": 0.018, "step": 1068 }, { "epoch": 0.22, "learning_rate": 0.0002991523490871292, "loss": 0.0421, "step": 1069 }, { "epoch": 0.22, "learning_rate": 0.00029915028987884454, "loss": 0.0165, "step": 1070 }, { "epoch": 0.22, "learning_rate": 0.0002991482281794685, "loss": 0.0337, "step": 1071 }, { "epoch": 0.22, "learning_rate": 0.0002991461639890355, "loss": 0.0248, "step": 1072 }, { "epoch": 0.22, "learning_rate": 0.00029914409730758, "loss": 0.0178, "step": 1073 }, { "epoch": 0.22, "learning_rate": 0.00029914202813513654, "loss": 0.034, "step": 1074 }, { "epoch": 0.22, "learning_rate": 0.0002991399564717397, "loss": 0.0216, "step": 1075 }, { "epoch": 0.22, "learning_rate": 0.0002991378823174241, "loss": 0.0225, "step": 1076 }, { "epoch": 0.22, "learning_rate": 0.0002991358056722243, "loss": 0.017, "step": 1077 }, { "epoch": 0.22, "learning_rate": 0.00029913372653617506, "loss": 0.0257, "step": 1078 }, { "epoch": 0.22, "learning_rate": 0.0002991316449093111, "loss": 0.0131, "step": 1079 }, { "epoch": 0.22, "learning_rate": 0.00029912956079166715, "loss": 0.0362, "step": 1080 }, { "epoch": 0.22, "learning_rate": 0.000299127474183278, "loss": 0.0309, "step": 1081 }, { "epoch": 0.22, "learning_rate": 0.00029912538508417854, "loss": 0.0258, "step": 1082 }, { "epoch": 0.22, "learning_rate": 0.0002991232934944037, "loss": 0.0073, "step": 1083 }, { "epoch": 0.22, "learning_rate": 0.0002991211994139883, "loss": 0.0065, "step": 1084 }, { "epoch": 0.22, "learning_rate": 0.00029911910284296747, "loss": 0.032, "step": 1085 }, { "epoch": 0.22, "learning_rate": 0.00029911700378137604, "loss": 0.0233, "step": 1086 }, { "epoch": 0.22, "learning_rate": 0.0002991149022292492, "loss": 0.0878, "step": 1087 }, { "epoch": 0.22, "learning_rate": 0.0002991127981866221, "loss": 0.017, "step": 1088 }, { "epoch": 0.22, "learning_rate": 0.0002991106916535297, "loss": 0.0169, "step": 1089 }, { "epoch": 0.22, "learning_rate": 0.0002991085826300073, "loss": 0.0286, "step": 1090 }, { "epoch": 0.22, "learning_rate": 0.00029910647111609014, "loss": 0.0355, "step": 1091 }, { "epoch": 0.22, "learning_rate": 0.00029910435711181344, "loss": 0.0286, "step": 1092 }, { "epoch": 0.22, "learning_rate": 0.0002991022406172125, "loss": 0.0353, "step": 1093 }, { "epoch": 0.22, "learning_rate": 0.00029910012163232276, "loss": 0.0502, "step": 1094 }, { "epoch": 0.22, "learning_rate": 0.0002990980001571795, "loss": 0.1432, "step": 1095 }, { "epoch": 0.22, "learning_rate": 0.0002990958761918182, "loss": 0.0148, "step": 1096 }, { "epoch": 0.22, "learning_rate": 0.0002990937497362743, "loss": 0.0159, "step": 1097 }, { "epoch": 0.22, "learning_rate": 0.00029909162079058335, "loss": 0.057, "step": 1098 }, { "epoch": 0.22, "learning_rate": 0.0002990894893547809, "loss": 0.0491, "step": 1099 }, { "epoch": 0.22, "learning_rate": 0.0002990873554289026, "loss": 0.0141, "step": 1100 }, { "epoch": 0.22, "learning_rate": 0.000299085219012984, "loss": 0.0504, "step": 1101 }, { "epoch": 0.22, "learning_rate": 0.0002990830801070608, "loss": 0.0285, "step": 1102 }, { "epoch": 0.22, "learning_rate": 0.0002990809387111688, "loss": 0.064, "step": 1103 }, { "epoch": 0.22, "learning_rate": 0.0002990787948253437, "loss": 0.0232, "step": 1104 }, { "epoch": 0.22, "learning_rate": 0.0002990766484496213, "loss": 0.0147, "step": 1105 }, { "epoch": 0.23, "learning_rate": 0.0002990744995840375, "loss": 0.038, "step": 1106 }, { "epoch": 0.23, "learning_rate": 0.00029907234822862817, "loss": 0.0681, "step": 1107 }, { "epoch": 0.23, "learning_rate": 0.0002990701943834292, "loss": 0.0126, "step": 1108 }, { "epoch": 0.23, "learning_rate": 0.0002990680380484766, "loss": 0.0258, "step": 1109 }, { "epoch": 0.23, "learning_rate": 0.0002990658792238064, "loss": 0.0315, "step": 1110 }, { "epoch": 0.23, "learning_rate": 0.00029906371790945456, "loss": 0.0767, "step": 1111 }, { "epoch": 0.23, "learning_rate": 0.00029906155410545736, "loss": 0.0196, "step": 1112 }, { "epoch": 0.23, "learning_rate": 0.0002990593878118508, "loss": 0.0291, "step": 1113 }, { "epoch": 0.23, "learning_rate": 0.00029905721902867105, "loss": 0.0392, "step": 1114 }, { "epoch": 0.23, "learning_rate": 0.00029905504775595436, "loss": 0.0445, "step": 1115 }, { "epoch": 0.23, "learning_rate": 0.0002990528739937371, "loss": 0.0255, "step": 1116 }, { "epoch": 0.23, "learning_rate": 0.0002990506977420554, "loss": 0.0489, "step": 1117 }, { "epoch": 0.23, "learning_rate": 0.00029904851900094574, "loss": 0.0429, "step": 1118 }, { "epoch": 0.23, "learning_rate": 0.00029904633777044445, "loss": 0.0471, "step": 1119 }, { "epoch": 0.23, "learning_rate": 0.000299044154050588, "loss": 0.0388, "step": 1120 }, { "epoch": 0.23, "learning_rate": 0.0002990419678414128, "loss": 0.0194, "step": 1121 }, { "epoch": 0.23, "learning_rate": 0.0002990397791429554, "loss": 0.0315, "step": 1122 }, { "epoch": 0.23, "learning_rate": 0.0002990375879552524, "loss": 0.0514, "step": 1123 }, { "epoch": 0.23, "learning_rate": 0.00029903539427834035, "loss": 0.0403, "step": 1124 }, { "epoch": 0.23, "learning_rate": 0.00029903319811225586, "loss": 0.0561, "step": 1125 }, { "epoch": 0.23, "learning_rate": 0.0002990309994570356, "loss": 0.0283, "step": 1126 }, { "epoch": 0.23, "learning_rate": 0.0002990287983127164, "loss": 0.0368, "step": 1127 }, { "epoch": 0.23, "learning_rate": 0.00029902659467933494, "loss": 0.0302, "step": 1128 }, { "epoch": 0.23, "learning_rate": 0.00029902438855692806, "loss": 0.0312, "step": 1129 }, { "epoch": 0.23, "learning_rate": 0.00029902217994553257, "loss": 0.0248, "step": 1130 }, { "epoch": 0.23, "learning_rate": 0.00029901996884518537, "loss": 0.0465, "step": 1131 }, { "epoch": 0.23, "learning_rate": 0.0002990177552559234, "loss": 0.0238, "step": 1132 }, { "epoch": 0.23, "learning_rate": 0.0002990155391777836, "loss": 0.0675, "step": 1133 }, { "epoch": 0.23, "learning_rate": 0.00029901332061080303, "loss": 0.0812, "step": 1134 }, { "epoch": 0.23, "learning_rate": 0.0002990110995550187, "loss": 0.0157, "step": 1135 }, { "epoch": 0.23, "learning_rate": 0.00029900887601046775, "loss": 0.0493, "step": 1136 }, { "epoch": 0.23, "learning_rate": 0.00029900664997718735, "loss": 0.0362, "step": 1137 }, { "epoch": 0.23, "learning_rate": 0.00029900442145521454, "loss": 0.0196, "step": 1138 }, { "epoch": 0.23, "learning_rate": 0.0002990021904445867, "loss": 0.0473, "step": 1139 }, { "epoch": 0.23, "learning_rate": 0.000298999956945341, "loss": 0.0122, "step": 1140 }, { "epoch": 0.23, "learning_rate": 0.00029899772095751473, "loss": 0.0158, "step": 1141 }, { "epoch": 0.23, "learning_rate": 0.0002989954824811453, "loss": 0.0353, "step": 1142 }, { "epoch": 0.23, "learning_rate": 0.00029899324151627004, "loss": 0.0873, "step": 1143 }, { "epoch": 0.23, "learning_rate": 0.00029899099806292637, "loss": 0.03, "step": 1144 }, { "epoch": 0.23, "learning_rate": 0.00029898875212115185, "loss": 0.0098, "step": 1145 }, { "epoch": 0.23, "learning_rate": 0.0002989865036909839, "loss": 0.0391, "step": 1146 }, { "epoch": 0.23, "learning_rate": 0.0002989842527724601, "loss": 0.0041, "step": 1147 }, { "epoch": 0.23, "learning_rate": 0.00029898199936561807, "loss": 0.0446, "step": 1148 }, { "epoch": 0.23, "learning_rate": 0.00029897974347049545, "loss": 0.0178, "step": 1149 }, { "epoch": 0.23, "learning_rate": 0.0002989774850871299, "loss": 0.0263, "step": 1150 }, { "epoch": 0.23, "learning_rate": 0.00029897522421555903, "loss": 0.0635, "step": 1151 }, { "epoch": 0.23, "learning_rate": 0.0002989729608558208, "loss": 0.0572, "step": 1152 }, { "epoch": 0.23, "learning_rate": 0.0002989706950079529, "loss": 0.0557, "step": 1153 }, { "epoch": 0.23, "learning_rate": 0.0002989684266719932, "loss": 0.0415, "step": 1154 }, { "epoch": 0.24, "learning_rate": 0.00029896615584797955, "loss": 0.0372, "step": 1155 }, { "epoch": 0.24, "learning_rate": 0.00029896388253594994, "loss": 0.029, "step": 1156 }, { "epoch": 0.24, "learning_rate": 0.00029896160673594224, "loss": 0.05, "step": 1157 }, { "epoch": 0.24, "learning_rate": 0.00029895932844799456, "loss": 0.0549, "step": 1158 }, { "epoch": 0.24, "learning_rate": 0.0002989570476721449, "loss": 0.0215, "step": 1159 }, { "epoch": 0.24, "learning_rate": 0.0002989547644084314, "loss": 0.0485, "step": 1160 }, { "epoch": 0.24, "learning_rate": 0.0002989524786568922, "loss": 0.0341, "step": 1161 }, { "epoch": 0.24, "learning_rate": 0.0002989501904175653, "loss": 0.0294, "step": 1162 }, { "epoch": 0.24, "learning_rate": 0.0002989478996904892, "loss": 0.0158, "step": 1163 }, { "epoch": 0.24, "learning_rate": 0.00029894560647570197, "loss": 0.0059, "step": 1164 }, { "epoch": 0.24, "learning_rate": 0.0002989433107732419, "loss": 0.0169, "step": 1165 }, { "epoch": 0.24, "learning_rate": 0.00029894101258314747, "loss": 0.0151, "step": 1166 }, { "epoch": 0.24, "learning_rate": 0.00029893871190545695, "loss": 0.0146, "step": 1167 }, { "epoch": 0.24, "learning_rate": 0.0002989364087402088, "loss": 0.02, "step": 1168 }, { "epoch": 0.24, "learning_rate": 0.0002989341030874415, "loss": 0.0292, "step": 1169 }, { "epoch": 0.24, "learning_rate": 0.0002989317949471935, "loss": 0.031, "step": 1170 }, { "epoch": 0.24, "learning_rate": 0.00029892948431950347, "loss": 0.0299, "step": 1171 }, { "epoch": 0.24, "learning_rate": 0.00029892717120440985, "loss": 0.0247, "step": 1172 }, { "epoch": 0.24, "learning_rate": 0.00029892485560195143, "loss": 0.0119, "step": 1173 }, { "epoch": 0.24, "learning_rate": 0.0002989225375121667, "loss": 0.0218, "step": 1174 }, { "epoch": 0.24, "learning_rate": 0.0002989202169350946, "loss": 0.0194, "step": 1175 }, { "epoch": 0.24, "learning_rate": 0.0002989178938707737, "loss": 0.0545, "step": 1176 }, { "epoch": 0.24, "learning_rate": 0.00029891556831924287, "loss": 0.0085, "step": 1177 }, { "epoch": 0.24, "learning_rate": 0.000298913240280541, "loss": 0.0224, "step": 1178 }, { "epoch": 0.24, "learning_rate": 0.00029891090975470684, "loss": 0.0168, "step": 1179 }, { "epoch": 0.24, "learning_rate": 0.00029890857674177946, "loss": 0.0722, "step": 1180 }, { "epoch": 0.24, "learning_rate": 0.00029890624124179774, "loss": 0.0534, "step": 1181 }, { "epoch": 0.24, "learning_rate": 0.00029890390325480076, "loss": 0.079, "step": 1182 }, { "epoch": 0.24, "learning_rate": 0.00029890156278082744, "loss": 0.0264, "step": 1183 }, { "epoch": 0.24, "learning_rate": 0.000298899219819917, "loss": 0.0852, "step": 1184 }, { "epoch": 0.24, "learning_rate": 0.0002988968743721085, "loss": 0.0234, "step": 1185 }, { "epoch": 0.24, "learning_rate": 0.0002988945264374412, "loss": 0.0066, "step": 1186 }, { "epoch": 0.24, "learning_rate": 0.00029889217601595413, "loss": 0.0399, "step": 1187 }, { "epoch": 0.24, "learning_rate": 0.00029888982310768676, "loss": 0.0273, "step": 1188 }, { "epoch": 0.24, "learning_rate": 0.0002988874677126783, "loss": 0.0274, "step": 1189 }, { "epoch": 0.24, "learning_rate": 0.00029888510983096803, "loss": 0.017, "step": 1190 }, { "epoch": 0.24, "learning_rate": 0.0002988827494625954, "loss": 0.0381, "step": 1191 }, { "epoch": 0.24, "learning_rate": 0.00029888038660759984, "loss": 0.0313, "step": 1192 }, { "epoch": 0.24, "learning_rate": 0.00029887802126602077, "loss": 0.045, "step": 1193 }, { "epoch": 0.24, "learning_rate": 0.00029887565343789774, "loss": 0.0209, "step": 1194 }, { "epoch": 0.24, "learning_rate": 0.0002988732831232702, "loss": 0.0229, "step": 1195 }, { "epoch": 0.24, "learning_rate": 0.0002988709103221779, "loss": 0.028, "step": 1196 }, { "epoch": 0.24, "learning_rate": 0.0002988685350346604, "loss": 0.032, "step": 1197 }, { "epoch": 0.24, "learning_rate": 0.00029886615726075727, "loss": 0.0287, "step": 1198 }, { "epoch": 0.24, "learning_rate": 0.00029886377700050833, "loss": 0.0305, "step": 1199 }, { "epoch": 0.24, "learning_rate": 0.00029886139425395336, "loss": 0.0106, "step": 1200 }, { "epoch": 0.24, "learning_rate": 0.00029885900902113205, "loss": 0.019, "step": 1201 }, { "epoch": 0.24, "learning_rate": 0.0002988566213020844, "loss": 0.0308, "step": 1202 }, { "epoch": 0.24, "learning_rate": 0.00029885423109685013, "loss": 0.0191, "step": 1203 }, { "epoch": 0.25, "learning_rate": 0.00029885183840546917, "loss": 0.043, "step": 1204 }, { "epoch": 0.25, "learning_rate": 0.00029884944322798156, "loss": 0.0501, "step": 1205 }, { "epoch": 0.25, "learning_rate": 0.0002988470455644273, "loss": 0.0363, "step": 1206 }, { "epoch": 0.25, "learning_rate": 0.0002988446454148464, "loss": 0.0266, "step": 1207 }, { "epoch": 0.25, "learning_rate": 0.00029884224277927895, "loss": 0.0173, "step": 1208 }, { "epoch": 0.25, "learning_rate": 0.0002988398376577651, "loss": 0.034, "step": 1209 }, { "epoch": 0.25, "learning_rate": 0.000298837430050345, "loss": 0.017, "step": 1210 }, { "epoch": 0.25, "learning_rate": 0.00029883501995705885, "loss": 0.0134, "step": 1211 }, { "epoch": 0.25, "learning_rate": 0.00029883260737794694, "loss": 0.0387, "step": 1212 }, { "epoch": 0.25, "learning_rate": 0.00029883019231304953, "loss": 0.0113, "step": 1213 }, { "epoch": 0.25, "learning_rate": 0.000298827774762407, "loss": 0.0278, "step": 1214 }, { "epoch": 0.25, "learning_rate": 0.0002988253547260597, "loss": 0.0144, "step": 1215 }, { "epoch": 0.25, "learning_rate": 0.000298822932204048, "loss": 0.0218, "step": 1216 }, { "epoch": 0.25, "learning_rate": 0.00029882050719641246, "loss": 0.0184, "step": 1217 }, { "epoch": 0.25, "learning_rate": 0.0002988180797031935, "loss": 0.0199, "step": 1218 }, { "epoch": 0.25, "learning_rate": 0.00029881564972443166, "loss": 0.0178, "step": 1219 }, { "epoch": 0.25, "learning_rate": 0.00029881321726016763, "loss": 0.0557, "step": 1220 }, { "epoch": 0.25, "learning_rate": 0.00029881078231044195, "loss": 0.0244, "step": 1221 }, { "epoch": 0.25, "learning_rate": 0.0002988083448752953, "loss": 0.0134, "step": 1222 }, { "epoch": 0.25, "learning_rate": 0.00029880590495476837, "loss": 0.0162, "step": 1223 }, { "epoch": 0.25, "learning_rate": 0.00029880346254890195, "loss": 0.0121, "step": 1224 }, { "epoch": 0.25, "learning_rate": 0.00029880101765773683, "loss": 0.0298, "step": 1225 }, { "epoch": 0.25, "learning_rate": 0.00029879857028131384, "loss": 0.0253, "step": 1226 }, { "epoch": 0.25, "learning_rate": 0.00029879612041967384, "loss": 0.0147, "step": 1227 }, { "epoch": 0.25, "learning_rate": 0.0002987936680728578, "loss": 0.0501, "step": 1228 }, { "epoch": 0.25, "learning_rate": 0.0002987912132409065, "loss": 0.0492, "step": 1229 }, { "epoch": 0.25, "learning_rate": 0.0002987887559238612, "loss": 0.0232, "step": 1230 }, { "epoch": 0.25, "learning_rate": 0.0002987862961217628, "loss": 0.0337, "step": 1231 }, { "epoch": 0.25, "learning_rate": 0.00029878383383465237, "loss": 0.0117, "step": 1232 }, { "epoch": 0.25, "learning_rate": 0.0002987813690625711, "loss": 0.0092, "step": 1233 }, { "epoch": 0.25, "learning_rate": 0.00029877890180556006, "loss": 0.0296, "step": 1234 }, { "epoch": 0.25, "learning_rate": 0.0002987764320636606, "loss": 0.046, "step": 1235 }, { "epoch": 0.25, "learning_rate": 0.0002987739598369138, "loss": 0.0241, "step": 1236 }, { "epoch": 0.25, "learning_rate": 0.00029877148512536114, "loss": 0.0483, "step": 1237 }, { "epoch": 0.25, "learning_rate": 0.0002987690079290438, "loss": 0.0246, "step": 1238 }, { "epoch": 0.25, "learning_rate": 0.0002987665282480032, "loss": 0.0164, "step": 1239 }, { "epoch": 0.25, "learning_rate": 0.00029876404608228076, "loss": 0.0345, "step": 1240 }, { "epoch": 0.25, "learning_rate": 0.0002987615614319179, "loss": 0.0329, "step": 1241 }, { "epoch": 0.25, "learning_rate": 0.00029875907429695623, "loss": 0.0591, "step": 1242 }, { "epoch": 0.25, "learning_rate": 0.0002987565846774372, "loss": 0.012, "step": 1243 }, { "epoch": 0.25, "learning_rate": 0.00029875409257340243, "loss": 0.048, "step": 1244 }, { "epoch": 0.25, "learning_rate": 0.00029875159798489347, "loss": 0.0228, "step": 1245 }, { "epoch": 0.25, "learning_rate": 0.0002987491009119521, "loss": 0.0139, "step": 1246 }, { "epoch": 0.25, "learning_rate": 0.00029874660135461987, "loss": 0.0676, "step": 1247 }, { "epoch": 0.25, "learning_rate": 0.00029874409931293866, "loss": 0.0142, "step": 1248 }, { "epoch": 0.25, "learning_rate": 0.0002987415947869502, "loss": 0.0096, "step": 1249 }, { "epoch": 0.25, "learning_rate": 0.0002987390877766964, "loss": 0.0451, "step": 1250 }, { "epoch": 0.25, "learning_rate": 0.000298736578282219, "loss": 0.0386, "step": 1251 }, { "epoch": 0.25, "learning_rate": 0.00029873406630356007, "loss": 0.0276, "step": 1252 }, { "epoch": 0.26, "learning_rate": 0.0002987315518407614, "loss": 0.0215, "step": 1253 }, { "epoch": 0.26, "learning_rate": 0.00029872903489386505, "loss": 0.0191, "step": 1254 }, { "epoch": 0.26, "learning_rate": 0.0002987265154629131, "loss": 0.0458, "step": 1255 }, { "epoch": 0.26, "learning_rate": 0.0002987239935479476, "loss": 0.0141, "step": 1256 }, { "epoch": 0.26, "learning_rate": 0.0002987214691490107, "loss": 0.088, "step": 1257 }, { "epoch": 0.26, "learning_rate": 0.00029871894226614446, "loss": 0.0188, "step": 1258 }, { "epoch": 0.26, "learning_rate": 0.00029871641289939125, "loss": 0.0594, "step": 1259 }, { "epoch": 0.26, "learning_rate": 0.0002987138810487932, "loss": 0.0223, "step": 1260 }, { "epoch": 0.26, "learning_rate": 0.0002987113467143926, "loss": 0.0579, "step": 1261 }, { "epoch": 0.26, "learning_rate": 0.0002987088098962318, "loss": 0.0116, "step": 1262 }, { "epoch": 0.26, "learning_rate": 0.00029870627059435317, "loss": 0.0292, "step": 1263 }, { "epoch": 0.26, "learning_rate": 0.00029870372880879905, "loss": 0.0491, "step": 1264 }, { "epoch": 0.26, "learning_rate": 0.00029870118453961206, "loss": 0.0272, "step": 1265 }, { "epoch": 0.26, "learning_rate": 0.00029869863778683454, "loss": 0.0063, "step": 1266 }, { "epoch": 0.26, "learning_rate": 0.0002986960885505091, "loss": 0.0337, "step": 1267 }, { "epoch": 0.26, "learning_rate": 0.00029869353683067827, "loss": 0.0316, "step": 1268 }, { "epoch": 0.26, "learning_rate": 0.00029869098262738474, "loss": 0.0259, "step": 1269 }, { "epoch": 0.26, "learning_rate": 0.0002986884259406711, "loss": 0.0141, "step": 1270 }, { "epoch": 0.26, "learning_rate": 0.00029868586677058004, "loss": 0.0101, "step": 1271 }, { "epoch": 0.26, "learning_rate": 0.0002986833051171544, "loss": 0.0599, "step": 1272 }, { "epoch": 0.26, "learning_rate": 0.00029868074098043695, "loss": 0.0134, "step": 1273 }, { "epoch": 0.26, "learning_rate": 0.0002986781743604704, "loss": 0.0273, "step": 1274 }, { "epoch": 0.26, "learning_rate": 0.00029867560525729766, "loss": 0.0293, "step": 1275 }, { "epoch": 0.26, "learning_rate": 0.0002986730336709617, "loss": 0.0296, "step": 1276 }, { "epoch": 0.26, "learning_rate": 0.00029867045960150547, "loss": 0.0092, "step": 1277 }, { "epoch": 0.26, "learning_rate": 0.0002986678830489719, "loss": 0.0254, "step": 1278 }, { "epoch": 0.26, "learning_rate": 0.00029866530401340407, "loss": 0.026, "step": 1279 }, { "epoch": 0.26, "learning_rate": 0.000298662722494845, "loss": 0.0138, "step": 1280 }, { "epoch": 0.26, "learning_rate": 0.00029866013849333785, "loss": 0.0288, "step": 1281 }, { "epoch": 0.26, "learning_rate": 0.0002986575520089258, "loss": 0.02, "step": 1282 }, { "epoch": 0.26, "learning_rate": 0.000298654963041652, "loss": 0.0361, "step": 1283 }, { "epoch": 0.26, "learning_rate": 0.0002986523715915597, "loss": 0.0305, "step": 1284 }, { "epoch": 0.26, "learning_rate": 0.0002986497776586922, "loss": 0.0215, "step": 1285 }, { "epoch": 0.26, "learning_rate": 0.00029864718124309283, "loss": 0.0493, "step": 1286 }, { "epoch": 0.26, "learning_rate": 0.00029864458234480496, "loss": 0.0141, "step": 1287 }, { "epoch": 0.26, "learning_rate": 0.00029864198096387197, "loss": 0.0228, "step": 1288 }, { "epoch": 0.26, "learning_rate": 0.0002986393771003373, "loss": 0.0671, "step": 1289 }, { "epoch": 0.26, "learning_rate": 0.00029863677075424446, "loss": 0.0298, "step": 1290 }, { "epoch": 0.26, "learning_rate": 0.000298634161925637, "loss": 0.0827, "step": 1291 }, { "epoch": 0.26, "learning_rate": 0.0002986315506145584, "loss": 0.0421, "step": 1292 }, { "epoch": 0.26, "learning_rate": 0.0002986289368210524, "loss": 0.0117, "step": 1293 }, { "epoch": 0.26, "learning_rate": 0.0002986263205451626, "loss": 0.0109, "step": 1294 }, { "epoch": 0.26, "learning_rate": 0.00029862370178693263, "loss": 0.0291, "step": 1295 }, { "epoch": 0.26, "learning_rate": 0.0002986210805464064, "loss": 0.0339, "step": 1296 }, { "epoch": 0.26, "learning_rate": 0.0002986184568236275, "loss": 0.0577, "step": 1297 }, { "epoch": 0.26, "learning_rate": 0.00029861583061863985, "loss": 0.0117, "step": 1298 }, { "epoch": 0.26, "learning_rate": 0.00029861320193148736, "loss": 0.0189, "step": 1299 }, { "epoch": 0.26, "learning_rate": 0.0002986105707622138, "loss": 0.0333, "step": 1300 }, { "epoch": 0.26, "learning_rate": 0.0002986079371108632, "loss": 0.0292, "step": 1301 }, { "epoch": 0.27, "learning_rate": 0.0002986053009774795, "loss": 0.0243, "step": 1302 }, { "epoch": 0.27, "learning_rate": 0.0002986026623621068, "loss": 0.0346, "step": 1303 }, { "epoch": 0.27, "learning_rate": 0.00029860002126478913, "loss": 0.0302, "step": 1304 }, { "epoch": 0.27, "learning_rate": 0.0002985973776855706, "loss": 0.0041, "step": 1305 }, { "epoch": 0.27, "learning_rate": 0.0002985947316244954, "loss": 0.0194, "step": 1306 }, { "epoch": 0.27, "learning_rate": 0.00029859208308160765, "loss": 0.0103, "step": 1307 }, { "epoch": 0.27, "learning_rate": 0.0002985894320569516, "loss": 0.0192, "step": 1308 }, { "epoch": 0.27, "learning_rate": 0.0002985867785505716, "loss": 0.0387, "step": 1309 }, { "epoch": 0.27, "learning_rate": 0.0002985841225625119, "loss": 0.0095, "step": 1310 }, { "epoch": 0.27, "learning_rate": 0.00029858146409281693, "loss": 0.0461, "step": 1311 }, { "epoch": 0.27, "learning_rate": 0.00029857880314153096, "loss": 0.0577, "step": 1312 }, { "epoch": 0.27, "learning_rate": 0.00029857613970869854, "loss": 0.014, "step": 1313 }, { "epoch": 0.27, "learning_rate": 0.00029857347379436415, "loss": 0.0372, "step": 1314 }, { "epoch": 0.27, "learning_rate": 0.0002985708053985723, "loss": 0.0409, "step": 1315 }, { "epoch": 0.27, "learning_rate": 0.00029856813452136755, "loss": 0.1102, "step": 1316 }, { "epoch": 0.27, "learning_rate": 0.00029856546116279446, "loss": 0.0495, "step": 1317 }, { "epoch": 0.27, "learning_rate": 0.0002985627853228978, "loss": 0.0519, "step": 1318 }, { "epoch": 0.27, "learning_rate": 0.00029856010700172217, "loss": 0.0292, "step": 1319 }, { "epoch": 0.27, "learning_rate": 0.0002985574261993123, "loss": 0.0071, "step": 1320 }, { "epoch": 0.27, "learning_rate": 0.000298554742915713, "loss": 0.0399, "step": 1321 }, { "epoch": 0.27, "learning_rate": 0.0002985520571509691, "loss": 0.0072, "step": 1322 }, { "epoch": 0.27, "learning_rate": 0.0002985493689051254, "loss": 0.0205, "step": 1323 }, { "epoch": 0.27, "learning_rate": 0.00029854667817822686, "loss": 0.0132, "step": 1324 }, { "epoch": 0.27, "learning_rate": 0.0002985439849703184, "loss": 0.0131, "step": 1325 }, { "epoch": 0.27, "learning_rate": 0.00029854128928144503, "loss": 0.0184, "step": 1326 }, { "epoch": 0.27, "learning_rate": 0.00029853859111165164, "loss": 0.0111, "step": 1327 }, { "epoch": 0.27, "learning_rate": 0.00029853589046098343, "loss": 0.0244, "step": 1328 }, { "epoch": 0.27, "learning_rate": 0.0002985331873294855, "loss": 0.036, "step": 1329 }, { "epoch": 0.27, "learning_rate": 0.00029853048171720294, "loss": 0.0202, "step": 1330 }, { "epoch": 0.27, "learning_rate": 0.000298527773624181, "loss": 0.0321, "step": 1331 }, { "epoch": 0.27, "learning_rate": 0.0002985250630504648, "loss": 0.0417, "step": 1332 }, { "epoch": 0.27, "learning_rate": 0.0002985223499960997, "loss": 0.0431, "step": 1333 }, { "epoch": 0.27, "learning_rate": 0.00029851963446113106, "loss": 0.0254, "step": 1334 }, { "epoch": 0.27, "learning_rate": 0.00029851691644560416, "loss": 0.0138, "step": 1335 }, { "epoch": 0.27, "learning_rate": 0.0002985141959495644, "loss": 0.0451, "step": 1336 }, { "epoch": 0.27, "learning_rate": 0.0002985114729730572, "loss": 0.0059, "step": 1337 }, { "epoch": 0.27, "learning_rate": 0.0002985087475161281, "loss": 0.0234, "step": 1338 }, { "epoch": 0.27, "learning_rate": 0.00029850601957882254, "loss": 0.0539, "step": 1339 }, { "epoch": 0.27, "learning_rate": 0.00029850328916118614, "loss": 0.0205, "step": 1340 }, { "epoch": 0.27, "learning_rate": 0.0002985005562632645, "loss": 0.0486, "step": 1341 }, { "epoch": 0.27, "learning_rate": 0.0002984978208851033, "loss": 0.0182, "step": 1342 }, { "epoch": 0.27, "learning_rate": 0.0002984950830267482, "loss": 0.034, "step": 1343 }, { "epoch": 0.27, "learning_rate": 0.0002984923426882448, "loss": 0.0216, "step": 1344 }, { "epoch": 0.27, "learning_rate": 0.000298489599869639, "loss": 0.0305, "step": 1345 }, { "epoch": 0.27, "learning_rate": 0.0002984868545709767, "loss": 0.0512, "step": 1346 }, { "epoch": 0.27, "learning_rate": 0.0002984841067923035, "loss": 0.0515, "step": 1347 }, { "epoch": 0.27, "learning_rate": 0.00029848135653366556, "loss": 0.02, "step": 1348 }, { "epoch": 0.27, "learning_rate": 0.00029847860379510855, "loss": 0.0335, "step": 1349 }, { "epoch": 0.27, "learning_rate": 0.0002984758485766787, "loss": 0.0187, "step": 1350 }, { "epoch": 0.28, "learning_rate": 0.00029847309087842187, "loss": 0.0654, "step": 1351 }, { "epoch": 0.28, "learning_rate": 0.00029847033070038413, "loss": 0.0547, "step": 1352 }, { "epoch": 0.28, "learning_rate": 0.00029846756804261166, "loss": 0.0224, "step": 1353 }, { "epoch": 0.28, "learning_rate": 0.00029846480290515054, "loss": 0.0362, "step": 1354 }, { "epoch": 0.28, "learning_rate": 0.00029846203528804694, "loss": 0.027, "step": 1355 }, { "epoch": 0.28, "learning_rate": 0.0002984592651913471, "loss": 0.0383, "step": 1356 }, { "epoch": 0.28, "learning_rate": 0.00029845649261509737, "loss": 0.0344, "step": 1357 }, { "epoch": 0.28, "learning_rate": 0.00029845371755934393, "loss": 0.0434, "step": 1358 }, { "epoch": 0.28, "learning_rate": 0.00029845094002413315, "loss": 0.0225, "step": 1359 }, { "epoch": 0.28, "learning_rate": 0.0002984481600095115, "loss": 0.0183, "step": 1360 }, { "epoch": 0.28, "learning_rate": 0.00029844537751552534, "loss": 0.0086, "step": 1361 }, { "epoch": 0.28, "learning_rate": 0.0002984425925422211, "loss": 0.0501, "step": 1362 }, { "epoch": 0.28, "learning_rate": 0.0002984398050896455, "loss": 0.0139, "step": 1363 }, { "epoch": 0.28, "learning_rate": 0.00029843701515784484, "loss": 0.0335, "step": 1364 }, { "epoch": 0.28, "learning_rate": 0.00029843422274686586, "loss": 0.0266, "step": 1365 }, { "epoch": 0.28, "learning_rate": 0.00029843142785675517, "loss": 0.0279, "step": 1366 }, { "epoch": 0.28, "learning_rate": 0.0002984286304875595, "loss": 0.0298, "step": 1367 }, { "epoch": 0.28, "learning_rate": 0.0002984258306393255, "loss": 0.0103, "step": 1368 }, { "epoch": 0.28, "learning_rate": 0.0002984230283120999, "loss": 0.0263, "step": 1369 }, { "epoch": 0.28, "learning_rate": 0.00029842022350592967, "loss": 0.033, "step": 1370 }, { "epoch": 0.28, "learning_rate": 0.0002984174162208614, "loss": 0.0636, "step": 1371 }, { "epoch": 0.28, "learning_rate": 0.0002984146064569422, "loss": 0.0261, "step": 1372 }, { "epoch": 0.28, "learning_rate": 0.00029841179421421897, "loss": 0.0264, "step": 1373 }, { "epoch": 0.28, "learning_rate": 0.0002984089794927385, "loss": 0.0081, "step": 1374 }, { "epoch": 0.28, "learning_rate": 0.0002984061622925481, "loss": 0.01, "step": 1375 }, { "epoch": 0.28, "learning_rate": 0.0002984033426136945, "loss": 0.0199, "step": 1376 }, { "epoch": 0.28, "learning_rate": 0.000298400520456225, "loss": 0.0177, "step": 1377 }, { "epoch": 0.28, "learning_rate": 0.0002983976958201867, "loss": 0.0189, "step": 1378 }, { "epoch": 0.28, "learning_rate": 0.00029839486870562675, "loss": 0.0144, "step": 1379 }, { "epoch": 0.28, "learning_rate": 0.00029839203911259237, "loss": 0.0401, "step": 1380 }, { "epoch": 0.28, "learning_rate": 0.00029838920704113085, "loss": 0.0353, "step": 1381 }, { "epoch": 0.28, "learning_rate": 0.0002983863724912894, "loss": 0.0134, "step": 1382 }, { "epoch": 0.28, "learning_rate": 0.00029838353546311546, "loss": 0.0407, "step": 1383 }, { "epoch": 0.28, "learning_rate": 0.00029838069595665645, "loss": 0.0494, "step": 1384 }, { "epoch": 0.28, "learning_rate": 0.00029837785397195967, "loss": 0.0435, "step": 1385 }, { "epoch": 0.28, "learning_rate": 0.00029837500950907265, "loss": 0.0172, "step": 1386 }, { "epoch": 0.28, "learning_rate": 0.00029837216256804294, "loss": 0.0114, "step": 1387 }, { "epoch": 0.28, "learning_rate": 0.000298369313148918, "loss": 0.0516, "step": 1388 }, { "epoch": 0.28, "learning_rate": 0.00029836646125174545, "loss": 0.0359, "step": 1389 }, { "epoch": 0.28, "learning_rate": 0.000298363606876573, "loss": 0.0474, "step": 1390 }, { "epoch": 0.28, "learning_rate": 0.00029836075002344814, "loss": 0.0493, "step": 1391 }, { "epoch": 0.28, "learning_rate": 0.0002983578906924188, "loss": 0.0045, "step": 1392 }, { "epoch": 0.28, "learning_rate": 0.0002983550288835326, "loss": 0.0444, "step": 1393 }, { "epoch": 0.28, "learning_rate": 0.00029835216459683745, "loss": 0.027, "step": 1394 }, { "epoch": 0.28, "learning_rate": 0.00029834929783238104, "loss": 0.0436, "step": 1395 }, { "epoch": 0.28, "learning_rate": 0.00029834642859021134, "loss": 0.0295, "step": 1396 }, { "epoch": 0.28, "learning_rate": 0.00029834355687037627, "loss": 0.0494, "step": 1397 }, { "epoch": 0.28, "learning_rate": 0.0002983406826729238, "loss": 0.0213, "step": 1398 }, { "epoch": 0.28, "learning_rate": 0.0002983378059979019, "loss": 0.0171, "step": 1399 }, { "epoch": 0.29, "learning_rate": 0.0002983349268453586, "loss": 0.0494, "step": 1400 }, { "epoch": 0.29, "learning_rate": 0.00029833204521534205, "loss": 0.0207, "step": 1401 }, { "epoch": 0.29, "learning_rate": 0.00029832916110790036, "loss": 0.0287, "step": 1402 }, { "epoch": 0.29, "learning_rate": 0.0002983262745230817, "loss": 0.0514, "step": 1403 }, { "epoch": 0.29, "learning_rate": 0.0002983233854609342, "loss": 0.0141, "step": 1404 }, { "epoch": 0.29, "learning_rate": 0.00029832049392150626, "loss": 0.027, "step": 1405 }, { "epoch": 0.29, "learning_rate": 0.00029831759990484605, "loss": 0.0231, "step": 1406 }, { "epoch": 0.29, "learning_rate": 0.00029831470341100196, "loss": 0.0249, "step": 1407 }, { "epoch": 0.29, "learning_rate": 0.00029831180444002235, "loss": 0.0055, "step": 1408 }, { "epoch": 0.29, "learning_rate": 0.0002983089029919557, "loss": 0.0196, "step": 1409 }, { "epoch": 0.29, "learning_rate": 0.00029830599906685036, "loss": 0.0265, "step": 1410 }, { "epoch": 0.29, "learning_rate": 0.0002983030926647549, "loss": 0.0097, "step": 1411 }, { "epoch": 0.29, "learning_rate": 0.00029830018378571786, "loss": 0.0242, "step": 1412 }, { "epoch": 0.29, "learning_rate": 0.0002982972724297878, "loss": 0.0275, "step": 1413 }, { "epoch": 0.29, "learning_rate": 0.00029829435859701336, "loss": 0.022, "step": 1414 }, { "epoch": 0.29, "learning_rate": 0.0002982914422874432, "loss": 0.0863, "step": 1415 }, { "epoch": 0.29, "learning_rate": 0.0002982885235011261, "loss": 0.0245, "step": 1416 }, { "epoch": 0.29, "learning_rate": 0.0002982856022381107, "loss": 0.0409, "step": 1417 }, { "epoch": 0.29, "learning_rate": 0.0002982826784984458, "loss": 0.0291, "step": 1418 }, { "epoch": 0.29, "learning_rate": 0.0002982797522821803, "loss": 0.0108, "step": 1419 }, { "epoch": 0.29, "learning_rate": 0.00029827682358936304, "loss": 0.0227, "step": 1420 }, { "epoch": 0.29, "learning_rate": 0.0002982738924200429, "loss": 0.0482, "step": 1421 }, { "epoch": 0.29, "learning_rate": 0.00029827095877426896, "loss": 0.015, "step": 1422 }, { "epoch": 0.29, "learning_rate": 0.00029826802265209, "loss": 0.0363, "step": 1423 }, { "epoch": 0.29, "learning_rate": 0.00029826508405355527, "loss": 0.0261, "step": 1424 }, { "epoch": 0.29, "learning_rate": 0.00029826214297871376, "loss": 0.0495, "step": 1425 }, { "epoch": 0.29, "learning_rate": 0.0002982591994276146, "loss": 0.0327, "step": 1426 }, { "epoch": 0.29, "learning_rate": 0.0002982562534003069, "loss": 0.0194, "step": 1427 }, { "epoch": 0.29, "learning_rate": 0.00029825330489684, "loss": 0.0235, "step": 1428 }, { "epoch": 0.29, "learning_rate": 0.00029825035391726297, "loss": 0.0288, "step": 1429 }, { "epoch": 0.29, "learning_rate": 0.0002982474004616252, "loss": 0.0165, "step": 1430 }, { "epoch": 0.29, "learning_rate": 0.00029824444452997606, "loss": 0.0318, "step": 1431 }, { "epoch": 0.29, "learning_rate": 0.00029824148612236483, "loss": 0.0107, "step": 1432 }, { "epoch": 0.29, "learning_rate": 0.00029823852523884096, "loss": 0.018, "step": 1433 }, { "epoch": 0.29, "learning_rate": 0.0002982355618794539, "loss": 0.0197, "step": 1434 }, { "epoch": 0.29, "learning_rate": 0.0002982325960442531, "loss": 0.0271, "step": 1435 }, { "epoch": 0.29, "learning_rate": 0.00029822962773328826, "loss": 0.0198, "step": 1436 }, { "epoch": 0.29, "learning_rate": 0.0002982266569466087, "loss": 0.0359, "step": 1437 }, { "epoch": 0.29, "learning_rate": 0.0002982236836842643, "loss": 0.0508, "step": 1438 }, { "epoch": 0.29, "learning_rate": 0.00029822070794630447, "loss": 0.0353, "step": 1439 }, { "epoch": 0.29, "learning_rate": 0.00029821772973277907, "loss": 0.016, "step": 1440 }, { "epoch": 0.29, "learning_rate": 0.00029821474904373783, "loss": 0.0372, "step": 1441 }, { "epoch": 0.29, "learning_rate": 0.00029821176587923047, "loss": 0.0227, "step": 1442 }, { "epoch": 0.29, "learning_rate": 0.00029820878023930687, "loss": 0.0114, "step": 1443 }, { "epoch": 0.29, "learning_rate": 0.00029820579212401683, "loss": 0.0141, "step": 1444 }, { "epoch": 0.29, "learning_rate": 0.0002982028015334104, "loss": 0.0233, "step": 1445 }, { "epoch": 0.29, "learning_rate": 0.00029819980846753735, "loss": 0.0386, "step": 1446 }, { "epoch": 0.29, "learning_rate": 0.0002981968129264478, "loss": 0.009, "step": 1447 }, { "epoch": 0.29, "learning_rate": 0.0002981938149101917, "loss": 0.0345, "step": 1448 }, { "epoch": 0.3, "learning_rate": 0.00029819081441881916, "loss": 0.0494, "step": 1449 }, { "epoch": 0.3, "learning_rate": 0.00029818781145238033, "loss": 0.0185, "step": 1450 }, { "epoch": 0.3, "learning_rate": 0.00029818480601092527, "loss": 0.0584, "step": 1451 }, { "epoch": 0.3, "learning_rate": 0.0002981817980945043, "loss": 0.0282, "step": 1452 }, { "epoch": 0.3, "learning_rate": 0.0002981787877031675, "loss": 0.0172, "step": 1453 }, { "epoch": 0.3, "learning_rate": 0.0002981757748369653, "loss": 0.0354, "step": 1454 }, { "epoch": 0.3, "learning_rate": 0.00029817275949594793, "loss": 0.046, "step": 1455 }, { "epoch": 0.3, "learning_rate": 0.0002981697416801658, "loss": 0.0547, "step": 1456 }, { "epoch": 0.3, "learning_rate": 0.00029816672138966924, "loss": 0.0143, "step": 1457 }, { "epoch": 0.3, "learning_rate": 0.00029816369862450883, "loss": 0.0542, "step": 1458 }, { "epoch": 0.3, "learning_rate": 0.00029816067338473486, "loss": 0.033, "step": 1459 }, { "epoch": 0.3, "learning_rate": 0.0002981576456703981, "loss": 0.0339, "step": 1460 }, { "epoch": 0.3, "learning_rate": 0.00029815461548154894, "loss": 0.0382, "step": 1461 }, { "epoch": 0.3, "learning_rate": 0.00029815158281823803, "loss": 0.0323, "step": 1462 }, { "epoch": 0.3, "learning_rate": 0.00029814854768051604, "loss": 0.0315, "step": 1463 }, { "epoch": 0.3, "learning_rate": 0.00029814551006843366, "loss": 0.0151, "step": 1464 }, { "epoch": 0.3, "learning_rate": 0.0002981424699820416, "loss": 0.0366, "step": 1465 }, { "epoch": 0.3, "learning_rate": 0.00029813942742139065, "loss": 0.0071, "step": 1466 }, { "epoch": 0.3, "learning_rate": 0.0002981363823865317, "loss": 0.0094, "step": 1467 }, { "epoch": 0.3, "learning_rate": 0.00029813333487751543, "loss": 0.0067, "step": 1468 }, { "epoch": 0.3, "learning_rate": 0.0002981302848943929, "loss": 0.0408, "step": 1469 }, { "epoch": 0.3, "learning_rate": 0.00029812723243721496, "loss": 0.0238, "step": 1470 }, { "epoch": 0.3, "learning_rate": 0.0002981241775060327, "loss": 0.0168, "step": 1471 }, { "epoch": 0.3, "learning_rate": 0.000298121120100897, "loss": 0.0039, "step": 1472 }, { "epoch": 0.3, "learning_rate": 0.000298118060221859, "loss": 0.0145, "step": 1473 }, { "epoch": 0.3, "learning_rate": 0.00029811499786896984, "loss": 0.0388, "step": 1474 }, { "epoch": 0.3, "learning_rate": 0.00029811193304228064, "loss": 0.0263, "step": 1475 }, { "epoch": 0.3, "learning_rate": 0.0002981088657418425, "loss": 0.0071, "step": 1476 }, { "epoch": 0.3, "learning_rate": 0.0002981057959677068, "loss": 0.0349, "step": 1477 }, { "epoch": 0.3, "learning_rate": 0.0002981027237199247, "loss": 0.044, "step": 1478 }, { "epoch": 0.3, "learning_rate": 0.0002980996489985476, "loss": 0.009, "step": 1479 }, { "epoch": 0.3, "learning_rate": 0.0002980965718036267, "loss": 0.0547, "step": 1480 }, { "epoch": 0.3, "learning_rate": 0.00029809349213521364, "loss": 0.0317, "step": 1481 }, { "epoch": 0.3, "learning_rate": 0.00029809040999335967, "loss": 0.0191, "step": 1482 }, { "epoch": 0.3, "learning_rate": 0.00029808732537811626, "loss": 0.0403, "step": 1483 }, { "epoch": 0.3, "learning_rate": 0.00029808423828953497, "loss": 0.0272, "step": 1484 }, { "epoch": 0.3, "learning_rate": 0.00029808114872766745, "loss": 0.0221, "step": 1485 }, { "epoch": 0.3, "learning_rate": 0.00029807805669256515, "loss": 0.0318, "step": 1486 }, { "epoch": 0.3, "learning_rate": 0.00029807496218427985, "loss": 0.0082, "step": 1487 }, { "epoch": 0.3, "learning_rate": 0.00029807186520286314, "loss": 0.0185, "step": 1488 }, { "epoch": 0.3, "learning_rate": 0.00029806876574836675, "loss": 0.0248, "step": 1489 }, { "epoch": 0.3, "learning_rate": 0.0002980656638208425, "loss": 0.03, "step": 1490 }, { "epoch": 0.3, "learning_rate": 0.00029806255942034217, "loss": 0.0439, "step": 1491 }, { "epoch": 0.3, "learning_rate": 0.0002980594525469176, "loss": 0.014, "step": 1492 }, { "epoch": 0.3, "learning_rate": 0.0002980563432006207, "loss": 0.0078, "step": 1493 }, { "epoch": 0.3, "learning_rate": 0.0002980532313815034, "loss": 0.0527, "step": 1494 }, { "epoch": 0.3, "learning_rate": 0.00029805011708961763, "loss": 0.0084, "step": 1495 }, { "epoch": 0.3, "learning_rate": 0.00029804700032501553, "loss": 0.0228, "step": 1496 }, { "epoch": 0.3, "learning_rate": 0.000298043881087749, "loss": 0.0305, "step": 1497 }, { "epoch": 0.31, "learning_rate": 0.00029804075937787017, "loss": 0.0264, "step": 1498 }, { "epoch": 0.31, "learning_rate": 0.00029803763519543127, "loss": 0.0283, "step": 1499 }, { "epoch": 0.31, "learning_rate": 0.0002980345085404844, "loss": 0.0353, "step": 1500 }, { "epoch": 0.31, "learning_rate": 0.00029803137941308177, "loss": 0.0166, "step": 1501 }, { "epoch": 0.31, "learning_rate": 0.00029802824781327575, "loss": 0.0422, "step": 1502 }, { "epoch": 0.31, "learning_rate": 0.00029802511374111846, "loss": 0.034, "step": 1503 }, { "epoch": 0.31, "learning_rate": 0.00029802197719666244, "loss": 0.0542, "step": 1504 }, { "epoch": 0.31, "learning_rate": 0.00029801883817996, "loss": 0.0132, "step": 1505 }, { "epoch": 0.31, "learning_rate": 0.0002980156966910635, "loss": 0.035, "step": 1506 }, { "epoch": 0.31, "learning_rate": 0.0002980125527300255, "loss": 0.025, "step": 1507 }, { "epoch": 0.31, "learning_rate": 0.00029800940629689843, "loss": 0.0503, "step": 1508 }, { "epoch": 0.31, "learning_rate": 0.00029800625739173495, "loss": 0.0536, "step": 1509 }, { "epoch": 0.31, "learning_rate": 0.0002980031060145876, "loss": 0.0111, "step": 1510 }, { "epoch": 0.31, "learning_rate": 0.00029799995216550895, "loss": 0.0048, "step": 1511 }, { "epoch": 0.31, "learning_rate": 0.00029799679584455174, "loss": 0.0303, "step": 1512 }, { "epoch": 0.31, "learning_rate": 0.0002979936370517687, "loss": 0.0299, "step": 1513 }, { "epoch": 0.31, "learning_rate": 0.0002979904757872125, "loss": 0.0225, "step": 1514 }, { "epoch": 0.31, "learning_rate": 0.0002979873120509361, "loss": 0.0215, "step": 1515 }, { "epoch": 0.31, "learning_rate": 0.0002979841458429922, "loss": 0.0042, "step": 1516 }, { "epoch": 0.31, "learning_rate": 0.0002979809771634337, "loss": 0.0071, "step": 1517 }, { "epoch": 0.31, "learning_rate": 0.00029797780601231353, "loss": 0.0482, "step": 1518 }, { "epoch": 0.31, "learning_rate": 0.00029797463238968473, "loss": 0.0393, "step": 1519 }, { "epoch": 0.31, "learning_rate": 0.0002979714562956002, "loss": 0.0562, "step": 1520 }, { "epoch": 0.31, "learning_rate": 0.00029796827773011307, "loss": 0.0258, "step": 1521 }, { "epoch": 0.31, "learning_rate": 0.00029796509669327635, "loss": 0.0647, "step": 1522 }, { "epoch": 0.31, "learning_rate": 0.00029796191318514324, "loss": 0.0259, "step": 1523 }, { "epoch": 0.31, "learning_rate": 0.0002979587272057669, "loss": 0.0136, "step": 1524 }, { "epoch": 0.31, "learning_rate": 0.0002979555387552005, "loss": 0.0164, "step": 1525 }, { "epoch": 0.31, "learning_rate": 0.00029795234783349734, "loss": 0.0154, "step": 1526 }, { "epoch": 0.31, "learning_rate": 0.0002979491544407107, "loss": 0.0256, "step": 1527 }, { "epoch": 0.31, "learning_rate": 0.00029794595857689384, "loss": 0.0067, "step": 1528 }, { "epoch": 0.31, "learning_rate": 0.0002979427602421002, "loss": 0.0022, "step": 1529 }, { "epoch": 0.31, "learning_rate": 0.0002979395594363833, "loss": 0.0664, "step": 1530 }, { "epoch": 0.31, "learning_rate": 0.0002979363561597964, "loss": 0.0213, "step": 1531 }, { "epoch": 0.31, "learning_rate": 0.0002979331504123932, "loss": 0.016, "step": 1532 }, { "epoch": 0.31, "learning_rate": 0.0002979299421942271, "loss": 0.0474, "step": 1533 }, { "epoch": 0.31, "learning_rate": 0.0002979267315053517, "loss": 0.0245, "step": 1534 }, { "epoch": 0.31, "learning_rate": 0.0002979235183458207, "loss": 0.1097, "step": 1535 }, { "epoch": 0.31, "learning_rate": 0.00029792030271568766, "loss": 0.0092, "step": 1536 }, { "epoch": 0.31, "learning_rate": 0.0002979170846150064, "loss": 0.0283, "step": 1537 }, { "epoch": 0.31, "learning_rate": 0.0002979138640438306, "loss": 0.0703, "step": 1538 }, { "epoch": 0.31, "learning_rate": 0.00029791064100221406, "loss": 0.022, "step": 1539 }, { "epoch": 0.31, "learning_rate": 0.0002979074154902106, "loss": 0.0399, "step": 1540 }, { "epoch": 0.31, "learning_rate": 0.0002979041875078741, "loss": 0.0532, "step": 1541 }, { "epoch": 0.31, "learning_rate": 0.00029790095705525853, "loss": 0.0081, "step": 1542 }, { "epoch": 0.31, "learning_rate": 0.00029789772413241775, "loss": 0.0297, "step": 1543 }, { "epoch": 0.31, "learning_rate": 0.00029789448873940576, "loss": 0.0081, "step": 1544 }, { "epoch": 0.31, "learning_rate": 0.0002978912508762767, "loss": 0.0109, "step": 1545 }, { "epoch": 0.31, "learning_rate": 0.0002978880105430846, "loss": 0.0364, "step": 1546 }, { "epoch": 0.31, "learning_rate": 0.00029788476773988354, "loss": 0.0206, "step": 1547 }, { "epoch": 0.32, "learning_rate": 0.0002978815224667277, "loss": 0.0434, "step": 1548 }, { "epoch": 0.32, "learning_rate": 0.0002978782747236713, "loss": 0.0036, "step": 1549 }, { "epoch": 0.32, "learning_rate": 0.00029787502451076854, "loss": 0.0161, "step": 1550 }, { "epoch": 0.32, "learning_rate": 0.0002978717718280738, "loss": 0.0148, "step": 1551 }, { "epoch": 0.32, "learning_rate": 0.0002978685166756413, "loss": 0.0128, "step": 1552 }, { "epoch": 0.32, "learning_rate": 0.00029786525905352545, "loss": 0.0154, "step": 1553 }, { "epoch": 0.32, "learning_rate": 0.00029786199896178066, "loss": 0.032, "step": 1554 }, { "epoch": 0.32, "learning_rate": 0.0002978587364004614, "loss": 0.0249, "step": 1555 }, { "epoch": 0.32, "learning_rate": 0.00029785547136962213, "loss": 0.0218, "step": 1556 }, { "epoch": 0.32, "learning_rate": 0.00029785220386931735, "loss": 0.0212, "step": 1557 }, { "epoch": 0.32, "learning_rate": 0.0002978489338996017, "loss": 0.0062, "step": 1558 }, { "epoch": 0.32, "learning_rate": 0.0002978456614605298, "loss": 0.0255, "step": 1559 }, { "epoch": 0.32, "learning_rate": 0.00029784238655215626, "loss": 0.0158, "step": 1560 }, { "epoch": 0.32, "learning_rate": 0.0002978391091745357, "loss": 0.0512, "step": 1561 }, { "epoch": 0.32, "learning_rate": 0.0002978358293277231, "loss": 0.0159, "step": 1562 }, { "epoch": 0.32, "learning_rate": 0.00029783254701177305, "loss": 0.0361, "step": 1563 }, { "epoch": 0.32, "learning_rate": 0.0002978292622267404, "loss": 0.0428, "step": 1564 }, { "epoch": 0.32, "learning_rate": 0.00029782597497267994, "loss": 0.0231, "step": 1565 }, { "epoch": 0.32, "learning_rate": 0.00029782268524964673, "loss": 0.0434, "step": 1566 }, { "epoch": 0.32, "learning_rate": 0.00029781939305769566, "loss": 0.0225, "step": 1567 }, { "epoch": 0.32, "learning_rate": 0.0002978160983968817, "loss": 0.046, "step": 1568 }, { "epoch": 0.32, "learning_rate": 0.00029781280126725985, "loss": 0.017, "step": 1569 }, { "epoch": 0.32, "learning_rate": 0.00029780950166888515, "loss": 0.0375, "step": 1570 }, { "epoch": 0.32, "learning_rate": 0.00029780619960181285, "loss": 0.0167, "step": 1571 }, { "epoch": 0.32, "learning_rate": 0.00029780289506609796, "loss": 0.0375, "step": 1572 }, { "epoch": 0.32, "learning_rate": 0.0002977995880617957, "loss": 0.0371, "step": 1573 }, { "epoch": 0.32, "learning_rate": 0.00029779627858896144, "loss": 0.0209, "step": 1574 }, { "epoch": 0.32, "learning_rate": 0.00029779296664765023, "loss": 0.0183, "step": 1575 }, { "epoch": 0.32, "learning_rate": 0.00029778965223791756, "loss": 0.0445, "step": 1576 }, { "epoch": 0.32, "learning_rate": 0.0002977863353598187, "loss": 0.0362, "step": 1577 }, { "epoch": 0.32, "learning_rate": 0.00029778301601340906, "loss": 0.0122, "step": 1578 }, { "epoch": 0.32, "learning_rate": 0.0002977796941987441, "loss": 0.0203, "step": 1579 }, { "epoch": 0.32, "learning_rate": 0.0002977763699158793, "loss": 0.0664, "step": 1580 }, { "epoch": 0.32, "learning_rate": 0.0002977730431648702, "loss": 0.0183, "step": 1581 }, { "epoch": 0.32, "learning_rate": 0.0002977697139457723, "loss": 0.0422, "step": 1582 }, { "epoch": 0.32, "learning_rate": 0.0002977663822586413, "loss": 0.0331, "step": 1583 }, { "epoch": 0.32, "learning_rate": 0.00029776304810353276, "loss": 0.0257, "step": 1584 }, { "epoch": 0.32, "learning_rate": 0.0002977597114805023, "loss": 0.0478, "step": 1585 }, { "epoch": 0.32, "learning_rate": 0.00029775637238960585, "loss": 0.0278, "step": 1586 }, { "epoch": 0.32, "learning_rate": 0.000297753030830899, "loss": 0.0227, "step": 1587 }, { "epoch": 0.32, "learning_rate": 0.0002977496868044377, "loss": 0.0164, "step": 1588 }, { "epoch": 0.32, "learning_rate": 0.0002977463403102777, "loss": 0.009, "step": 1589 }, { "epoch": 0.32, "learning_rate": 0.00029774299134847497, "loss": 0.0272, "step": 1590 }, { "epoch": 0.32, "learning_rate": 0.0002977396399190853, "loss": 0.0185, "step": 1591 }, { "epoch": 0.32, "learning_rate": 0.0002977362860221649, "loss": 0.0446, "step": 1592 }, { "epoch": 0.32, "learning_rate": 0.00029773292965776954, "loss": 0.0142, "step": 1593 }, { "epoch": 0.32, "learning_rate": 0.0002977295708259554, "loss": 0.0255, "step": 1594 }, { "epoch": 0.32, "learning_rate": 0.00029772620952677863, "loss": 0.0595, "step": 1595 }, { "epoch": 0.32, "learning_rate": 0.0002977228457602953, "loss": 0.0544, "step": 1596 }, { "epoch": 0.33, "learning_rate": 0.0002977194795265615, "loss": 0.0147, "step": 1597 }, { "epoch": 0.33, "learning_rate": 0.00029771611082563367, "loss": 0.0281, "step": 1598 }, { "epoch": 0.33, "learning_rate": 0.0002977127396575679, "loss": 0.0759, "step": 1599 }, { "epoch": 0.33, "learning_rate": 0.00029770936602242055, "loss": 0.0243, "step": 1600 }, { "epoch": 0.33, "learning_rate": 0.000297705989920248, "loss": 0.0217, "step": 1601 }, { "epoch": 0.33, "learning_rate": 0.00029770261135110657, "loss": 0.0103, "step": 1602 }, { "epoch": 0.33, "learning_rate": 0.00029769923031505274, "loss": 0.0097, "step": 1603 }, { "epoch": 0.33, "learning_rate": 0.0002976958468121429, "loss": 0.0354, "step": 1604 }, { "epoch": 0.33, "learning_rate": 0.0002976924608424337, "loss": 0.0256, "step": 1605 }, { "epoch": 0.33, "learning_rate": 0.0002976890724059816, "loss": 0.0298, "step": 1606 }, { "epoch": 0.33, "learning_rate": 0.0002976856815028432, "loss": 0.0184, "step": 1607 }, { "epoch": 0.33, "learning_rate": 0.0002976822881330751, "loss": 0.0078, "step": 1608 }, { "epoch": 0.33, "learning_rate": 0.00029767889229673406, "loss": 0.0145, "step": 1609 }, { "epoch": 0.33, "learning_rate": 0.0002976754939938768, "loss": 0.0253, "step": 1610 }, { "epoch": 0.33, "learning_rate": 0.00029767209322456, "loss": 0.0119, "step": 1611 }, { "epoch": 0.33, "learning_rate": 0.00029766868998884043, "loss": 0.0176, "step": 1612 }, { "epoch": 0.33, "learning_rate": 0.0002976652842867751, "loss": 0.0859, "step": 1613 }, { "epoch": 0.33, "learning_rate": 0.00029766187611842066, "loss": 0.0173, "step": 1614 }, { "epoch": 0.33, "learning_rate": 0.0002976584654838342, "loss": 0.0417, "step": 1615 }, { "epoch": 0.33, "learning_rate": 0.00029765505238307273, "loss": 0.0207, "step": 1616 }, { "epoch": 0.33, "learning_rate": 0.0002976516368161931, "loss": 0.0434, "step": 1617 }, { "epoch": 0.33, "learning_rate": 0.0002976482187832524, "loss": 0.0124, "step": 1618 }, { "epoch": 0.33, "learning_rate": 0.0002976447982843078, "loss": 0.0309, "step": 1619 }, { "epoch": 0.33, "learning_rate": 0.0002976413753194163, "loss": 0.0314, "step": 1620 }, { "epoch": 0.33, "learning_rate": 0.00029763794988863515, "loss": 0.0154, "step": 1621 }, { "epoch": 0.33, "learning_rate": 0.0002976345219920216, "loss": 0.0155, "step": 1622 }, { "epoch": 0.33, "learning_rate": 0.00029763109162963283, "loss": 0.0272, "step": 1623 }, { "epoch": 0.33, "learning_rate": 0.00029762765880152615, "loss": 0.0274, "step": 1624 }, { "epoch": 0.33, "learning_rate": 0.00029762422350775887, "loss": 0.0113, "step": 1625 }, { "epoch": 0.33, "learning_rate": 0.00029762078574838846, "loss": 0.0329, "step": 1626 }, { "epoch": 0.33, "learning_rate": 0.00029761734552347227, "loss": 0.0206, "step": 1627 }, { "epoch": 0.33, "learning_rate": 0.0002976139028330677, "loss": 0.0061, "step": 1628 }, { "epoch": 0.33, "learning_rate": 0.00029761045767723234, "loss": 0.0265, "step": 1629 }, { "epoch": 0.33, "learning_rate": 0.00029760701005602375, "loss": 0.0336, "step": 1630 }, { "epoch": 0.33, "learning_rate": 0.00029760355996949944, "loss": 0.025, "step": 1631 }, { "epoch": 0.33, "learning_rate": 0.00029760010741771705, "loss": 0.0149, "step": 1632 }, { "epoch": 0.33, "learning_rate": 0.0002975966524007342, "loss": 0.042, "step": 1633 }, { "epoch": 0.33, "learning_rate": 0.0002975931949186087, "loss": 0.008, "step": 1634 }, { "epoch": 0.33, "learning_rate": 0.00029758973497139826, "loss": 0.0166, "step": 1635 }, { "epoch": 0.33, "learning_rate": 0.0002975862725591606, "loss": 0.0373, "step": 1636 }, { "epoch": 0.33, "learning_rate": 0.0002975828076819536, "loss": 0.0078, "step": 1637 }, { "epoch": 0.33, "learning_rate": 0.00029757934033983516, "loss": 0.019, "step": 1638 }, { "epoch": 0.33, "learning_rate": 0.00029757587053286314, "loss": 0.0538, "step": 1639 }, { "epoch": 0.33, "learning_rate": 0.00029757239826109556, "loss": 0.0108, "step": 1640 }, { "epoch": 0.33, "learning_rate": 0.0002975689235245903, "loss": 0.028, "step": 1641 }, { "epoch": 0.33, "learning_rate": 0.0002975654463234055, "loss": 0.0065, "step": 1642 }, { "epoch": 0.33, "learning_rate": 0.0002975619666575992, "loss": 0.0295, "step": 1643 }, { "epoch": 0.33, "learning_rate": 0.0002975584845272295, "loss": 0.0229, "step": 1644 }, { "epoch": 0.33, "learning_rate": 0.0002975549999323546, "loss": 0.0127, "step": 1645 }, { "epoch": 0.34, "learning_rate": 0.00029755151287303263, "loss": 0.0396, "step": 1646 }, { "epoch": 0.34, "learning_rate": 0.0002975480233493219, "loss": 0.0316, "step": 1647 }, { "epoch": 0.34, "learning_rate": 0.00029754453136128067, "loss": 0.016, "step": 1648 }, { "epoch": 0.34, "learning_rate": 0.0002975410369089672, "loss": 0.0242, "step": 1649 }, { "epoch": 0.34, "learning_rate": 0.00029753753999243993, "loss": 0.0177, "step": 1650 }, { "epoch": 0.34, "learning_rate": 0.0002975340406117573, "loss": 0.0312, "step": 1651 }, { "epoch": 0.34, "learning_rate": 0.00029753053876697765, "loss": 0.0136, "step": 1652 }, { "epoch": 0.34, "learning_rate": 0.00029752703445815954, "loss": 0.0235, "step": 1653 }, { "epoch": 0.34, "learning_rate": 0.00029752352768536145, "loss": 0.0296, "step": 1654 }, { "epoch": 0.34, "learning_rate": 0.000297520018448642, "loss": 0.0263, "step": 1655 }, { "epoch": 0.34, "learning_rate": 0.0002975165067480598, "loss": 0.0248, "step": 1656 }, { "epoch": 0.34, "learning_rate": 0.00029751299258367345, "loss": 0.0106, "step": 1657 }, { "epoch": 0.34, "learning_rate": 0.0002975094759555417, "loss": 0.0533, "step": 1658 }, { "epoch": 0.34, "learning_rate": 0.00029750595686372323, "loss": 0.0178, "step": 1659 }, { "epoch": 0.34, "learning_rate": 0.00029750243530827684, "loss": 0.0355, "step": 1660 }, { "epoch": 0.34, "learning_rate": 0.0002974989112892614, "loss": 0.0144, "step": 1661 }, { "epoch": 0.34, "learning_rate": 0.0002974953848067356, "loss": 0.0049, "step": 1662 }, { "epoch": 0.34, "learning_rate": 0.0002974918558607586, "loss": 0.0223, "step": 1663 }, { "epoch": 0.34, "learning_rate": 0.00029748832445138914, "loss": 0.0097, "step": 1664 }, { "epoch": 0.34, "learning_rate": 0.0002974847905786862, "loss": 0.0277, "step": 1665 }, { "epoch": 0.34, "learning_rate": 0.00029748125424270896, "loss": 0.0231, "step": 1666 }, { "epoch": 0.34, "learning_rate": 0.0002974777154435163, "loss": 0.0177, "step": 1667 }, { "epoch": 0.34, "learning_rate": 0.0002974741741811674, "loss": 0.0542, "step": 1668 }, { "epoch": 0.34, "learning_rate": 0.00029747063045572147, "loss": 0.0449, "step": 1669 }, { "epoch": 0.34, "learning_rate": 0.00029746708426723765, "loss": 0.0146, "step": 1670 }, { "epoch": 0.34, "learning_rate": 0.00029746353561577513, "loss": 0.0321, "step": 1671 }, { "epoch": 0.34, "learning_rate": 0.00029745998450139325, "loss": 0.0177, "step": 1672 }, { "epoch": 0.34, "learning_rate": 0.0002974564309241512, "loss": 0.0313, "step": 1673 }, { "epoch": 0.34, "learning_rate": 0.00029745287488410843, "loss": 0.0424, "step": 1674 }, { "epoch": 0.34, "learning_rate": 0.0002974493163813244, "loss": 0.0131, "step": 1675 }, { "epoch": 0.34, "learning_rate": 0.00029744575541585836, "loss": 0.0187, "step": 1676 }, { "epoch": 0.34, "learning_rate": 0.0002974421919877699, "loss": 0.0378, "step": 1677 }, { "epoch": 0.34, "learning_rate": 0.0002974386260971185, "loss": 0.0134, "step": 1678 }, { "epoch": 0.34, "learning_rate": 0.0002974350577439638, "loss": 0.0082, "step": 1679 }, { "epoch": 0.34, "learning_rate": 0.00029743148692836527, "loss": 0.027, "step": 1680 }, { "epoch": 0.34, "learning_rate": 0.00029742791365038263, "loss": 0.0092, "step": 1681 }, { "epoch": 0.34, "learning_rate": 0.0002974243379100756, "loss": 0.0192, "step": 1682 }, { "epoch": 0.34, "learning_rate": 0.0002974207597075038, "loss": 0.0253, "step": 1683 }, { "epoch": 0.34, "learning_rate": 0.000297417179042727, "loss": 0.0092, "step": 1684 }, { "epoch": 0.34, "learning_rate": 0.00029741359591580504, "loss": 0.0101, "step": 1685 }, { "epoch": 0.34, "learning_rate": 0.0002974100103267978, "loss": 0.0228, "step": 1686 }, { "epoch": 0.34, "learning_rate": 0.00029740642227576514, "loss": 0.0293, "step": 1687 }, { "epoch": 0.34, "learning_rate": 0.00029740283176276695, "loss": 0.0498, "step": 1688 }, { "epoch": 0.34, "learning_rate": 0.0002973992387878633, "loss": 0.0321, "step": 1689 }, { "epoch": 0.34, "learning_rate": 0.000297395643351114, "loss": 0.0504, "step": 1690 }, { "epoch": 0.34, "learning_rate": 0.0002973920454525793, "loss": 0.016, "step": 1691 }, { "epoch": 0.34, "learning_rate": 0.0002973884450923193, "loss": 0.0241, "step": 1692 }, { "epoch": 0.34, "learning_rate": 0.00029738484227039393, "loss": 0.0182, "step": 1693 }, { "epoch": 0.34, "learning_rate": 0.00029738123698686345, "loss": 0.062, "step": 1694 }, { "epoch": 0.35, "learning_rate": 0.0002973776292417882, "loss": 0.0212, "step": 1695 }, { "epoch": 0.35, "learning_rate": 0.00029737401903522835, "loss": 0.0029, "step": 1696 }, { "epoch": 0.35, "learning_rate": 0.0002973704063672442, "loss": 0.0936, "step": 1697 }, { "epoch": 0.35, "learning_rate": 0.00029736679123789603, "loss": 0.0266, "step": 1698 }, { "epoch": 0.35, "learning_rate": 0.0002973631736472443, "loss": 0.0236, "step": 1699 }, { "epoch": 0.35, "learning_rate": 0.0002973595535953494, "loss": 0.0142, "step": 1700 }, { "epoch": 0.35, "learning_rate": 0.0002973559310822718, "loss": 0.0302, "step": 1701 }, { "epoch": 0.35, "learning_rate": 0.00029735230610807196, "loss": 0.0215, "step": 1702 }, { "epoch": 0.35, "learning_rate": 0.0002973486786728105, "loss": 0.0473, "step": 1703 }, { "epoch": 0.35, "learning_rate": 0.000297345048776548, "loss": 0.0091, "step": 1704 }, { "epoch": 0.35, "learning_rate": 0.00029734141641934493, "loss": 0.0395, "step": 1705 }, { "epoch": 0.35, "learning_rate": 0.0002973377816012622, "loss": 0.0325, "step": 1706 }, { "epoch": 0.35, "learning_rate": 0.00029733414432236033, "loss": 0.0212, "step": 1707 }, { "epoch": 0.35, "learning_rate": 0.00029733050458270017, "loss": 0.0346, "step": 1708 }, { "epoch": 0.35, "learning_rate": 0.0002973268623823425, "loss": 0.0057, "step": 1709 }, { "epoch": 0.35, "learning_rate": 0.00029732321772134806, "loss": 0.0229, "step": 1710 }, { "epoch": 0.35, "learning_rate": 0.0002973195705997778, "loss": 0.0296, "step": 1711 }, { "epoch": 0.35, "learning_rate": 0.0002973159210176927, "loss": 0.0296, "step": 1712 }, { "epoch": 0.35, "learning_rate": 0.0002973122689751536, "loss": 0.0562, "step": 1713 }, { "epoch": 0.35, "learning_rate": 0.0002973086144722215, "loss": 0.0406, "step": 1714 }, { "epoch": 0.35, "learning_rate": 0.00029730495750895756, "loss": 0.0594, "step": 1715 }, { "epoch": 0.35, "learning_rate": 0.0002973012980854227, "loss": 0.0226, "step": 1716 }, { "epoch": 0.35, "learning_rate": 0.0002972976362016781, "loss": 0.0229, "step": 1717 }, { "epoch": 0.35, "learning_rate": 0.00029729397185778496, "loss": 0.0223, "step": 1718 }, { "epoch": 0.35, "learning_rate": 0.0002972903050538045, "loss": 0.0261, "step": 1719 }, { "epoch": 0.35, "learning_rate": 0.00029728663578979783, "loss": 0.0555, "step": 1720 }, { "epoch": 0.35, "learning_rate": 0.0002972829640658264, "loss": 0.0392, "step": 1721 }, { "epoch": 0.35, "learning_rate": 0.00029727928988195135, "loss": 0.017, "step": 1722 }, { "epoch": 0.35, "learning_rate": 0.00029727561323823423, "loss": 0.0094, "step": 1723 }, { "epoch": 0.35, "learning_rate": 0.00029727193413473635, "loss": 0.0143, "step": 1724 }, { "epoch": 0.35, "learning_rate": 0.00029726825257151915, "loss": 0.0199, "step": 1725 }, { "epoch": 0.35, "learning_rate": 0.0002972645685486442, "loss": 0.021, "step": 1726 }, { "epoch": 0.35, "learning_rate": 0.0002972608820661729, "loss": 0.0303, "step": 1727 }, { "epoch": 0.35, "learning_rate": 0.000297257193124167, "loss": 0.0175, "step": 1728 }, { "epoch": 0.35, "learning_rate": 0.0002972535017226879, "loss": 0.0511, "step": 1729 }, { "epoch": 0.35, "learning_rate": 0.0002972498078617974, "loss": 0.0167, "step": 1730 }, { "epoch": 0.35, "learning_rate": 0.00029724611154155717, "loss": 0.0575, "step": 1731 }, { "epoch": 0.35, "learning_rate": 0.0002972424127620289, "loss": 0.0379, "step": 1732 }, { "epoch": 0.35, "learning_rate": 0.00029723871152327445, "loss": 0.0417, "step": 1733 }, { "epoch": 0.35, "learning_rate": 0.00029723500782535557, "loss": 0.0204, "step": 1734 }, { "epoch": 0.35, "learning_rate": 0.00029723130166833404, "loss": 0.0158, "step": 1735 }, { "epoch": 0.35, "learning_rate": 0.00029722759305227196, "loss": 0.0368, "step": 1736 }, { "epoch": 0.35, "learning_rate": 0.00029722388197723115, "loss": 0.0165, "step": 1737 }, { "epoch": 0.35, "learning_rate": 0.00029722016844327355, "loss": 0.0167, "step": 1738 }, { "epoch": 0.35, "learning_rate": 0.00029721645245046126, "loss": 0.0042, "step": 1739 }, { "epoch": 0.35, "learning_rate": 0.00029721273399885636, "loss": 0.0682, "step": 1740 }, { "epoch": 0.35, "learning_rate": 0.00029720901308852093, "loss": 0.0282, "step": 1741 }, { "epoch": 0.35, "learning_rate": 0.000297205289719517, "loss": 0.0268, "step": 1742 }, { "epoch": 0.35, "learning_rate": 0.000297201563891907, "loss": 0.0285, "step": 1743 }, { "epoch": 0.36, "learning_rate": 0.0002971978356057529, "loss": 0.0153, "step": 1744 }, { "epoch": 0.36, "learning_rate": 0.00029719410486111716, "loss": 0.0325, "step": 1745 }, { "epoch": 0.36, "learning_rate": 0.000297190371658062, "loss": 0.0164, "step": 1746 }, { "epoch": 0.36, "learning_rate": 0.0002971866359966498, "loss": 0.0348, "step": 1747 }, { "epoch": 0.36, "learning_rate": 0.00029718289787694294, "loss": 0.0217, "step": 1748 }, { "epoch": 0.36, "learning_rate": 0.0002971791572990039, "loss": 0.0079, "step": 1749 }, { "epoch": 0.36, "learning_rate": 0.00029717541426289504, "loss": 0.0734, "step": 1750 }, { "epoch": 0.36, "learning_rate": 0.000297171668768679, "loss": 0.0463, "step": 1751 }, { "epoch": 0.36, "learning_rate": 0.00029716792081641827, "loss": 0.0374, "step": 1752 }, { "epoch": 0.36, "learning_rate": 0.00029716417040617543, "loss": 0.0328, "step": 1753 }, { "epoch": 0.36, "learning_rate": 0.0002971604175380132, "loss": 0.0193, "step": 1754 }, { "epoch": 0.36, "learning_rate": 0.00029715666221199414, "loss": 0.034, "step": 1755 }, { "epoch": 0.36, "learning_rate": 0.00029715290442818113, "loss": 0.0358, "step": 1756 }, { "epoch": 0.36, "learning_rate": 0.00029714914418663683, "loss": 0.0299, "step": 1757 }, { "epoch": 0.36, "learning_rate": 0.000297145381487424, "loss": 0.0801, "step": 1758 }, { "epoch": 0.36, "learning_rate": 0.0002971416163306056, "loss": 0.0126, "step": 1759 }, { "epoch": 0.36, "learning_rate": 0.00029713784871624447, "loss": 0.0489, "step": 1760 }, { "epoch": 0.36, "learning_rate": 0.0002971340786444035, "loss": 0.0133, "step": 1761 }, { "epoch": 0.36, "learning_rate": 0.00029713030611514565, "loss": 0.0115, "step": 1762 }, { "epoch": 0.36, "learning_rate": 0.00029712653112853404, "loss": 0.0352, "step": 1763 }, { "epoch": 0.36, "learning_rate": 0.00029712275368463156, "loss": 0.0381, "step": 1764 }, { "epoch": 0.36, "learning_rate": 0.0002971189737835014, "loss": 0.0134, "step": 1765 }, { "epoch": 0.36, "learning_rate": 0.00029711519142520666, "loss": 0.0305, "step": 1766 }, { "epoch": 0.36, "learning_rate": 0.0002971114066098105, "loss": 0.0106, "step": 1767 }, { "epoch": 0.36, "learning_rate": 0.00029710761933737627, "loss": 0.0227, "step": 1768 }, { "epoch": 0.36, "learning_rate": 0.000297103829607967, "loss": 0.0055, "step": 1769 }, { "epoch": 0.36, "learning_rate": 0.00029710003742164614, "loss": 0.0431, "step": 1770 }, { "epoch": 0.36, "learning_rate": 0.000297096242778477, "loss": 0.0171, "step": 1771 }, { "epoch": 0.36, "learning_rate": 0.0002970924456785229, "loss": 0.0086, "step": 1772 }, { "epoch": 0.36, "learning_rate": 0.0002970886461218473, "loss": 0.0214, "step": 1773 }, { "epoch": 0.36, "learning_rate": 0.0002970848441085137, "loss": 0.0306, "step": 1774 }, { "epoch": 0.36, "learning_rate": 0.00029708103963858553, "loss": 0.0301, "step": 1775 }, { "epoch": 0.36, "learning_rate": 0.0002970772327121264, "loss": 0.0502, "step": 1776 }, { "epoch": 0.36, "learning_rate": 0.0002970734233291998, "loss": 0.0674, "step": 1777 }, { "epoch": 0.36, "learning_rate": 0.00029706961148986944, "loss": 0.0315, "step": 1778 }, { "epoch": 0.36, "learning_rate": 0.000297065797194199, "loss": 0.0087, "step": 1779 }, { "epoch": 0.36, "learning_rate": 0.00029706198044225206, "loss": 0.0291, "step": 1780 }, { "epoch": 0.36, "learning_rate": 0.0002970581612340925, "loss": 0.0386, "step": 1781 }, { "epoch": 0.36, "learning_rate": 0.000297054339569784, "loss": 0.0156, "step": 1782 }, { "epoch": 0.36, "learning_rate": 0.0002970505154493905, "loss": 0.0065, "step": 1783 }, { "epoch": 0.36, "learning_rate": 0.0002970466888729758, "loss": 0.0555, "step": 1784 }, { "epoch": 0.36, "learning_rate": 0.00029704285984060385, "loss": 0.0242, "step": 1785 }, { "epoch": 0.36, "learning_rate": 0.00029703902835233857, "loss": 0.0789, "step": 1786 }, { "epoch": 0.36, "learning_rate": 0.0002970351944082439, "loss": 0.0428, "step": 1787 }, { "epoch": 0.36, "learning_rate": 0.00029703135800838396, "loss": 0.0176, "step": 1788 }, { "epoch": 0.36, "learning_rate": 0.00029702751915282284, "loss": 0.0196, "step": 1789 }, { "epoch": 0.36, "learning_rate": 0.0002970236778416246, "loss": 0.0548, "step": 1790 }, { "epoch": 0.36, "learning_rate": 0.00029701983407485344, "loss": 0.0098, "step": 1791 }, { "epoch": 0.36, "learning_rate": 0.0002970159878525735, "loss": 0.0104, "step": 1792 }, { "epoch": 0.37, "learning_rate": 0.00029701213917484904, "loss": 0.0844, "step": 1793 }, { "epoch": 0.37, "learning_rate": 0.00029700828804174435, "loss": 0.0219, "step": 1794 }, { "epoch": 0.37, "learning_rate": 0.00029700443445332376, "loss": 0.0183, "step": 1795 }, { "epoch": 0.37, "learning_rate": 0.0002970005784096516, "loss": 0.025, "step": 1796 }, { "epoch": 0.37, "learning_rate": 0.00029699671991079233, "loss": 0.0332, "step": 1797 }, { "epoch": 0.37, "learning_rate": 0.00029699285895681035, "loss": 0.0542, "step": 1798 }, { "epoch": 0.37, "learning_rate": 0.0002969889955477702, "loss": 0.0171, "step": 1799 }, { "epoch": 0.37, "learning_rate": 0.0002969851296837363, "loss": 0.0165, "step": 1800 }, { "epoch": 0.37, "learning_rate": 0.0002969812613647733, "loss": 0.0303, "step": 1801 }, { "epoch": 0.37, "learning_rate": 0.0002969773905909458, "loss": 0.0486, "step": 1802 }, { "epoch": 0.37, "learning_rate": 0.0002969735173623184, "loss": 0.0259, "step": 1803 }, { "epoch": 0.37, "learning_rate": 0.00029696964167895586, "loss": 0.0089, "step": 1804 }, { "epoch": 0.37, "learning_rate": 0.00029696576354092287, "loss": 0.0165, "step": 1805 }, { "epoch": 0.37, "learning_rate": 0.00029696188294828425, "loss": 0.0693, "step": 1806 }, { "epoch": 0.37, "learning_rate": 0.0002969579999011047, "loss": 0.0104, "step": 1807 }, { "epoch": 0.37, "learning_rate": 0.0002969541143994492, "loss": 0.0208, "step": 1808 }, { "epoch": 0.37, "learning_rate": 0.00029695022644338263, "loss": 0.0444, "step": 1809 }, { "epoch": 0.37, "learning_rate": 0.0002969463360329698, "loss": 0.0347, "step": 1810 }, { "epoch": 0.37, "learning_rate": 0.00029694244316827586, "loss": 0.0542, "step": 1811 }, { "epoch": 0.37, "learning_rate": 0.0002969385478493657, "loss": 0.0564, "step": 1812 }, { "epoch": 0.37, "learning_rate": 0.0002969346500763044, "loss": 0.0173, "step": 1813 }, { "epoch": 0.37, "learning_rate": 0.00029693074984915715, "loss": 0.0277, "step": 1814 }, { "epoch": 0.37, "learning_rate": 0.00029692684716798895, "loss": 0.0199, "step": 1815 }, { "epoch": 0.37, "learning_rate": 0.00029692294203286515, "loss": 0.0343, "step": 1816 }, { "epoch": 0.37, "learning_rate": 0.0002969190344438508, "loss": 0.0152, "step": 1817 }, { "epoch": 0.37, "learning_rate": 0.00029691512440101133, "loss": 0.0338, "step": 1818 }, { "epoch": 0.37, "learning_rate": 0.0002969112119044119, "loss": 0.0165, "step": 1819 }, { "epoch": 0.37, "learning_rate": 0.00029690729695411793, "loss": 0.0091, "step": 1820 }, { "epoch": 0.37, "learning_rate": 0.00029690337955019477, "loss": 0.0415, "step": 1821 }, { "epoch": 0.37, "learning_rate": 0.0002968994596927079, "loss": 0.0141, "step": 1822 }, { "epoch": 0.37, "learning_rate": 0.00029689553738172276, "loss": 0.031, "step": 1823 }, { "epoch": 0.37, "learning_rate": 0.0002968916126173048, "loss": 0.0183, "step": 1824 }, { "epoch": 0.37, "learning_rate": 0.0002968876853995197, "loss": 0.0446, "step": 1825 }, { "epoch": 0.37, "learning_rate": 0.00029688375572843297, "loss": 0.0205, "step": 1826 }, { "epoch": 0.37, "learning_rate": 0.0002968798236041103, "loss": 0.0058, "step": 1827 }, { "epoch": 0.37, "learning_rate": 0.00029687588902661724, "loss": 0.0215, "step": 1828 }, { "epoch": 0.37, "learning_rate": 0.0002968719519960196, "loss": 0.0328, "step": 1829 }, { "epoch": 0.37, "learning_rate": 0.00029686801251238316, "loss": 0.0162, "step": 1830 }, { "epoch": 0.37, "learning_rate": 0.00029686407057577367, "loss": 0.0415, "step": 1831 }, { "epoch": 0.37, "learning_rate": 0.00029686012618625695, "loss": 0.0252, "step": 1832 }, { "epoch": 0.37, "learning_rate": 0.0002968561793438989, "loss": 0.0134, "step": 1833 }, { "epoch": 0.37, "learning_rate": 0.00029685223004876553, "loss": 0.0559, "step": 1834 }, { "epoch": 0.37, "learning_rate": 0.0002968482783009226, "loss": 0.0161, "step": 1835 }, { "epoch": 0.37, "learning_rate": 0.0002968443241004363, "loss": 0.0023, "step": 1836 }, { "epoch": 0.37, "learning_rate": 0.0002968403674473726, "loss": 0.0238, "step": 1837 }, { "epoch": 0.37, "learning_rate": 0.0002968364083417975, "loss": 0.0127, "step": 1838 }, { "epoch": 0.37, "learning_rate": 0.0002968324467837773, "loss": 0.0318, "step": 1839 }, { "epoch": 0.37, "learning_rate": 0.00029682848277337804, "loss": 0.0176, "step": 1840 }, { "epoch": 0.37, "learning_rate": 0.000296824516310666, "loss": 0.031, "step": 1841 }, { "epoch": 0.38, "learning_rate": 0.00029682054739570726, "loss": 0.0158, "step": 1842 }, { "epoch": 0.38, "learning_rate": 0.00029681657602856836, "loss": 0.0169, "step": 1843 }, { "epoch": 0.38, "learning_rate": 0.00029681260220931543, "loss": 0.0148, "step": 1844 }, { "epoch": 0.38, "learning_rate": 0.000296808625938015, "loss": 0.031, "step": 1845 }, { "epoch": 0.38, "learning_rate": 0.0002968046472147333, "loss": 0.0499, "step": 1846 }, { "epoch": 0.38, "learning_rate": 0.00029680066603953695, "loss": 0.0712, "step": 1847 }, { "epoch": 0.38, "learning_rate": 0.00029679668241249234, "loss": 0.0242, "step": 1848 }, { "epoch": 0.38, "learning_rate": 0.00029679269633366606, "loss": 0.0081, "step": 1849 }, { "epoch": 0.38, "learning_rate": 0.00029678870780312463, "loss": 0.0205, "step": 1850 }, { "epoch": 0.38, "learning_rate": 0.0002967847168209347, "loss": 0.0427, "step": 1851 }, { "epoch": 0.38, "learning_rate": 0.0002967807233871629, "loss": 0.0441, "step": 1852 }, { "epoch": 0.38, "learning_rate": 0.00029677672750187597, "loss": 0.0123, "step": 1853 }, { "epoch": 0.38, "learning_rate": 0.0002967727291651407, "loss": 0.0159, "step": 1854 }, { "epoch": 0.38, "learning_rate": 0.0002967687283770237, "loss": 0.0183, "step": 1855 }, { "epoch": 0.38, "learning_rate": 0.00029676472513759193, "loss": 0.0232, "step": 1856 }, { "epoch": 0.38, "learning_rate": 0.0002967607194469122, "loss": 0.0409, "step": 1857 }, { "epoch": 0.38, "learning_rate": 0.00029675671130505144, "loss": 0.0072, "step": 1858 }, { "epoch": 0.38, "learning_rate": 0.0002967527007120766, "loss": 0.0434, "step": 1859 }, { "epoch": 0.38, "learning_rate": 0.0002967486876680546, "loss": 0.015, "step": 1860 }, { "epoch": 0.38, "learning_rate": 0.00029674467217305256, "loss": 0.0269, "step": 1861 }, { "epoch": 0.38, "learning_rate": 0.00029674065422713745, "loss": 0.0189, "step": 1862 }, { "epoch": 0.38, "learning_rate": 0.00029673663383037645, "loss": 0.0433, "step": 1863 }, { "epoch": 0.38, "learning_rate": 0.00029673261098283666, "loss": 0.0838, "step": 1864 }, { "epoch": 0.38, "learning_rate": 0.00029672858568458526, "loss": 0.0249, "step": 1865 }, { "epoch": 0.38, "learning_rate": 0.00029672455793568957, "loss": 0.0131, "step": 1866 }, { "epoch": 0.38, "learning_rate": 0.00029672052773621675, "loss": 0.0289, "step": 1867 }, { "epoch": 0.38, "learning_rate": 0.0002967164950862342, "loss": 0.0109, "step": 1868 }, { "epoch": 0.38, "learning_rate": 0.0002967124599858092, "loss": 0.0341, "step": 1869 }, { "epoch": 0.38, "learning_rate": 0.00029670842243500925, "loss": 0.0102, "step": 1870 }, { "epoch": 0.38, "learning_rate": 0.00029670438243390167, "loss": 0.0174, "step": 1871 }, { "epoch": 0.38, "learning_rate": 0.00029670033998255394, "loss": 0.0064, "step": 1872 }, { "epoch": 0.38, "learning_rate": 0.00029669629508103366, "loss": 0.0107, "step": 1873 }, { "epoch": 0.38, "learning_rate": 0.0002966922477294083, "loss": 0.0081, "step": 1874 }, { "epoch": 0.38, "learning_rate": 0.0002966881979277455, "loss": 0.0338, "step": 1875 }, { "epoch": 0.38, "learning_rate": 0.00029668414567611296, "loss": 0.0139, "step": 1876 }, { "epoch": 0.38, "learning_rate": 0.00029668009097457825, "loss": 0.0433, "step": 1877 }, { "epoch": 0.38, "learning_rate": 0.0002966760338232092, "loss": 0.0552, "step": 1878 }, { "epoch": 0.38, "learning_rate": 0.0002966719742220735, "loss": 0.0139, "step": 1879 }, { "epoch": 0.38, "learning_rate": 0.00029666791217123896, "loss": 0.0037, "step": 1880 }, { "epoch": 0.38, "learning_rate": 0.0002966638476707734, "loss": 0.0332, "step": 1881 }, { "epoch": 0.38, "learning_rate": 0.00029665978072074473, "loss": 0.0366, "step": 1882 }, { "epoch": 0.38, "learning_rate": 0.0002966557113212209, "loss": 0.0171, "step": 1883 }, { "epoch": 0.38, "learning_rate": 0.0002966516394722699, "loss": 0.0158, "step": 1884 }, { "epoch": 0.38, "learning_rate": 0.00029664756517395964, "loss": 0.0162, "step": 1885 }, { "epoch": 0.38, "learning_rate": 0.00029664348842635825, "loss": 0.0222, "step": 1886 }, { "epoch": 0.38, "learning_rate": 0.0002966394092295338, "loss": 0.0297, "step": 1887 }, { "epoch": 0.38, "learning_rate": 0.0002966353275835544, "loss": 0.0084, "step": 1888 }, { "epoch": 0.38, "learning_rate": 0.00029663124348848827, "loss": 0.0247, "step": 1889 }, { "epoch": 0.38, "learning_rate": 0.00029662715694440354, "loss": 0.0115, "step": 1890 }, { "epoch": 0.39, "learning_rate": 0.00029662306795136847, "loss": 0.009, "step": 1891 }, { "epoch": 0.39, "learning_rate": 0.0002966189765094515, "loss": 0.0132, "step": 1892 }, { "epoch": 0.39, "learning_rate": 0.00029661488261872084, "loss": 0.0361, "step": 1893 }, { "epoch": 0.39, "learning_rate": 0.0002966107862792449, "loss": 0.0623, "step": 1894 }, { "epoch": 0.39, "learning_rate": 0.000296606687491092, "loss": 0.0133, "step": 1895 }, { "epoch": 0.39, "learning_rate": 0.0002966025862543307, "loss": 0.0168, "step": 1896 }, { "epoch": 0.39, "learning_rate": 0.00029659848256902946, "loss": 0.0376, "step": 1897 }, { "epoch": 0.39, "learning_rate": 0.0002965943764352569, "loss": 0.0198, "step": 1898 }, { "epoch": 0.39, "learning_rate": 0.0002965902678530815, "loss": 0.0281, "step": 1899 }, { "epoch": 0.39, "learning_rate": 0.00029658615682257196, "loss": 0.0277, "step": 1900 }, { "epoch": 0.39, "learning_rate": 0.00029658204334379685, "loss": 0.0501, "step": 1901 }, { "epoch": 0.39, "learning_rate": 0.00029657792741682494, "loss": 0.0131, "step": 1902 }, { "epoch": 0.39, "learning_rate": 0.000296573809041725, "loss": 0.0338, "step": 1903 }, { "epoch": 0.39, "learning_rate": 0.0002965696882185657, "loss": 0.012, "step": 1904 }, { "epoch": 0.39, "learning_rate": 0.000296565564947416, "loss": 0.0051, "step": 1905 }, { "epoch": 0.39, "learning_rate": 0.00029656143922834465, "loss": 0.0278, "step": 1906 }, { "epoch": 0.39, "learning_rate": 0.0002965573110614206, "loss": 0.0793, "step": 1907 }, { "epoch": 0.39, "learning_rate": 0.0002965531804467129, "loss": 0.0251, "step": 1908 }, { "epoch": 0.39, "learning_rate": 0.00029654904738429035, "loss": 0.0085, "step": 1909 }, { "epoch": 0.39, "learning_rate": 0.0002965449118742221, "loss": 0.0454, "step": 1910 }, { "epoch": 0.39, "learning_rate": 0.00029654077391657723, "loss": 0.025, "step": 1911 }, { "epoch": 0.39, "learning_rate": 0.00029653663351142476, "loss": 0.0273, "step": 1912 }, { "epoch": 0.39, "learning_rate": 0.000296532490658834, "loss": 0.02, "step": 1913 }, { "epoch": 0.39, "learning_rate": 0.000296528345358874, "loss": 0.0199, "step": 1914 }, { "epoch": 0.39, "learning_rate": 0.000296524197611614, "loss": 0.0193, "step": 1915 }, { "epoch": 0.39, "learning_rate": 0.0002965200474171234, "loss": 0.0201, "step": 1916 }, { "epoch": 0.39, "learning_rate": 0.00029651589477547134, "loss": 0.0131, "step": 1917 }, { "epoch": 0.39, "learning_rate": 0.0002965117396867273, "loss": 0.0068, "step": 1918 }, { "epoch": 0.39, "learning_rate": 0.0002965075821509607, "loss": 0.0495, "step": 1919 }, { "epoch": 0.39, "learning_rate": 0.0002965034221682409, "loss": 0.02, "step": 1920 }, { "epoch": 0.39, "learning_rate": 0.00029649925973863737, "loss": 0.0129, "step": 1921 }, { "epoch": 0.39, "learning_rate": 0.00029649509486221967, "loss": 0.0229, "step": 1922 }, { "epoch": 0.39, "learning_rate": 0.00029649092753905734, "loss": 0.0112, "step": 1923 }, { "epoch": 0.39, "learning_rate": 0.00029648675776922003, "loss": 0.0117, "step": 1924 }, { "epoch": 0.39, "learning_rate": 0.00029648258555277737, "loss": 0.0551, "step": 1925 }, { "epoch": 0.39, "learning_rate": 0.000296478410889799, "loss": 0.0199, "step": 1926 }, { "epoch": 0.39, "learning_rate": 0.0002964742337803547, "loss": 0.0439, "step": 1927 }, { "epoch": 0.39, "learning_rate": 0.00029647005422451416, "loss": 0.0073, "step": 1928 }, { "epoch": 0.39, "learning_rate": 0.0002964658722223473, "loss": 0.0366, "step": 1929 }, { "epoch": 0.39, "learning_rate": 0.00029646168777392384, "loss": 0.0168, "step": 1930 }, { "epoch": 0.39, "learning_rate": 0.0002964575008793137, "loss": 0.0852, "step": 1931 }, { "epoch": 0.39, "learning_rate": 0.00029645331153858694, "loss": 0.009, "step": 1932 }, { "epoch": 0.39, "learning_rate": 0.00029644911975181334, "loss": 0.0159, "step": 1933 }, { "epoch": 0.39, "learning_rate": 0.000296444925519063, "loss": 0.0167, "step": 1934 }, { "epoch": 0.39, "learning_rate": 0.00029644072884040597, "loss": 0.0327, "step": 1935 }, { "epoch": 0.39, "learning_rate": 0.00029643652971591243, "loss": 0.0219, "step": 1936 }, { "epoch": 0.39, "learning_rate": 0.00029643232814565237, "loss": 0.0324, "step": 1937 }, { "epoch": 0.39, "learning_rate": 0.000296428124129696, "loss": 0.0307, "step": 1938 }, { "epoch": 0.39, "learning_rate": 0.00029642391766811357, "loss": 0.0381, "step": 1939 }, { "epoch": 0.4, "learning_rate": 0.0002964197087609753, "loss": 0.0098, "step": 1940 }, { "epoch": 0.4, "learning_rate": 0.0002964154974083515, "loss": 0.0089, "step": 1941 }, { "epoch": 0.4, "learning_rate": 0.00029641128361031254, "loss": 0.0117, "step": 1942 }, { "epoch": 0.4, "learning_rate": 0.00029640706736692876, "loss": 0.0327, "step": 1943 }, { "epoch": 0.4, "learning_rate": 0.00029640284867827064, "loss": 0.0555, "step": 1944 }, { "epoch": 0.4, "learning_rate": 0.00029639862754440855, "loss": 0.0215, "step": 1945 }, { "epoch": 0.4, "learning_rate": 0.00029639440396541305, "loss": 0.0127, "step": 1946 }, { "epoch": 0.4, "learning_rate": 0.00029639017794135463, "loss": 0.0205, "step": 1947 }, { "epoch": 0.4, "learning_rate": 0.000296385949472304, "loss": 0.0373, "step": 1948 }, { "epoch": 0.4, "learning_rate": 0.00029638171855833156, "loss": 0.0081, "step": 1949 }, { "epoch": 0.4, "learning_rate": 0.0002963774851995082, "loss": 0.0232, "step": 1950 }, { "epoch": 0.4, "learning_rate": 0.00029637324939590443, "loss": 0.0188, "step": 1951 }, { "epoch": 0.4, "learning_rate": 0.0002963690111475912, "loss": 0.0223, "step": 1952 }, { "epoch": 0.4, "learning_rate": 0.00029636477045463913, "loss": 0.0121, "step": 1953 }, { "epoch": 0.4, "learning_rate": 0.00029636052731711913, "loss": 0.0353, "step": 1954 }, { "epoch": 0.4, "learning_rate": 0.00029635628173510205, "loss": 0.0196, "step": 1955 }, { "epoch": 0.4, "learning_rate": 0.00029635203370865885, "loss": 0.0442, "step": 1956 }, { "epoch": 0.4, "learning_rate": 0.00029634778323786034, "loss": 0.0172, "step": 1957 }, { "epoch": 0.4, "learning_rate": 0.0002963435303227777, "loss": 0.0082, "step": 1958 }, { "epoch": 0.4, "learning_rate": 0.00029633927496348174, "loss": 0.0191, "step": 1959 }, { "epoch": 0.4, "learning_rate": 0.00029633501716004373, "loss": 0.0305, "step": 1960 }, { "epoch": 0.4, "learning_rate": 0.0002963307569125347, "loss": 0.0144, "step": 1961 }, { "epoch": 0.4, "learning_rate": 0.0002963264942210258, "loss": 0.0642, "step": 1962 }, { "epoch": 0.4, "learning_rate": 0.00029632222908558824, "loss": 0.0115, "step": 1963 }, { "epoch": 0.4, "learning_rate": 0.00029631796150629325, "loss": 0.0183, "step": 1964 }, { "epoch": 0.4, "learning_rate": 0.0002963136914832121, "loss": 0.0129, "step": 1965 }, { "epoch": 0.4, "learning_rate": 0.0002963094190164161, "loss": 0.0319, "step": 1966 }, { "epoch": 0.4, "learning_rate": 0.0002963051441059766, "loss": 0.0322, "step": 1967 }, { "epoch": 0.4, "learning_rate": 0.0002963008667519651, "loss": 0.0314, "step": 1968 }, { "epoch": 0.4, "learning_rate": 0.00029629658695445296, "loss": 0.0132, "step": 1969 }, { "epoch": 0.4, "learning_rate": 0.0002962923047135116, "loss": 0.0539, "step": 1970 }, { "epoch": 0.4, "learning_rate": 0.0002962880200292127, "loss": 0.0128, "step": 1971 }, { "epoch": 0.4, "learning_rate": 0.0002962837329016277, "loss": 0.0524, "step": 1972 }, { "epoch": 0.4, "learning_rate": 0.00029627944333082814, "loss": 0.0186, "step": 1973 }, { "epoch": 0.4, "learning_rate": 0.0002962751513168858, "loss": 0.0187, "step": 1974 }, { "epoch": 0.4, "learning_rate": 0.0002962708568598723, "loss": 0.0233, "step": 1975 }, { "epoch": 0.4, "learning_rate": 0.00029626655995985946, "loss": 0.0263, "step": 1976 }, { "epoch": 0.4, "learning_rate": 0.00029626226061691893, "loss": 0.0232, "step": 1977 }, { "epoch": 0.4, "learning_rate": 0.00029625795883112254, "loss": 0.0198, "step": 1978 }, { "epoch": 0.4, "learning_rate": 0.00029625365460254216, "loss": 0.0393, "step": 1979 }, { "epoch": 0.4, "learning_rate": 0.0002962493479312497, "loss": 0.025, "step": 1980 }, { "epoch": 0.4, "learning_rate": 0.00029624503881731703, "loss": 0.0562, "step": 1981 }, { "epoch": 0.4, "learning_rate": 0.00029624072726081615, "loss": 0.0283, "step": 1982 }, { "epoch": 0.4, "learning_rate": 0.00029623641326181915, "loss": 0.0262, "step": 1983 }, { "epoch": 0.4, "learning_rate": 0.00029623209682039795, "loss": 0.0058, "step": 1984 }, { "epoch": 0.4, "learning_rate": 0.0002962277779366247, "loss": 0.0461, "step": 1985 }, { "epoch": 0.4, "learning_rate": 0.00029622345661057154, "loss": 0.0261, "step": 1986 }, { "epoch": 0.4, "learning_rate": 0.00029621913284231063, "loss": 0.0364, "step": 1987 }, { "epoch": 0.4, "learning_rate": 0.0002962148066319142, "loss": 0.0408, "step": 1988 }, { "epoch": 0.4, "learning_rate": 0.0002962104779794545, "loss": 0.0363, "step": 1989 }, { "epoch": 0.41, "learning_rate": 0.00029620614688500386, "loss": 0.032, "step": 1990 }, { "epoch": 0.41, "learning_rate": 0.0002962018133486345, "loss": 0.0064, "step": 1991 }, { "epoch": 0.41, "learning_rate": 0.00029619747737041896, "loss": 0.0481, "step": 1992 }, { "epoch": 0.41, "learning_rate": 0.0002961931389504296, "loss": 0.0077, "step": 1993 }, { "epoch": 0.41, "learning_rate": 0.0002961887980887388, "loss": 0.1338, "step": 1994 }, { "epoch": 0.41, "learning_rate": 0.00029618445478541913, "loss": 0.0204, "step": 1995 }, { "epoch": 0.41, "learning_rate": 0.00029618010904054314, "loss": 0.0156, "step": 1996 }, { "epoch": 0.41, "learning_rate": 0.00029617576085418334, "loss": 0.0374, "step": 1997 }, { "epoch": 0.41, "learning_rate": 0.00029617141022641243, "loss": 0.0081, "step": 1998 }, { "epoch": 0.41, "learning_rate": 0.0002961670571573031, "loss": 0.0108, "step": 1999 }, { "epoch": 0.41, "learning_rate": 0.000296162701646928, "loss": 0.0218, "step": 2000 }, { "epoch": 0.41, "learning_rate": 0.0002961583436953598, "loss": 0.056, "step": 2001 }, { "epoch": 0.41, "learning_rate": 0.00029615398330267145, "loss": 0.0077, "step": 2002 }, { "epoch": 0.41, "learning_rate": 0.00029614962046893567, "loss": 0.0385, "step": 2003 }, { "epoch": 0.41, "learning_rate": 0.00029614525519422533, "loss": 0.0229, "step": 2004 }, { "epoch": 0.41, "learning_rate": 0.0002961408874786134, "loss": 0.013, "step": 2005 }, { "epoch": 0.41, "learning_rate": 0.0002961365173221728, "loss": 0.0191, "step": 2006 }, { "epoch": 0.41, "learning_rate": 0.00029613214472497647, "loss": 0.009, "step": 2007 }, { "epoch": 0.41, "learning_rate": 0.00029612776968709746, "loss": 0.0353, "step": 2008 }, { "epoch": 0.41, "learning_rate": 0.0002961233922086089, "loss": 0.0309, "step": 2009 }, { "epoch": 0.41, "learning_rate": 0.0002961190122895838, "loss": 0.0646, "step": 2010 }, { "epoch": 0.41, "learning_rate": 0.00029611462993009544, "loss": 0.0102, "step": 2011 }, { "epoch": 0.41, "learning_rate": 0.00029611024513021694, "loss": 0.0384, "step": 2012 }, { "epoch": 0.41, "learning_rate": 0.0002961058578900215, "loss": 0.0076, "step": 2013 }, { "epoch": 0.41, "learning_rate": 0.0002961014682095825, "loss": 0.0426, "step": 2014 }, { "epoch": 0.41, "learning_rate": 0.00029609707608897317, "loss": 0.0327, "step": 2015 }, { "epoch": 0.41, "learning_rate": 0.0002960926815282669, "loss": 0.0143, "step": 2016 }, { "epoch": 0.41, "learning_rate": 0.00029608828452753707, "loss": 0.026, "step": 2017 }, { "epoch": 0.41, "learning_rate": 0.00029608388508685715, "loss": 0.0372, "step": 2018 }, { "epoch": 0.41, "learning_rate": 0.0002960794832063006, "loss": 0.031, "step": 2019 }, { "epoch": 0.41, "learning_rate": 0.0002960750788859409, "loss": 0.0053, "step": 2020 }, { "epoch": 0.41, "learning_rate": 0.00029607067212585167, "loss": 0.0448, "step": 2021 }, { "epoch": 0.41, "learning_rate": 0.00029606626292610645, "loss": 0.0486, "step": 2022 }, { "epoch": 0.41, "learning_rate": 0.00029606185128677894, "loss": 0.0343, "step": 2023 }, { "epoch": 0.41, "learning_rate": 0.00029605743720794277, "loss": 0.011, "step": 2024 }, { "epoch": 0.41, "learning_rate": 0.0002960530206896717, "loss": 0.0199, "step": 2025 }, { "epoch": 0.41, "learning_rate": 0.0002960486017320396, "loss": 0.0198, "step": 2026 }, { "epoch": 0.41, "learning_rate": 0.0002960441803351201, "loss": 0.0834, "step": 2027 }, { "epoch": 0.41, "learning_rate": 0.00029603975649898705, "loss": 0.0273, "step": 2028 }, { "epoch": 0.41, "learning_rate": 0.00029603533022371447, "loss": 0.0396, "step": 2029 }, { "epoch": 0.41, "learning_rate": 0.0002960309015093762, "loss": 0.0111, "step": 2030 }, { "epoch": 0.41, "learning_rate": 0.0002960264703560462, "loss": 0.0183, "step": 2031 }, { "epoch": 0.41, "learning_rate": 0.0002960220367637985, "loss": 0.0265, "step": 2032 }, { "epoch": 0.41, "learning_rate": 0.00029601760073270716, "loss": 0.0129, "step": 2033 }, { "epoch": 0.41, "learning_rate": 0.00029601316226284625, "loss": 0.0213, "step": 2034 }, { "epoch": 0.41, "learning_rate": 0.0002960087213542899, "loss": 0.0334, "step": 2035 }, { "epoch": 0.41, "learning_rate": 0.00029600427800711233, "loss": 0.0094, "step": 2036 }, { "epoch": 0.41, "learning_rate": 0.0002959998322213877, "loss": 0.0358, "step": 2037 }, { "epoch": 0.41, "learning_rate": 0.0002959953839971903, "loss": 0.0224, "step": 2038 }, { "epoch": 0.42, "learning_rate": 0.00029599093333459433, "loss": 0.0278, "step": 2039 }, { "epoch": 0.42, "learning_rate": 0.00029598648023367426, "loss": 0.0242, "step": 2040 }, { "epoch": 0.42, "learning_rate": 0.0002959820246945044, "loss": 0.0061, "step": 2041 }, { "epoch": 0.42, "learning_rate": 0.00029597756671715915, "loss": 0.0342, "step": 2042 }, { "epoch": 0.42, "learning_rate": 0.000295973106301713, "loss": 0.0067, "step": 2043 }, { "epoch": 0.42, "learning_rate": 0.0002959686434482404, "loss": 0.0182, "step": 2044 }, { "epoch": 0.42, "learning_rate": 0.0002959641781568159, "loss": 0.0059, "step": 2045 }, { "epoch": 0.42, "learning_rate": 0.00029595971042751417, "loss": 0.008, "step": 2046 }, { "epoch": 0.42, "learning_rate": 0.0002959552402604097, "loss": 0.0673, "step": 2047 }, { "epoch": 0.42, "learning_rate": 0.00029595076765557725, "loss": 0.0164, "step": 2048 }, { "epoch": 0.42, "learning_rate": 0.0002959462926130915, "loss": 0.0137, "step": 2049 }, { "epoch": 0.42, "learning_rate": 0.0002959418151330271, "loss": 0.0294, "step": 2050 }, { "epoch": 0.42, "learning_rate": 0.0002959373352154589, "loss": 0.0353, "step": 2051 }, { "epoch": 0.42, "learning_rate": 0.0002959328528604618, "loss": 0.0533, "step": 2052 }, { "epoch": 0.42, "learning_rate": 0.0002959283680681105, "loss": 0.0131, "step": 2053 }, { "epoch": 0.42, "learning_rate": 0.00029592388083848003, "loss": 0.0251, "step": 2054 }, { "epoch": 0.42, "learning_rate": 0.00029591939117164527, "loss": 0.0204, "step": 2055 }, { "epoch": 0.42, "learning_rate": 0.00029591489906768135, "loss": 0.012, "step": 2056 }, { "epoch": 0.42, "learning_rate": 0.00029591040452666307, "loss": 0.0285, "step": 2057 }, { "epoch": 0.42, "learning_rate": 0.0002959059075486656, "loss": 0.054, "step": 2058 }, { "epoch": 0.42, "learning_rate": 0.00029590140813376414, "loss": 0.012, "step": 2059 }, { "epoch": 0.42, "learning_rate": 0.0002958969062820337, "loss": 0.0338, "step": 2060 }, { "epoch": 0.42, "learning_rate": 0.0002958924019935496, "loss": 0.0247, "step": 2061 }, { "epoch": 0.42, "learning_rate": 0.0002958878952683869, "loss": 0.0181, "step": 2062 }, { "epoch": 0.42, "learning_rate": 0.000295883386106621, "loss": 0.045, "step": 2063 }, { "epoch": 0.42, "learning_rate": 0.00029587887450832715, "loss": 0.0402, "step": 2064 }, { "epoch": 0.42, "learning_rate": 0.0002958743604735808, "loss": 0.0264, "step": 2065 }, { "epoch": 0.42, "learning_rate": 0.0002958698440024572, "loss": 0.0587, "step": 2066 }, { "epoch": 0.42, "learning_rate": 0.00029586532509503187, "loss": 0.0285, "step": 2067 }, { "epoch": 0.42, "learning_rate": 0.00029586080375138034, "loss": 0.0046, "step": 2068 }, { "epoch": 0.42, "learning_rate": 0.000295856279971578, "loss": 0.0537, "step": 2069 }, { "epoch": 0.42, "learning_rate": 0.00029585175375570046, "loss": 0.0641, "step": 2070 }, { "epoch": 0.42, "learning_rate": 0.00029584722510382335, "loss": 0.0205, "step": 2071 }, { "epoch": 0.42, "learning_rate": 0.0002958426940160222, "loss": 0.0229, "step": 2072 }, { "epoch": 0.42, "learning_rate": 0.0002958381604923728, "loss": 0.0373, "step": 2073 }, { "epoch": 0.42, "learning_rate": 0.00029583362453295087, "loss": 0.0315, "step": 2074 }, { "epoch": 0.42, "learning_rate": 0.0002958290861378321, "loss": 0.041, "step": 2075 }, { "epoch": 0.42, "learning_rate": 0.0002958245453070923, "loss": 0.0212, "step": 2076 }, { "epoch": 0.42, "learning_rate": 0.0002958200020408074, "loss": 0.0107, "step": 2077 }, { "epoch": 0.42, "learning_rate": 0.00029581545633905313, "loss": 0.0169, "step": 2078 }, { "epoch": 0.42, "learning_rate": 0.00029581090820190553, "loss": 0.0215, "step": 2079 }, { "epoch": 0.42, "learning_rate": 0.0002958063576294405, "loss": 0.0149, "step": 2080 }, { "epoch": 0.42, "learning_rate": 0.0002958018046217341, "loss": 0.0061, "step": 2081 }, { "epoch": 0.42, "learning_rate": 0.00029579724917886237, "loss": 0.0156, "step": 2082 }, { "epoch": 0.42, "learning_rate": 0.0002957926913009013, "loss": 0.0307, "step": 2083 }, { "epoch": 0.42, "learning_rate": 0.0002957881309879271, "loss": 0.0262, "step": 2084 }, { "epoch": 0.42, "learning_rate": 0.00029578356824001595, "loss": 0.0158, "step": 2085 }, { "epoch": 0.42, "learning_rate": 0.000295779003057244, "loss": 0.0169, "step": 2086 }, { "epoch": 0.42, "learning_rate": 0.0002957744354396875, "loss": 0.0177, "step": 2087 }, { "epoch": 0.43, "learning_rate": 0.00029576986538742283, "loss": 0.028, "step": 2088 }, { "epoch": 0.43, "learning_rate": 0.0002957652929005262, "loss": 0.0109, "step": 2089 }, { "epoch": 0.43, "learning_rate": 0.000295760717979074, "loss": 0.0497, "step": 2090 }, { "epoch": 0.43, "learning_rate": 0.0002957561406231427, "loss": 0.0268, "step": 2091 }, { "epoch": 0.43, "learning_rate": 0.0002957515608328087, "loss": 0.0221, "step": 2092 }, { "epoch": 0.43, "learning_rate": 0.0002957469786081485, "loss": 0.0476, "step": 2093 }, { "epoch": 0.43, "learning_rate": 0.00029574239394923867, "loss": 0.0189, "step": 2094 }, { "epoch": 0.43, "learning_rate": 0.0002957378068561558, "loss": 0.0084, "step": 2095 }, { "epoch": 0.43, "learning_rate": 0.00029573321732897633, "loss": 0.0103, "step": 2096 }, { "epoch": 0.43, "learning_rate": 0.00029572862536777713, "loss": 0.034, "step": 2097 }, { "epoch": 0.43, "learning_rate": 0.0002957240309726348, "loss": 0.0299, "step": 2098 }, { "epoch": 0.43, "learning_rate": 0.0002957194341436261, "loss": 0.0063, "step": 2099 }, { "epoch": 0.43, "learning_rate": 0.0002957148348808277, "loss": 0.0449, "step": 2100 }, { "epoch": 0.43, "learning_rate": 0.00029571023318431655, "loss": 0.0356, "step": 2101 }, { "epoch": 0.43, "learning_rate": 0.0002957056290541695, "loss": 0.045, "step": 2102 }, { "epoch": 0.43, "learning_rate": 0.00029570102249046337, "loss": 0.0121, "step": 2103 }, { "epoch": 0.43, "learning_rate": 0.0002956964134932751, "loss": 0.0348, "step": 2104 }, { "epoch": 0.43, "learning_rate": 0.00029569180206268173, "loss": 0.0193, "step": 2105 }, { "epoch": 0.43, "learning_rate": 0.0002956871881987603, "loss": 0.0158, "step": 2106 }, { "epoch": 0.43, "learning_rate": 0.00029568257190158774, "loss": 0.0337, "step": 2107 }, { "epoch": 0.43, "learning_rate": 0.00029567795317124126, "loss": 0.014, "step": 2108 }, { "epoch": 0.43, "learning_rate": 0.000295673332007798, "loss": 0.0161, "step": 2109 }, { "epoch": 0.43, "learning_rate": 0.0002956687084113351, "loss": 0.0175, "step": 2110 }, { "epoch": 0.43, "learning_rate": 0.0002956640823819298, "loss": 0.0177, "step": 2111 }, { "epoch": 0.43, "learning_rate": 0.0002956594539196594, "loss": 0.0429, "step": 2112 }, { "epoch": 0.43, "learning_rate": 0.00029565482302460107, "loss": 0.0177, "step": 2113 }, { "epoch": 0.43, "learning_rate": 0.00029565018969683236, "loss": 0.0075, "step": 2114 }, { "epoch": 0.43, "learning_rate": 0.0002956455539364305, "loss": 0.0345, "step": 2115 }, { "epoch": 0.43, "learning_rate": 0.000295640915743473, "loss": 0.0225, "step": 2116 }, { "epoch": 0.43, "learning_rate": 0.00029563627511803724, "loss": 0.0254, "step": 2117 }, { "epoch": 0.43, "learning_rate": 0.00029563163206020076, "loss": 0.0188, "step": 2118 }, { "epoch": 0.43, "learning_rate": 0.0002956269865700412, "loss": 0.0308, "step": 2119 }, { "epoch": 0.43, "learning_rate": 0.000295622338647636, "loss": 0.0167, "step": 2120 }, { "epoch": 0.43, "learning_rate": 0.0002956176882930629, "loss": 0.0374, "step": 2121 }, { "epoch": 0.43, "learning_rate": 0.00029561303550639954, "loss": 0.0248, "step": 2122 }, { "epoch": 0.43, "learning_rate": 0.0002956083802877236, "loss": 0.0087, "step": 2123 }, { "epoch": 0.43, "learning_rate": 0.0002956037226371129, "loss": 0.029, "step": 2124 }, { "epoch": 0.43, "learning_rate": 0.0002955990625546451, "loss": 0.0186, "step": 2125 }, { "epoch": 0.43, "learning_rate": 0.0002955944000403982, "loss": 0.0154, "step": 2126 }, { "epoch": 0.43, "learning_rate": 0.00029558973509445, "loss": 0.0346, "step": 2127 }, { "epoch": 0.43, "learning_rate": 0.00029558506771687834, "loss": 0.0339, "step": 2128 }, { "epoch": 0.43, "learning_rate": 0.00029558039790776125, "loss": 0.024, "step": 2129 }, { "epoch": 0.43, "learning_rate": 0.00029557572566717675, "loss": 0.0171, "step": 2130 }, { "epoch": 0.43, "learning_rate": 0.0002955710509952028, "loss": 0.0292, "step": 2131 }, { "epoch": 0.43, "learning_rate": 0.00029556637389191757, "loss": 0.029, "step": 2132 }, { "epoch": 0.43, "learning_rate": 0.00029556169435739906, "loss": 0.0461, "step": 2133 }, { "epoch": 0.43, "learning_rate": 0.0002955570123917255, "loss": 0.0444, "step": 2134 }, { "epoch": 0.43, "learning_rate": 0.00029555232799497507, "loss": 0.034, "step": 2135 }, { "epoch": 0.43, "learning_rate": 0.00029554764116722604, "loss": 0.0108, "step": 2136 }, { "epoch": 0.44, "learning_rate": 0.0002955429519085567, "loss": 0.0411, "step": 2137 }, { "epoch": 0.44, "learning_rate": 0.00029553826021904523, "loss": 0.0079, "step": 2138 }, { "epoch": 0.44, "learning_rate": 0.00029553356609877013, "loss": 0.0169, "step": 2139 }, { "epoch": 0.44, "learning_rate": 0.00029552886954780977, "loss": 0.0192, "step": 2140 }, { "epoch": 0.44, "learning_rate": 0.0002955241705662426, "loss": 0.0573, "step": 2141 }, { "epoch": 0.44, "learning_rate": 0.00029551946915414706, "loss": 0.0305, "step": 2142 }, { "epoch": 0.44, "learning_rate": 0.0002955147653116017, "loss": 0.015, "step": 2143 }, { "epoch": 0.44, "learning_rate": 0.0002955100590386851, "loss": 0.0111, "step": 2144 }, { "epoch": 0.44, "learning_rate": 0.0002955053503354758, "loss": 0.0206, "step": 2145 }, { "epoch": 0.44, "learning_rate": 0.00029550063920205253, "loss": 0.0165, "step": 2146 }, { "epoch": 0.44, "learning_rate": 0.00029549592563849397, "loss": 0.0134, "step": 2147 }, { "epoch": 0.44, "learning_rate": 0.00029549120964487876, "loss": 0.0148, "step": 2148 }, { "epoch": 0.44, "learning_rate": 0.0002954864912212857, "loss": 0.0392, "step": 2149 }, { "epoch": 0.44, "learning_rate": 0.00029548177036779364, "loss": 0.0329, "step": 2150 }, { "epoch": 0.44, "learning_rate": 0.0002954770470844814, "loss": 0.0764, "step": 2151 }, { "epoch": 0.44, "learning_rate": 0.0002954723213714278, "loss": 0.0562, "step": 2152 }, { "epoch": 0.44, "learning_rate": 0.0002954675932287119, "loss": 0.0683, "step": 2153 }, { "epoch": 0.44, "learning_rate": 0.0002954628626564126, "loss": 0.0339, "step": 2154 }, { "epoch": 0.44, "learning_rate": 0.0002954581296546089, "loss": 0.0406, "step": 2155 }, { "epoch": 0.44, "learning_rate": 0.00029545339422337984, "loss": 0.0319, "step": 2156 }, { "epoch": 0.44, "learning_rate": 0.00029544865636280457, "loss": 0.0158, "step": 2157 }, { "epoch": 0.44, "learning_rate": 0.00029544391607296217, "loss": 0.0125, "step": 2158 }, { "epoch": 0.44, "learning_rate": 0.0002954391733539319, "loss": 0.0257, "step": 2159 }, { "epoch": 0.44, "learning_rate": 0.0002954344282057928, "loss": 0.0452, "step": 2160 }, { "epoch": 0.44, "learning_rate": 0.00029542968062862426, "loss": 0.0417, "step": 2161 }, { "epoch": 0.44, "learning_rate": 0.0002954249306225055, "loss": 0.0129, "step": 2162 }, { "epoch": 0.44, "learning_rate": 0.00029542017818751597, "loss": 0.028, "step": 2163 }, { "epoch": 0.44, "learning_rate": 0.0002954154233237349, "loss": 0.0151, "step": 2164 }, { "epoch": 0.44, "learning_rate": 0.0002954106660312418, "loss": 0.0503, "step": 2165 }, { "epoch": 0.44, "learning_rate": 0.00029540590631011603, "loss": 0.0217, "step": 2166 }, { "epoch": 0.44, "learning_rate": 0.0002954011441604372, "loss": 0.014, "step": 2167 }, { "epoch": 0.44, "learning_rate": 0.0002953963795822848, "loss": 0.0367, "step": 2168 }, { "epoch": 0.44, "learning_rate": 0.00029539161257573844, "loss": 0.0109, "step": 2169 }, { "epoch": 0.44, "learning_rate": 0.0002953868431408776, "loss": 0.0456, "step": 2170 }, { "epoch": 0.44, "learning_rate": 0.0002953820712777822, "loss": 0.0408, "step": 2171 }, { "epoch": 0.44, "learning_rate": 0.00029537729698653165, "loss": 0.0395, "step": 2172 }, { "epoch": 0.44, "learning_rate": 0.00029537252026720585, "loss": 0.0528, "step": 2173 }, { "epoch": 0.44, "learning_rate": 0.0002953677411198846, "loss": 0.0444, "step": 2174 }, { "epoch": 0.44, "learning_rate": 0.0002953629595446476, "loss": 0.0261, "step": 2175 }, { "epoch": 0.44, "learning_rate": 0.00029535817554157483, "loss": 0.0278, "step": 2176 }, { "epoch": 0.44, "learning_rate": 0.0002953533891107461, "loss": 0.0175, "step": 2177 }, { "epoch": 0.44, "learning_rate": 0.00029534860025224143, "loss": 0.008, "step": 2178 }, { "epoch": 0.44, "learning_rate": 0.0002953438089661408, "loss": 0.017, "step": 2179 }, { "epoch": 0.44, "learning_rate": 0.0002953390152525242, "loss": 0.043, "step": 2180 }, { "epoch": 0.44, "learning_rate": 0.00029533421911147166, "loss": 0.0057, "step": 2181 }, { "epoch": 0.44, "learning_rate": 0.00029532942054306336, "loss": 0.0191, "step": 2182 }, { "epoch": 0.44, "learning_rate": 0.0002953246195473794, "loss": 0.0177, "step": 2183 }, { "epoch": 0.44, "learning_rate": 0.00029531981612449995, "loss": 0.0122, "step": 2184 }, { "epoch": 0.44, "learning_rate": 0.00029531501027450525, "loss": 0.0368, "step": 2185 }, { "epoch": 0.45, "learning_rate": 0.0002953102019974756, "loss": 0.0185, "step": 2186 }, { "epoch": 0.45, "learning_rate": 0.0002953053912934913, "loss": 0.0243, "step": 2187 }, { "epoch": 0.45, "learning_rate": 0.00029530057816263265, "loss": 0.0276, "step": 2188 }, { "epoch": 0.45, "learning_rate": 0.0002952957626049801, "loss": 0.0237, "step": 2189 }, { "epoch": 0.45, "learning_rate": 0.000295290944620614, "loss": 0.0162, "step": 2190 }, { "epoch": 0.45, "learning_rate": 0.00029528612420961494, "loss": 0.0319, "step": 2191 }, { "epoch": 0.45, "learning_rate": 0.0002952813013720633, "loss": 0.0214, "step": 2192 }, { "epoch": 0.45, "learning_rate": 0.00029527647610803974, "loss": 0.0138, "step": 2193 }, { "epoch": 0.45, "learning_rate": 0.00029527164841762477, "loss": 0.0332, "step": 2194 }, { "epoch": 0.45, "learning_rate": 0.000295266818300899, "loss": 0.0187, "step": 2195 }, { "epoch": 0.45, "learning_rate": 0.00029526198575794327, "loss": 0.0845, "step": 2196 }, { "epoch": 0.45, "learning_rate": 0.0002952571507888381, "loss": 0.0432, "step": 2197 }, { "epoch": 0.45, "learning_rate": 0.00029525231339366434, "loss": 0.0449, "step": 2198 }, { "epoch": 0.45, "learning_rate": 0.0002952474735725028, "loss": 0.035, "step": 2199 }, { "epoch": 0.45, "learning_rate": 0.0002952426313254342, "loss": 0.0548, "step": 2200 }, { "epoch": 0.45, "learning_rate": 0.0002952377866525395, "loss": 0.0222, "step": 2201 }, { "epoch": 0.45, "learning_rate": 0.00029523293955389967, "loss": 0.013, "step": 2202 }, { "epoch": 0.45, "learning_rate": 0.0002952280900295955, "loss": 0.0213, "step": 2203 }, { "epoch": 0.45, "learning_rate": 0.0002952232380797082, "loss": 0.0198, "step": 2204 }, { "epoch": 0.45, "learning_rate": 0.0002952183837043187, "loss": 0.0497, "step": 2205 }, { "epoch": 0.45, "learning_rate": 0.000295213526903508, "loss": 0.0228, "step": 2206 }, { "epoch": 0.45, "learning_rate": 0.0002952086676773573, "loss": 0.0453, "step": 2207 }, { "epoch": 0.45, "learning_rate": 0.00029520380602594777, "loss": 0.0263, "step": 2208 }, { "epoch": 0.45, "learning_rate": 0.00029519894194936057, "loss": 0.023, "step": 2209 }, { "epoch": 0.45, "learning_rate": 0.00029519407544767695, "loss": 0.0454, "step": 2210 }, { "epoch": 0.45, "learning_rate": 0.0002951892065209782, "loss": 0.0354, "step": 2211 }, { "epoch": 0.45, "learning_rate": 0.00029518433516934566, "loss": 0.0296, "step": 2212 }, { "epoch": 0.45, "learning_rate": 0.00029517946139286067, "loss": 0.0101, "step": 2213 }, { "epoch": 0.45, "learning_rate": 0.00029517458519160464, "loss": 0.0036, "step": 2214 }, { "epoch": 0.45, "learning_rate": 0.000295169706565659, "loss": 0.0208, "step": 2215 }, { "epoch": 0.45, "learning_rate": 0.0002951648255151052, "loss": 0.021, "step": 2216 }, { "epoch": 0.45, "learning_rate": 0.00029515994204002484, "loss": 0.029, "step": 2217 }, { "epoch": 0.45, "learning_rate": 0.0002951550561404994, "loss": 0.017, "step": 2218 }, { "epoch": 0.45, "learning_rate": 0.00029515016781661053, "loss": 0.0594, "step": 2219 }, { "epoch": 0.45, "learning_rate": 0.0002951452770684398, "loss": 0.0469, "step": 2220 }, { "epoch": 0.45, "learning_rate": 0.00029514038389606906, "loss": 0.0293, "step": 2221 }, { "epoch": 0.45, "learning_rate": 0.0002951354882995799, "loss": 0.0216, "step": 2222 }, { "epoch": 0.45, "learning_rate": 0.00029513059027905415, "loss": 0.0337, "step": 2223 }, { "epoch": 0.45, "learning_rate": 0.00029512568983457356, "loss": 0.0193, "step": 2224 }, { "epoch": 0.45, "learning_rate": 0.00029512078696622006, "loss": 0.0233, "step": 2225 }, { "epoch": 0.45, "learning_rate": 0.0002951158816740754, "loss": 0.0731, "step": 2226 }, { "epoch": 0.45, "learning_rate": 0.0002951109739582216, "loss": 0.0086, "step": 2227 }, { "epoch": 0.45, "learning_rate": 0.00029510606381874066, "loss": 0.0186, "step": 2228 }, { "epoch": 0.45, "learning_rate": 0.00029510115125571453, "loss": 0.0266, "step": 2229 }, { "epoch": 0.45, "learning_rate": 0.00029509623626922533, "loss": 0.0404, "step": 2230 }, { "epoch": 0.45, "learning_rate": 0.00029509131885935503, "loss": 0.0094, "step": 2231 }, { "epoch": 0.45, "learning_rate": 0.0002950863990261858, "loss": 0.0142, "step": 2232 }, { "epoch": 0.45, "learning_rate": 0.0002950814767697999, "loss": 0.0551, "step": 2233 }, { "epoch": 0.45, "learning_rate": 0.00029507655209027944, "loss": 0.0184, "step": 2234 }, { "epoch": 0.46, "learning_rate": 0.00029507162498770676, "loss": 0.0174, "step": 2235 }, { "epoch": 0.46, "learning_rate": 0.00029506669546216406, "loss": 0.0276, "step": 2236 }, { "epoch": 0.46, "learning_rate": 0.0002950617635137337, "loss": 0.0064, "step": 2237 }, { "epoch": 0.46, "learning_rate": 0.00029505682914249807, "loss": 0.0297, "step": 2238 }, { "epoch": 0.46, "learning_rate": 0.0002950518923485396, "loss": 0.0126, "step": 2239 }, { "epoch": 0.46, "learning_rate": 0.00029504695313194076, "loss": 0.0099, "step": 2240 }, { "epoch": 0.46, "learning_rate": 0.0002950420114927839, "loss": 0.0146, "step": 2241 }, { "epoch": 0.46, "learning_rate": 0.00029503706743115175, "loss": 0.0223, "step": 2242 }, { "epoch": 0.46, "learning_rate": 0.0002950321209471268, "loss": 0.0687, "step": 2243 }, { "epoch": 0.46, "learning_rate": 0.00029502717204079156, "loss": 0.0069, "step": 2244 }, { "epoch": 0.46, "learning_rate": 0.0002950222207122289, "loss": 0.0134, "step": 2245 }, { "epoch": 0.46, "learning_rate": 0.00029501726696152137, "loss": 0.033, "step": 2246 }, { "epoch": 0.46, "learning_rate": 0.00029501231078875176, "loss": 0.0228, "step": 2247 }, { "epoch": 0.46, "learning_rate": 0.0002950073521940028, "loss": 0.0152, "step": 2248 }, { "epoch": 0.46, "learning_rate": 0.00029500239117735737, "loss": 0.0266, "step": 2249 }, { "epoch": 0.46, "learning_rate": 0.00029499742773889825, "loss": 0.0236, "step": 2250 }, { "epoch": 0.46, "learning_rate": 0.0002949924618787084, "loss": 0.01, "step": 2251 }, { "epoch": 0.46, "learning_rate": 0.00029498749359687076, "loss": 0.0084, "step": 2252 }, { "epoch": 0.46, "learning_rate": 0.0002949825228934683, "loss": 0.0487, "step": 2253 }, { "epoch": 0.46, "learning_rate": 0.000294977549768584, "loss": 0.0169, "step": 2254 }, { "epoch": 0.46, "learning_rate": 0.000294972574222301, "loss": 0.0206, "step": 2255 }, { "epoch": 0.46, "learning_rate": 0.00029496759625470233, "loss": 0.0409, "step": 2256 }, { "epoch": 0.46, "learning_rate": 0.0002949626158658711, "loss": 0.0093, "step": 2257 }, { "epoch": 0.46, "learning_rate": 0.00029495763305589063, "loss": 0.0397, "step": 2258 }, { "epoch": 0.46, "learning_rate": 0.000294952647824844, "loss": 0.0335, "step": 2259 }, { "epoch": 0.46, "learning_rate": 0.0002949476601728146, "loss": 0.0048, "step": 2260 }, { "epoch": 0.46, "learning_rate": 0.00029494267009988565, "loss": 0.0841, "step": 2261 }, { "epoch": 0.46, "learning_rate": 0.0002949376776061405, "loss": 0.0212, "step": 2262 }, { "epoch": 0.46, "learning_rate": 0.00029493268269166256, "loss": 0.0248, "step": 2263 }, { "epoch": 0.46, "learning_rate": 0.0002949276853565352, "loss": 0.049, "step": 2264 }, { "epoch": 0.46, "learning_rate": 0.0002949226856008419, "loss": 0.0337, "step": 2265 }, { "epoch": 0.46, "learning_rate": 0.00029491768342466626, "loss": 0.0515, "step": 2266 }, { "epoch": 0.46, "learning_rate": 0.00029491267882809176, "loss": 0.013, "step": 2267 }, { "epoch": 0.46, "learning_rate": 0.0002949076718112019, "loss": 0.0187, "step": 2268 }, { "epoch": 0.46, "learning_rate": 0.0002949026623740805, "loss": 0.0206, "step": 2269 }, { "epoch": 0.46, "learning_rate": 0.000294897650516811, "loss": 0.0168, "step": 2270 }, { "epoch": 0.46, "learning_rate": 0.00029489263623947733, "loss": 0.0146, "step": 2271 }, { "epoch": 0.46, "learning_rate": 0.00029488761954216304, "loss": 0.0238, "step": 2272 }, { "epoch": 0.46, "learning_rate": 0.00029488260042495205, "loss": 0.021, "step": 2273 }, { "epoch": 0.46, "learning_rate": 0.0002948775788879282, "loss": 0.0136, "step": 2274 }, { "epoch": 0.46, "learning_rate": 0.00029487255493117524, "loss": 0.0307, "step": 2275 }, { "epoch": 0.46, "learning_rate": 0.00029486752855477713, "loss": 0.0239, "step": 2276 }, { "epoch": 0.46, "learning_rate": 0.0002948624997588179, "loss": 0.0076, "step": 2277 }, { "epoch": 0.46, "learning_rate": 0.00029485746854338143, "loss": 0.0333, "step": 2278 }, { "epoch": 0.46, "learning_rate": 0.0002948524349085518, "loss": 0.0234, "step": 2279 }, { "epoch": 0.46, "learning_rate": 0.0002948473988544131, "loss": 0.0624, "step": 2280 }, { "epoch": 0.46, "learning_rate": 0.00029484236038104935, "loss": 0.028, "step": 2281 }, { "epoch": 0.46, "learning_rate": 0.0002948373194885449, "loss": 0.0108, "step": 2282 }, { "epoch": 0.46, "learning_rate": 0.0002948322761769837, "loss": 0.0279, "step": 2283 }, { "epoch": 0.47, "learning_rate": 0.00029482723044645017, "loss": 0.0147, "step": 2284 }, { "epoch": 0.47, "learning_rate": 0.00029482218229702847, "loss": 0.0271, "step": 2285 }, { "epoch": 0.47, "learning_rate": 0.00029481713172880295, "loss": 0.0327, "step": 2286 }, { "epoch": 0.47, "learning_rate": 0.000294812078741858, "loss": 0.0561, "step": 2287 }, { "epoch": 0.47, "learning_rate": 0.00029480702333627796, "loss": 0.0366, "step": 2288 }, { "epoch": 0.47, "learning_rate": 0.0002948019655121473, "loss": 0.0159, "step": 2289 }, { "epoch": 0.47, "learning_rate": 0.00029479690526955046, "loss": 0.0222, "step": 2290 }, { "epoch": 0.47, "learning_rate": 0.00029479184260857203, "loss": 0.0183, "step": 2291 }, { "epoch": 0.47, "learning_rate": 0.0002947867775292965, "loss": 0.0206, "step": 2292 }, { "epoch": 0.47, "learning_rate": 0.00029478171003180845, "loss": 0.0402, "step": 2293 }, { "epoch": 0.47, "learning_rate": 0.00029477664011619254, "loss": 0.0371, "step": 2294 }, { "epoch": 0.47, "learning_rate": 0.0002947715677825335, "loss": 0.0167, "step": 2295 }, { "epoch": 0.47, "learning_rate": 0.00029476649303091597, "loss": 0.0295, "step": 2296 }, { "epoch": 0.47, "learning_rate": 0.0002947614158614247, "loss": 0.0186, "step": 2297 }, { "epoch": 0.47, "learning_rate": 0.00029475633627414457, "loss": 0.0143, "step": 2298 }, { "epoch": 0.47, "learning_rate": 0.0002947512542691604, "loss": 0.014, "step": 2299 }, { "epoch": 0.47, "learning_rate": 0.00029474616984655704, "loss": 0.019, "step": 2300 }, { "epoch": 0.47, "learning_rate": 0.00029474108300641945, "loss": 0.0103, "step": 2301 }, { "epoch": 0.47, "learning_rate": 0.0002947359937488325, "loss": 0.0524, "step": 2302 }, { "epoch": 0.47, "learning_rate": 0.0002947309020738812, "loss": 0.0183, "step": 2303 }, { "epoch": 0.47, "learning_rate": 0.0002947258079816507, "loss": 0.0267, "step": 2304 }, { "epoch": 0.47, "learning_rate": 0.000294720711472226, "loss": 0.0326, "step": 2305 }, { "epoch": 0.47, "learning_rate": 0.0002947156125456923, "loss": 0.0334, "step": 2306 }, { "epoch": 0.47, "learning_rate": 0.00029471051120213466, "loss": 0.0246, "step": 2307 }, { "epoch": 0.47, "learning_rate": 0.0002947054074416383, "loss": 0.012, "step": 2308 }, { "epoch": 0.47, "learning_rate": 0.0002947003012642885, "loss": 0.0276, "step": 2309 }, { "epoch": 0.47, "learning_rate": 0.0002946951926701705, "loss": 0.0266, "step": 2310 }, { "epoch": 0.47, "learning_rate": 0.0002946900816593697, "loss": 0.0318, "step": 2311 }, { "epoch": 0.47, "learning_rate": 0.0002946849682319714, "loss": 0.0183, "step": 2312 }, { "epoch": 0.47, "learning_rate": 0.000294679852388061, "loss": 0.0116, "step": 2313 }, { "epoch": 0.47, "learning_rate": 0.000294674734127724, "loss": 0.0108, "step": 2314 }, { "epoch": 0.47, "learning_rate": 0.0002946696134510458, "loss": 0.021, "step": 2315 }, { "epoch": 0.47, "learning_rate": 0.00029466449035811195, "loss": 0.0152, "step": 2316 }, { "epoch": 0.47, "learning_rate": 0.0002946593648490081, "loss": 0.0464, "step": 2317 }, { "epoch": 0.47, "learning_rate": 0.00029465423692381974, "loss": 0.0185, "step": 2318 }, { "epoch": 0.47, "learning_rate": 0.0002946491065826326, "loss": 0.0359, "step": 2319 }, { "epoch": 0.47, "learning_rate": 0.00029464397382553234, "loss": 0.0137, "step": 2320 }, { "epoch": 0.47, "learning_rate": 0.0002946388386526047, "loss": 0.0229, "step": 2321 }, { "epoch": 0.47, "learning_rate": 0.0002946337010639354, "loss": 0.0162, "step": 2322 }, { "epoch": 0.47, "learning_rate": 0.0002946285610596103, "loss": 0.0064, "step": 2323 }, { "epoch": 0.47, "learning_rate": 0.0002946234186397152, "loss": 0.0144, "step": 2324 }, { "epoch": 0.47, "learning_rate": 0.00029461827380433605, "loss": 0.0366, "step": 2325 }, { "epoch": 0.47, "learning_rate": 0.0002946131265535587, "loss": 0.0126, "step": 2326 }, { "epoch": 0.47, "learning_rate": 0.00029460797688746914, "loss": 0.0261, "step": 2327 }, { "epoch": 0.47, "learning_rate": 0.0002946028248061535, "loss": 0.0506, "step": 2328 }, { "epoch": 0.47, "learning_rate": 0.0002945976703096976, "loss": 0.0401, "step": 2329 }, { "epoch": 0.47, "learning_rate": 0.0002945925133981877, "loss": 0.0052, "step": 2330 }, { "epoch": 0.47, "learning_rate": 0.00029458735407170996, "loss": 0.0189, "step": 2331 }, { "epoch": 0.47, "learning_rate": 0.0002945821923303504, "loss": 0.038, "step": 2332 }, { "epoch": 0.48, "learning_rate": 0.0002945770281741953, "loss": 0.0121, "step": 2333 }, { "epoch": 0.48, "learning_rate": 0.000294571861603331, "loss": 0.0377, "step": 2334 }, { "epoch": 0.48, "learning_rate": 0.0002945666926178437, "loss": 0.0403, "step": 2335 }, { "epoch": 0.48, "learning_rate": 0.0002945615212178197, "loss": 0.0169, "step": 2336 }, { "epoch": 0.48, "learning_rate": 0.0002945563474033454, "loss": 0.0277, "step": 2337 }, { "epoch": 0.48, "learning_rate": 0.0002945511711745073, "loss": 0.0478, "step": 2338 }, { "epoch": 0.48, "learning_rate": 0.0002945459925313917, "loss": 0.013, "step": 2339 }, { "epoch": 0.48, "learning_rate": 0.00029454081147408523, "loss": 0.0298, "step": 2340 }, { "epoch": 0.48, "learning_rate": 0.00029453562800267434, "loss": 0.0411, "step": 2341 }, { "epoch": 0.48, "learning_rate": 0.00029453044211724563, "loss": 0.0449, "step": 2342 }, { "epoch": 0.48, "learning_rate": 0.0002945252538178858, "loss": 0.017, "step": 2343 }, { "epoch": 0.48, "learning_rate": 0.0002945200631046813, "loss": 0.0262, "step": 2344 }, { "epoch": 0.48, "learning_rate": 0.000294514869977719, "loss": 0.0231, "step": 2345 }, { "epoch": 0.48, "learning_rate": 0.0002945096744370856, "loss": 0.0149, "step": 2346 }, { "epoch": 0.48, "learning_rate": 0.0002945044764828678, "loss": 0.0166, "step": 2347 }, { "epoch": 0.48, "learning_rate": 0.00029449927611515254, "loss": 0.0178, "step": 2348 }, { "epoch": 0.48, "learning_rate": 0.0002944940733340266, "loss": 0.025, "step": 2349 }, { "epoch": 0.48, "learning_rate": 0.0002944888681395768, "loss": 0.0288, "step": 2350 }, { "epoch": 0.48, "learning_rate": 0.00029448366053189026, "loss": 0.0292, "step": 2351 }, { "epoch": 0.48, "learning_rate": 0.0002944784505110538, "loss": 0.0263, "step": 2352 }, { "epoch": 0.48, "learning_rate": 0.0002944732380771545, "loss": 0.022, "step": 2353 }, { "epoch": 0.48, "learning_rate": 0.0002944680232302794, "loss": 0.0301, "step": 2354 }, { "epoch": 0.48, "learning_rate": 0.00029446280597051564, "loss": 0.0249, "step": 2355 }, { "epoch": 0.48, "learning_rate": 0.0002944575862979503, "loss": 0.0181, "step": 2356 }, { "epoch": 0.48, "learning_rate": 0.0002944523642126706, "loss": 0.0144, "step": 2357 }, { "epoch": 0.48, "learning_rate": 0.0002944471397147638, "loss": 0.0107, "step": 2358 }, { "epoch": 0.48, "learning_rate": 0.000294441912804317, "loss": 0.0268, "step": 2359 }, { "epoch": 0.48, "learning_rate": 0.00029443668348141765, "loss": 0.0072, "step": 2360 }, { "epoch": 0.48, "learning_rate": 0.00029443145174615307, "loss": 0.0099, "step": 2361 }, { "epoch": 0.48, "learning_rate": 0.00029442621759861055, "loss": 0.0252, "step": 2362 }, { "epoch": 0.48, "learning_rate": 0.0002944209810388776, "loss": 0.021, "step": 2363 }, { "epoch": 0.48, "learning_rate": 0.0002944157420670417, "loss": 0.0365, "step": 2364 }, { "epoch": 0.48, "learning_rate": 0.0002944105006831902, "loss": 0.0281, "step": 2365 }, { "epoch": 0.48, "learning_rate": 0.0002944052568874109, "loss": 0.0118, "step": 2366 }, { "epoch": 0.48, "learning_rate": 0.0002944000106797911, "loss": 0.0327, "step": 2367 }, { "epoch": 0.48, "learning_rate": 0.0002943947620604186, "loss": 0.004, "step": 2368 }, { "epoch": 0.48, "learning_rate": 0.00029438951102938097, "loss": 0.0248, "step": 2369 }, { "epoch": 0.48, "learning_rate": 0.00029438425758676596, "loss": 0.0196, "step": 2370 }, { "epoch": 0.48, "learning_rate": 0.0002943790017326613, "loss": 0.0315, "step": 2371 }, { "epoch": 0.48, "learning_rate": 0.0002943737434671548, "loss": 0.0106, "step": 2372 }, { "epoch": 0.48, "learning_rate": 0.0002943684827903343, "loss": 0.0163, "step": 2373 }, { "epoch": 0.48, "learning_rate": 0.0002943632197022875, "loss": 0.1069, "step": 2374 }, { "epoch": 0.48, "learning_rate": 0.0002943579542031025, "loss": 0.0514, "step": 2375 }, { "epoch": 0.48, "learning_rate": 0.0002943526862928672, "loss": 0.0102, "step": 2376 }, { "epoch": 0.48, "learning_rate": 0.0002943474159716696, "loss": 0.0495, "step": 2377 }, { "epoch": 0.48, "learning_rate": 0.00029434214323959755, "loss": 0.0246, "step": 2378 }, { "epoch": 0.48, "learning_rate": 0.00029433686809673926, "loss": 0.022, "step": 2379 }, { "epoch": 0.48, "learning_rate": 0.0002943315905431829, "loss": 0.0425, "step": 2380 }, { "epoch": 0.48, "learning_rate": 0.00029432631057901647, "loss": 0.0356, "step": 2381 }, { "epoch": 0.49, "learning_rate": 0.0002943210282043282, "loss": 0.007, "step": 2382 }, { "epoch": 0.49, "learning_rate": 0.0002943157434192064, "loss": 0.014, "step": 2383 }, { "epoch": 0.49, "learning_rate": 0.0002943104562237393, "loss": 0.0228, "step": 2384 }, { "epoch": 0.49, "learning_rate": 0.00029430516661801503, "loss": 0.0188, "step": 2385 }, { "epoch": 0.49, "learning_rate": 0.0002942998746021222, "loss": 0.0376, "step": 2386 }, { "epoch": 0.49, "learning_rate": 0.000294294580176149, "loss": 0.0114, "step": 2387 }, { "epoch": 0.49, "learning_rate": 0.00029428928334018404, "loss": 0.0198, "step": 2388 }, { "epoch": 0.49, "learning_rate": 0.0002942839840943156, "loss": 0.0128, "step": 2389 }, { "epoch": 0.49, "learning_rate": 0.0002942786824386323, "loss": 0.0318, "step": 2390 }, { "epoch": 0.49, "learning_rate": 0.0002942733783732226, "loss": 0.0116, "step": 2391 }, { "epoch": 0.49, "learning_rate": 0.0002942680718981752, "loss": 0.0433, "step": 2392 }, { "epoch": 0.49, "learning_rate": 0.0002942627630135787, "loss": 0.0345, "step": 2393 }, { "epoch": 0.49, "learning_rate": 0.00029425745171952173, "loss": 0.0433, "step": 2394 }, { "epoch": 0.49, "learning_rate": 0.00029425213801609297, "loss": 0.0093, "step": 2395 }, { "epoch": 0.49, "learning_rate": 0.00029424682190338125, "loss": 0.061, "step": 2396 }, { "epoch": 0.49, "learning_rate": 0.00029424150338147533, "loss": 0.0303, "step": 2397 }, { "epoch": 0.49, "learning_rate": 0.000294236182450464, "loss": 0.0067, "step": 2398 }, { "epoch": 0.49, "learning_rate": 0.00029423085911043615, "loss": 0.0138, "step": 2399 }, { "epoch": 0.49, "learning_rate": 0.0002942255333614807, "loss": 0.0412, "step": 2400 }, { "epoch": 0.49, "learning_rate": 0.0002942202052036866, "loss": 0.0068, "step": 2401 }, { "epoch": 0.49, "learning_rate": 0.0002942148746371428, "loss": 0.0132, "step": 2402 }, { "epoch": 0.49, "learning_rate": 0.0002942095416619384, "loss": 0.0911, "step": 2403 }, { "epoch": 0.49, "learning_rate": 0.00029420420627816247, "loss": 0.0233, "step": 2404 }, { "epoch": 0.49, "learning_rate": 0.0002941988684859041, "loss": 0.0526, "step": 2405 }, { "epoch": 0.49, "learning_rate": 0.0002941935282852524, "loss": 0.0133, "step": 2406 }, { "epoch": 0.49, "learning_rate": 0.0002941881856762966, "loss": 0.0275, "step": 2407 }, { "epoch": 0.49, "learning_rate": 0.00029418284065912595, "loss": 0.0274, "step": 2408 }, { "epoch": 0.49, "learning_rate": 0.00029417749323382966, "loss": 0.0032, "step": 2409 }, { "epoch": 0.49, "learning_rate": 0.00029417214340049703, "loss": 0.0313, "step": 2410 }, { "epoch": 0.49, "learning_rate": 0.0002941667911592175, "loss": 0.0182, "step": 2411 }, { "epoch": 0.49, "learning_rate": 0.0002941614365100805, "loss": 0.0114, "step": 2412 }, { "epoch": 0.49, "learning_rate": 0.0002941560794531753, "loss": 0.0043, "step": 2413 }, { "epoch": 0.49, "learning_rate": 0.0002941507199885915, "loss": 0.0141, "step": 2414 }, { "epoch": 0.49, "learning_rate": 0.00029414535811641857, "loss": 0.0165, "step": 2415 }, { "epoch": 0.49, "learning_rate": 0.00029413999383674604, "loss": 0.0295, "step": 2416 }, { "epoch": 0.49, "learning_rate": 0.00029413462714966357, "loss": 0.0215, "step": 2417 }, { "epoch": 0.49, "learning_rate": 0.0002941292580552607, "loss": 0.006, "step": 2418 }, { "epoch": 0.49, "learning_rate": 0.0002941238865536272, "loss": 0.0404, "step": 2419 }, { "epoch": 0.49, "learning_rate": 0.00029411851264485273, "loss": 0.0374, "step": 2420 }, { "epoch": 0.49, "learning_rate": 0.00029411313632902704, "loss": 0.0629, "step": 2421 }, { "epoch": 0.49, "learning_rate": 0.00029410775760623994, "loss": 0.0097, "step": 2422 }, { "epoch": 0.49, "learning_rate": 0.00029410237647658127, "loss": 0.0092, "step": 2423 }, { "epoch": 0.49, "learning_rate": 0.00029409699294014095, "loss": 0.0278, "step": 2424 }, { "epoch": 0.49, "learning_rate": 0.00029409160699700877, "loss": 0.0176, "step": 2425 }, { "epoch": 0.49, "learning_rate": 0.0002940862186472748, "loss": 0.0398, "step": 2426 }, { "epoch": 0.49, "learning_rate": 0.000294080827891029, "loss": 0.0164, "step": 2427 }, { "epoch": 0.49, "learning_rate": 0.0002940754347283614, "loss": 0.0339, "step": 2428 }, { "epoch": 0.49, "learning_rate": 0.00029407003915936207, "loss": 0.026, "step": 2429 }, { "epoch": 0.49, "learning_rate": 0.0002940646411841211, "loss": 0.0155, "step": 2430 }, { "epoch": 0.49, "learning_rate": 0.0002940592408027288, "loss": 0.0341, "step": 2431 }, { "epoch": 0.5, "learning_rate": 0.00029405383801527513, "loss": 0.0318, "step": 2432 }, { "epoch": 0.5, "learning_rate": 0.00029404843282185045, "loss": 0.0283, "step": 2433 }, { "epoch": 0.5, "learning_rate": 0.0002940430252225451, "loss": 0.0163, "step": 2434 }, { "epoch": 0.5, "learning_rate": 0.0002940376152174493, "loss": 0.0316, "step": 2435 }, { "epoch": 0.5, "learning_rate": 0.00029403220280665337, "loss": 0.0121, "step": 2436 }, { "epoch": 0.5, "learning_rate": 0.00029402678799024783, "loss": 0.0208, "step": 2437 }, { "epoch": 0.5, "learning_rate": 0.0002940213707683231, "loss": 0.0406, "step": 2438 }, { "epoch": 0.5, "learning_rate": 0.00029401595114096954, "loss": 0.0269, "step": 2439 }, { "epoch": 0.5, "learning_rate": 0.0002940105291082778, "loss": 0.0231, "step": 2440 }, { "epoch": 0.5, "learning_rate": 0.0002940051046703384, "loss": 0.0529, "step": 2441 }, { "epoch": 0.5, "learning_rate": 0.00029399967782724185, "loss": 0.0257, "step": 2442 }, { "epoch": 0.5, "learning_rate": 0.00029399424857907893, "loss": 0.0195, "step": 2443 }, { "epoch": 0.5, "learning_rate": 0.00029398881692594016, "loss": 0.0443, "step": 2444 }, { "epoch": 0.5, "learning_rate": 0.00029398338286791646, "loss": 0.0188, "step": 2445 }, { "epoch": 0.5, "learning_rate": 0.00029397794640509845, "loss": 0.0145, "step": 2446 }, { "epoch": 0.5, "learning_rate": 0.00029397250753757694, "loss": 0.0137, "step": 2447 }, { "epoch": 0.5, "learning_rate": 0.00029396706626544274, "loss": 0.0217, "step": 2448 }, { "epoch": 0.5, "learning_rate": 0.0002939616225887868, "loss": 0.0093, "step": 2449 }, { "epoch": 0.5, "learning_rate": 0.00029395617650770006, "loss": 0.014, "step": 2450 }, { "epoch": 0.5, "learning_rate": 0.00029395072802227345, "loss": 0.0231, "step": 2451 }, { "epoch": 0.5, "learning_rate": 0.0002939452771325979, "loss": 0.0066, "step": 2452 }, { "epoch": 0.5, "learning_rate": 0.0002939398238387645, "loss": 0.0705, "step": 2453 }, { "epoch": 0.5, "learning_rate": 0.0002939343681408644, "loss": 0.0357, "step": 2454 }, { "epoch": 0.5, "learning_rate": 0.0002939289100389886, "loss": 0.0508, "step": 2455 }, { "epoch": 0.5, "learning_rate": 0.0002939234495332283, "loss": 0.016, "step": 2456 }, { "epoch": 0.5, "learning_rate": 0.0002939179866236748, "loss": 0.0223, "step": 2457 }, { "epoch": 0.5, "learning_rate": 0.0002939125213104192, "loss": 0.0182, "step": 2458 }, { "epoch": 0.5, "learning_rate": 0.00029390705359355287, "loss": 0.0079, "step": 2459 }, { "epoch": 0.5, "learning_rate": 0.0002939015834731671, "loss": 0.0142, "step": 2460 }, { "epoch": 0.5, "learning_rate": 0.0002938961109493532, "loss": 0.0205, "step": 2461 }, { "epoch": 0.5, "learning_rate": 0.00029389063602220267, "loss": 0.0111, "step": 2462 }, { "epoch": 0.5, "learning_rate": 0.0002938851586918069, "loss": 0.0168, "step": 2463 }, { "epoch": 0.5, "learning_rate": 0.0002938796789582574, "loss": 0.0253, "step": 2464 }, { "epoch": 0.5, "learning_rate": 0.0002938741968216456, "loss": 0.0122, "step": 2465 }, { "epoch": 0.5, "learning_rate": 0.00029386871228206316, "loss": 0.0286, "step": 2466 }, { "epoch": 0.5, "learning_rate": 0.0002938632253396017, "loss": 0.0149, "step": 2467 }, { "epoch": 0.5, "learning_rate": 0.00029385773599435277, "loss": 0.0246, "step": 2468 }, { "epoch": 0.5, "learning_rate": 0.0002938522442464081, "loss": 0.0124, "step": 2469 }, { "epoch": 0.5, "learning_rate": 0.00029384675009585945, "loss": 0.0213, "step": 2470 }, { "epoch": 0.5, "learning_rate": 0.0002938412535427985, "loss": 0.0215, "step": 2471 }, { "epoch": 0.5, "learning_rate": 0.0002938357545873171, "loss": 0.0134, "step": 2472 }, { "epoch": 0.5, "learning_rate": 0.0002938302532295071, "loss": 0.0449, "step": 2473 }, { "epoch": 0.5, "learning_rate": 0.0002938247494694604, "loss": 0.0236, "step": 2474 }, { "epoch": 0.5, "learning_rate": 0.0002938192433072688, "loss": 0.0225, "step": 2475 }, { "epoch": 0.5, "learning_rate": 0.0002938137347430245, "loss": 0.0202, "step": 2476 }, { "epoch": 0.5, "learning_rate": 0.00029380822377681924, "loss": 0.0198, "step": 2477 }, { "epoch": 0.5, "learning_rate": 0.00029380271040874525, "loss": 0.02, "step": 2478 }, { "epoch": 0.5, "learning_rate": 0.0002937971946388945, "loss": 0.0283, "step": 2479 }, { "epoch": 0.5, "learning_rate": 0.00029379167646735924, "loss": 0.0176, "step": 2480 }, { "epoch": 0.51, "learning_rate": 0.0002937861558942315, "loss": 0.0244, "step": 2481 }, { "epoch": 0.51, "learning_rate": 0.00029378063291960355, "loss": 0.0252, "step": 2482 }, { "epoch": 0.51, "learning_rate": 0.00029377510754356766, "loss": 0.0133, "step": 2483 }, { "epoch": 0.51, "learning_rate": 0.00029376957976621603, "loss": 0.0419, "step": 2484 }, { "epoch": 0.51, "learning_rate": 0.00029376404958764103, "loss": 0.0332, "step": 2485 }, { "epoch": 0.51, "learning_rate": 0.0002937585170079351, "loss": 0.0038, "step": 2486 }, { "epoch": 0.51, "learning_rate": 0.0002937529820271905, "loss": 0.0253, "step": 2487 }, { "epoch": 0.51, "learning_rate": 0.00029374744464549975, "loss": 0.0162, "step": 2488 }, { "epoch": 0.51, "learning_rate": 0.0002937419048629554, "loss": 0.0249, "step": 2489 }, { "epoch": 0.51, "learning_rate": 0.00029373636267964983, "loss": 0.0426, "step": 2490 }, { "epoch": 0.51, "learning_rate": 0.0002937308180956757, "loss": 0.0198, "step": 2491 }, { "epoch": 0.51, "learning_rate": 0.0002937252711111256, "loss": 0.0438, "step": 2492 }, { "epoch": 0.51, "learning_rate": 0.0002937197217260922, "loss": 0.0397, "step": 2493 }, { "epoch": 0.51, "learning_rate": 0.00029371416994066813, "loss": 0.0173, "step": 2494 }, { "epoch": 0.51, "learning_rate": 0.00029370861575494616, "loss": 0.0266, "step": 2495 }, { "epoch": 0.51, "learning_rate": 0.000293703059169019, "loss": 0.0191, "step": 2496 }, { "epoch": 0.51, "learning_rate": 0.00029369750018297955, "loss": 0.0137, "step": 2497 }, { "epoch": 0.51, "learning_rate": 0.0002936919387969205, "loss": 0.0231, "step": 2498 }, { "epoch": 0.51, "learning_rate": 0.00029368637501093494, "loss": 0.0174, "step": 2499 }, { "epoch": 0.51, "learning_rate": 0.00029368080882511566, "loss": 0.035, "step": 2500 }, { "epoch": 0.51, "learning_rate": 0.00029367524023955565, "loss": 0.0097, "step": 2501 }, { "epoch": 0.51, "learning_rate": 0.00029366966925434794, "loss": 0.0375, "step": 2502 }, { "epoch": 0.51, "learning_rate": 0.0002936640958695855, "loss": 0.0385, "step": 2503 }, { "epoch": 0.51, "learning_rate": 0.0002936585200853615, "loss": 0.0147, "step": 2504 }, { "epoch": 0.51, "learning_rate": 0.0002936529419017691, "loss": 0.055, "step": 2505 }, { "epoch": 0.51, "learning_rate": 0.0002936473613189013, "loss": 0.0334, "step": 2506 }, { "epoch": 0.51, "learning_rate": 0.00029364177833685154, "loss": 0.0626, "step": 2507 }, { "epoch": 0.51, "learning_rate": 0.0002936361929557129, "loss": 0.0245, "step": 2508 }, { "epoch": 0.51, "learning_rate": 0.0002936306051755786, "loss": 0.0171, "step": 2509 }, { "epoch": 0.51, "learning_rate": 0.00029362501499654214, "loss": 0.0053, "step": 2510 }, { "epoch": 0.51, "learning_rate": 0.0002936194224186968, "loss": 0.0335, "step": 2511 }, { "epoch": 0.51, "learning_rate": 0.00029361382744213604, "loss": 0.0102, "step": 2512 }, { "epoch": 0.51, "learning_rate": 0.0002936082300669533, "loss": 0.0183, "step": 2513 }, { "epoch": 0.51, "learning_rate": 0.000293602630293242, "loss": 0.0263, "step": 2514 }, { "epoch": 0.51, "learning_rate": 0.00029359702812109566, "loss": 0.021, "step": 2515 }, { "epoch": 0.51, "learning_rate": 0.00029359142355060795, "loss": 0.0239, "step": 2516 }, { "epoch": 0.51, "learning_rate": 0.0002935858165818724, "loss": 0.0237, "step": 2517 }, { "epoch": 0.51, "learning_rate": 0.0002935802072149827, "loss": 0.0327, "step": 2518 }, { "epoch": 0.51, "learning_rate": 0.00029357459545003244, "loss": 0.0646, "step": 2519 }, { "epoch": 0.51, "learning_rate": 0.0002935689812871155, "loss": 0.0391, "step": 2520 }, { "epoch": 0.51, "learning_rate": 0.0002935633647263255, "loss": 0.0395, "step": 2521 }, { "epoch": 0.51, "learning_rate": 0.0002935577457677564, "loss": 0.0223, "step": 2522 }, { "epoch": 0.51, "learning_rate": 0.0002935521244115019, "loss": 0.0391, "step": 2523 }, { "epoch": 0.51, "learning_rate": 0.000293546500657656, "loss": 0.0386, "step": 2524 }, { "epoch": 0.51, "learning_rate": 0.00029354087450631254, "loss": 0.0354, "step": 2525 }, { "epoch": 0.51, "learning_rate": 0.0002935352459575655, "loss": 0.0163, "step": 2526 }, { "epoch": 0.51, "learning_rate": 0.00029352961501150895, "loss": 0.0106, "step": 2527 }, { "epoch": 0.51, "learning_rate": 0.0002935239816682369, "loss": 0.0342, "step": 2528 }, { "epoch": 0.51, "learning_rate": 0.0002935183459278434, "loss": 0.0161, "step": 2529 }, { "epoch": 0.52, "learning_rate": 0.0002935127077904226, "loss": 0.0287, "step": 2530 }, { "epoch": 0.52, "learning_rate": 0.0002935070672560687, "loss": 0.0133, "step": 2531 }, { "epoch": 0.52, "learning_rate": 0.0002935014243248759, "loss": 0.0117, "step": 2532 }, { "epoch": 0.52, "learning_rate": 0.0002934957789969384, "loss": 0.0256, "step": 2533 }, { "epoch": 0.52, "learning_rate": 0.00029349013127235056, "loss": 0.0259, "step": 2534 }, { "epoch": 0.52, "learning_rate": 0.00029348448115120666, "loss": 0.0128, "step": 2535 }, { "epoch": 0.52, "learning_rate": 0.0002934788286336011, "loss": 0.0104, "step": 2536 }, { "epoch": 0.52, "learning_rate": 0.00029347317371962824, "loss": 0.0047, "step": 2537 }, { "epoch": 0.52, "learning_rate": 0.0002934675164093826, "loss": 0.0266, "step": 2538 }, { "epoch": 0.52, "learning_rate": 0.0002934618567029586, "loss": 0.0197, "step": 2539 }, { "epoch": 0.52, "learning_rate": 0.00029345619460045076, "loss": 0.0114, "step": 2540 }, { "epoch": 0.52, "learning_rate": 0.0002934505301019537, "loss": 0.0201, "step": 2541 }, { "epoch": 0.52, "learning_rate": 0.000293444863207562, "loss": 0.0183, "step": 2542 }, { "epoch": 0.52, "learning_rate": 0.0002934391939173703, "loss": 0.0308, "step": 2543 }, { "epoch": 0.52, "learning_rate": 0.0002934335222314733, "loss": 0.0668, "step": 2544 }, { "epoch": 0.52, "learning_rate": 0.00029342784814996575, "loss": 0.0255, "step": 2545 }, { "epoch": 0.52, "learning_rate": 0.00029342217167294235, "loss": 0.0104, "step": 2546 }, { "epoch": 0.52, "learning_rate": 0.000293416492800498, "loss": 0.0028, "step": 2547 }, { "epoch": 0.52, "learning_rate": 0.00029341081153272754, "loss": 0.0246, "step": 2548 }, { "epoch": 0.52, "learning_rate": 0.00029340512786972577, "loss": 0.0212, "step": 2549 }, { "epoch": 0.52, "learning_rate": 0.00029339944181158765, "loss": 0.0243, "step": 2550 }, { "epoch": 0.52, "learning_rate": 0.0002933937533584082, "loss": 0.0144, "step": 2551 }, { "epoch": 0.52, "learning_rate": 0.0002933880625102824, "loss": 0.0121, "step": 2552 }, { "epoch": 0.52, "learning_rate": 0.00029338236926730523, "loss": 0.0261, "step": 2553 }, { "epoch": 0.52, "learning_rate": 0.0002933766736295719, "loss": 0.026, "step": 2554 }, { "epoch": 0.52, "learning_rate": 0.00029337097559717747, "loss": 0.0532, "step": 2555 }, { "epoch": 0.52, "learning_rate": 0.0002933652751702171, "loss": 0.0266, "step": 2556 }, { "epoch": 0.52, "learning_rate": 0.000293359572348786, "loss": 0.0357, "step": 2557 }, { "epoch": 0.52, "learning_rate": 0.00029335386713297946, "loss": 0.0107, "step": 2558 }, { "epoch": 0.52, "learning_rate": 0.0002933481595228928, "loss": 0.0318, "step": 2559 }, { "epoch": 0.52, "learning_rate": 0.0002933424495186212, "loss": 0.0411, "step": 2560 }, { "epoch": 0.52, "learning_rate": 0.0002933367371202601, "loss": 0.0203, "step": 2561 }, { "epoch": 0.52, "learning_rate": 0.00029333102232790496, "loss": 0.0109, "step": 2562 }, { "epoch": 0.52, "learning_rate": 0.00029332530514165125, "loss": 0.036, "step": 2563 }, { "epoch": 0.52, "learning_rate": 0.00029331958556159433, "loss": 0.0464, "step": 2564 }, { "epoch": 0.52, "learning_rate": 0.0002933138635878298, "loss": 0.0209, "step": 2565 }, { "epoch": 0.52, "learning_rate": 0.0002933081392204532, "loss": 0.0103, "step": 2566 }, { "epoch": 0.52, "learning_rate": 0.00029330241245956016, "loss": 0.0333, "step": 2567 }, { "epoch": 0.52, "learning_rate": 0.0002932966833052464, "loss": 0.0395, "step": 2568 }, { "epoch": 0.52, "learning_rate": 0.0002932909517576075, "loss": 0.022, "step": 2569 }, { "epoch": 0.52, "learning_rate": 0.0002932852178167392, "loss": 0.0239, "step": 2570 }, { "epoch": 0.52, "learning_rate": 0.00029327948148273733, "loss": 0.0142, "step": 2571 }, { "epoch": 0.52, "learning_rate": 0.00029327374275569764, "loss": 0.0213, "step": 2572 }, { "epoch": 0.52, "learning_rate": 0.000293268001635716, "loss": 0.0391, "step": 2573 }, { "epoch": 0.52, "learning_rate": 0.00029326225812288827, "loss": 0.0142, "step": 2574 }, { "epoch": 0.52, "learning_rate": 0.00029325651221731044, "loss": 0.0135, "step": 2575 }, { "epoch": 0.52, "learning_rate": 0.00029325076391907844, "loss": 0.0127, "step": 2576 }, { "epoch": 0.52, "learning_rate": 0.0002932450132282883, "loss": 0.0211, "step": 2577 }, { "epoch": 0.52, "learning_rate": 0.000293239260145036, "loss": 0.003, "step": 2578 }, { "epoch": 0.53, "learning_rate": 0.00029323350466941764, "loss": 0.014, "step": 2579 }, { "epoch": 0.53, "learning_rate": 0.00029322774680152943, "loss": 0.0074, "step": 2580 }, { "epoch": 0.53, "learning_rate": 0.00029322198654146747, "loss": 0.0154, "step": 2581 }, { "epoch": 0.53, "learning_rate": 0.000293216223889328, "loss": 0.0143, "step": 2582 }, { "epoch": 0.53, "learning_rate": 0.00029321045884520724, "loss": 0.0151, "step": 2583 }, { "epoch": 0.53, "learning_rate": 0.0002932046914092015, "loss": 0.0487, "step": 2584 }, { "epoch": 0.53, "learning_rate": 0.0002931989215814071, "loss": 0.0214, "step": 2585 }, { "epoch": 0.53, "learning_rate": 0.00029319314936192037, "loss": 0.0121, "step": 2586 }, { "epoch": 0.53, "learning_rate": 0.0002931873747508378, "loss": 0.0144, "step": 2587 }, { "epoch": 0.53, "learning_rate": 0.0002931815977482558, "loss": 0.0081, "step": 2588 }, { "epoch": 0.53, "learning_rate": 0.00029317581835427075, "loss": 0.0283, "step": 2589 }, { "epoch": 0.53, "learning_rate": 0.00029317003656897933, "loss": 0.0101, "step": 2590 }, { "epoch": 0.53, "learning_rate": 0.000293164252392478, "loss": 0.01, "step": 2591 }, { "epoch": 0.53, "learning_rate": 0.00029315846582486345, "loss": 0.0096, "step": 2592 }, { "epoch": 0.53, "learning_rate": 0.00029315267686623236, "loss": 0.0264, "step": 2593 }, { "epoch": 0.53, "learning_rate": 0.00029314688551668124, "loss": 0.0223, "step": 2594 }, { "epoch": 0.53, "learning_rate": 0.00029314109177630695, "loss": 0.0918, "step": 2595 }, { "epoch": 0.53, "learning_rate": 0.00029313529564520626, "loss": 0.0084, "step": 2596 }, { "epoch": 0.53, "learning_rate": 0.0002931294971234759, "loss": 0.0377, "step": 2597 }, { "epoch": 0.53, "learning_rate": 0.0002931236962112128, "loss": 0.0347, "step": 2598 }, { "epoch": 0.53, "learning_rate": 0.00029311789290851375, "loss": 0.0228, "step": 2599 }, { "epoch": 0.53, "learning_rate": 0.00029311208721547583, "loss": 0.0547, "step": 2600 }, { "epoch": 0.53, "learning_rate": 0.0002931062791321959, "loss": 0.0522, "step": 2601 }, { "epoch": 0.53, "learning_rate": 0.0002931004686587709, "loss": 0.0732, "step": 2602 }, { "epoch": 0.53, "learning_rate": 0.000293094655795298, "loss": 0.0132, "step": 2603 }, { "epoch": 0.53, "learning_rate": 0.0002930888405418742, "loss": 0.0368, "step": 2604 }, { "epoch": 0.53, "learning_rate": 0.00029308302289859673, "loss": 0.013, "step": 2605 }, { "epoch": 0.53, "learning_rate": 0.0002930772028655626, "loss": 0.0199, "step": 2606 }, { "epoch": 0.53, "learning_rate": 0.00029307138044286916, "loss": 0.0423, "step": 2607 }, { "epoch": 0.53, "learning_rate": 0.00029306555563061364, "loss": 0.0293, "step": 2608 }, { "epoch": 0.53, "learning_rate": 0.0002930597284288932, "loss": 0.0413, "step": 2609 }, { "epoch": 0.53, "learning_rate": 0.0002930538988378053, "loss": 0.067, "step": 2610 }, { "epoch": 0.53, "learning_rate": 0.0002930480668574472, "loss": 0.0457, "step": 2611 }, { "epoch": 0.53, "learning_rate": 0.0002930422324879165, "loss": 0.0185, "step": 2612 }, { "epoch": 0.53, "learning_rate": 0.00029303639572931037, "loss": 0.0198, "step": 2613 }, { "epoch": 0.53, "learning_rate": 0.00029303055658172646, "loss": 0.0067, "step": 2614 }, { "epoch": 0.53, "learning_rate": 0.0002930247150452623, "loss": 0.0196, "step": 2615 }, { "epoch": 0.53, "learning_rate": 0.0002930188711200154, "loss": 0.0339, "step": 2616 }, { "epoch": 0.53, "learning_rate": 0.00029301302480608336, "loss": 0.0298, "step": 2617 }, { "epoch": 0.53, "learning_rate": 0.0002930071761035639, "loss": 0.0216, "step": 2618 }, { "epoch": 0.53, "learning_rate": 0.0002930013250125546, "loss": 0.0204, "step": 2619 }, { "epoch": 0.53, "learning_rate": 0.0002929954715331533, "loss": 0.0324, "step": 2620 }, { "epoch": 0.53, "learning_rate": 0.00029298961566545764, "loss": 0.0385, "step": 2621 }, { "epoch": 0.53, "learning_rate": 0.00029298375740956554, "loss": 0.0223, "step": 2622 }, { "epoch": 0.53, "learning_rate": 0.00029297789676557476, "loss": 0.0153, "step": 2623 }, { "epoch": 0.53, "learning_rate": 0.0002929720337335832, "loss": 0.0147, "step": 2624 }, { "epoch": 0.53, "learning_rate": 0.00029296616831368886, "loss": 0.0341, "step": 2625 }, { "epoch": 0.53, "learning_rate": 0.0002929603005059896, "loss": 0.0315, "step": 2626 }, { "epoch": 0.53, "learning_rate": 0.00029295443031058344, "loss": 0.0037, "step": 2627 }, { "epoch": 0.54, "learning_rate": 0.00029294855772756846, "loss": 0.029, "step": 2628 }, { "epoch": 0.54, "learning_rate": 0.00029294268275704277, "loss": 0.047, "step": 2629 }, { "epoch": 0.54, "learning_rate": 0.0002929368053991044, "loss": 0.0223, "step": 2630 }, { "epoch": 0.54, "learning_rate": 0.00029293092565385164, "loss": 0.0549, "step": 2631 }, { "epoch": 0.54, "learning_rate": 0.00029292504352138255, "loss": 0.0674, "step": 2632 }, { "epoch": 0.54, "learning_rate": 0.0002929191590017955, "loss": 0.0255, "step": 2633 }, { "epoch": 0.54, "learning_rate": 0.00029291327209518867, "loss": 0.0537, "step": 2634 }, { "epoch": 0.54, "learning_rate": 0.00029290738280166045, "loss": 0.0431, "step": 2635 }, { "epoch": 0.54, "learning_rate": 0.0002929014911213092, "loss": 0.0777, "step": 2636 }, { "epoch": 0.54, "learning_rate": 0.00029289559705423325, "loss": 0.0265, "step": 2637 }, { "epoch": 0.54, "learning_rate": 0.0002928897006005311, "loss": 0.0189, "step": 2638 }, { "epoch": 0.54, "learning_rate": 0.00029288380176030124, "loss": 0.0242, "step": 2639 }, { "epoch": 0.54, "learning_rate": 0.0002928779005336422, "loss": 0.0405, "step": 2640 }, { "epoch": 0.54, "learning_rate": 0.0002928719969206525, "loss": 0.0193, "step": 2641 }, { "epoch": 0.54, "learning_rate": 0.0002928660909214308, "loss": 0.0204, "step": 2642 }, { "epoch": 0.54, "learning_rate": 0.00029286018253607565, "loss": 0.0063, "step": 2643 }, { "epoch": 0.54, "learning_rate": 0.0002928542717646858, "loss": 0.0225, "step": 2644 }, { "epoch": 0.54, "learning_rate": 0.00029284835860735997, "loss": 0.0171, "step": 2645 }, { "epoch": 0.54, "learning_rate": 0.0002928424430641969, "loss": 0.0413, "step": 2646 }, { "epoch": 0.54, "learning_rate": 0.00029283652513529537, "loss": 0.0384, "step": 2647 }, { "epoch": 0.54, "learning_rate": 0.0002928306048207543, "loss": 0.0101, "step": 2648 }, { "epoch": 0.54, "learning_rate": 0.00029282468212067246, "loss": 0.0042, "step": 2649 }, { "epoch": 0.54, "learning_rate": 0.00029281875703514884, "loss": 0.0201, "step": 2650 }, { "epoch": 0.54, "learning_rate": 0.00029281282956428244, "loss": 0.0184, "step": 2651 }, { "epoch": 0.54, "learning_rate": 0.00029280689970817217, "loss": 0.0057, "step": 2652 }, { "epoch": 0.54, "learning_rate": 0.0002928009674669171, "loss": 0.0647, "step": 2653 }, { "epoch": 0.54, "learning_rate": 0.0002927950328406163, "loss": 0.0146, "step": 2654 }, { "epoch": 0.54, "learning_rate": 0.0002927890958293689, "loss": 0.0187, "step": 2655 }, { "epoch": 0.54, "learning_rate": 0.0002927831564332741, "loss": 0.0128, "step": 2656 }, { "epoch": 0.54, "learning_rate": 0.0002927772146524311, "loss": 0.0168, "step": 2657 }, { "epoch": 0.54, "learning_rate": 0.0002927712704869391, "loss": 0.01, "step": 2658 }, { "epoch": 0.54, "learning_rate": 0.00029276532393689733, "loss": 0.0675, "step": 2659 }, { "epoch": 0.54, "learning_rate": 0.0002927593750024052, "loss": 0.0157, "step": 2660 }, { "epoch": 0.54, "learning_rate": 0.000292753423683562, "loss": 0.0083, "step": 2661 }, { "epoch": 0.54, "learning_rate": 0.0002927474699804672, "loss": 0.0369, "step": 2662 }, { "epoch": 0.54, "learning_rate": 0.00029274151389322014, "loss": 0.0158, "step": 2663 }, { "epoch": 0.54, "learning_rate": 0.0002927355554219204, "loss": 0.0168, "step": 2664 }, { "epoch": 0.54, "learning_rate": 0.0002927295945666674, "loss": 0.0194, "step": 2665 }, { "epoch": 0.54, "learning_rate": 0.0002927236313275608, "loss": 0.0128, "step": 2666 }, { "epoch": 0.54, "learning_rate": 0.00029271766570470014, "loss": 0.0435, "step": 2667 }, { "epoch": 0.54, "learning_rate": 0.00029271169769818506, "loss": 0.0298, "step": 2668 }, { "epoch": 0.54, "learning_rate": 0.0002927057273081152, "loss": 0.0132, "step": 2669 }, { "epoch": 0.54, "learning_rate": 0.0002926997545345904, "loss": 0.0078, "step": 2670 }, { "epoch": 0.54, "learning_rate": 0.0002926937793777102, "loss": 0.038, "step": 2671 }, { "epoch": 0.54, "learning_rate": 0.0002926878018375747, "loss": 0.0073, "step": 2672 }, { "epoch": 0.54, "learning_rate": 0.00029268182191428347, "loss": 0.0197, "step": 2673 }, { "epoch": 0.54, "learning_rate": 0.0002926758396079365, "loss": 0.047, "step": 2674 }, { "epoch": 0.54, "learning_rate": 0.0002926698549186337, "loss": 0.0207, "step": 2675 }, { "epoch": 0.54, "learning_rate": 0.00029266386784647494, "loss": 0.0417, "step": 2676 }, { "epoch": 0.55, "learning_rate": 0.0002926578783915604, "loss": 0.0103, "step": 2677 }, { "epoch": 0.55, "learning_rate": 0.00029265188655398994, "loss": 0.0266, "step": 2678 }, { "epoch": 0.55, "learning_rate": 0.0002926458923338637, "loss": 0.0437, "step": 2679 }, { "epoch": 0.55, "learning_rate": 0.0002926398957312818, "loss": 0.0682, "step": 2680 }, { "epoch": 0.55, "learning_rate": 0.00029263389674634443, "loss": 0.0527, "step": 2681 }, { "epoch": 0.55, "learning_rate": 0.00029262789537915174, "loss": 0.0155, "step": 2682 }, { "epoch": 0.55, "learning_rate": 0.0002926218916298039, "loss": 0.0384, "step": 2683 }, { "epoch": 0.55, "learning_rate": 0.0002926158854984013, "loss": 0.0337, "step": 2684 }, { "epoch": 0.55, "learning_rate": 0.00029260987698504425, "loss": 0.0133, "step": 2685 }, { "epoch": 0.55, "learning_rate": 0.000292603866089833, "loss": 0.0048, "step": 2686 }, { "epoch": 0.55, "learning_rate": 0.000292597852812868, "loss": 0.0163, "step": 2687 }, { "epoch": 0.55, "learning_rate": 0.0002925918371542497, "loss": 0.0237, "step": 2688 }, { "epoch": 0.55, "learning_rate": 0.00029258581911407853, "loss": 0.0366, "step": 2689 }, { "epoch": 0.55, "learning_rate": 0.00029257979869245506, "loss": 0.0425, "step": 2690 }, { "epoch": 0.55, "learning_rate": 0.0002925737758894798, "loss": 0.0084, "step": 2691 }, { "epoch": 0.55, "learning_rate": 0.0002925677507052534, "loss": 0.0349, "step": 2692 }, { "epoch": 0.55, "learning_rate": 0.00029256172313987637, "loss": 0.007, "step": 2693 }, { "epoch": 0.55, "learning_rate": 0.00029255569319344953, "loss": 0.0052, "step": 2694 }, { "epoch": 0.55, "learning_rate": 0.0002925496608660735, "loss": 0.0267, "step": 2695 }, { "epoch": 0.55, "learning_rate": 0.0002925436261578491, "loss": 0.0186, "step": 2696 }, { "epoch": 0.55, "learning_rate": 0.00029253758906887695, "loss": 0.0373, "step": 2697 }, { "epoch": 0.55, "learning_rate": 0.0002925315495992581, "loss": 0.0072, "step": 2698 }, { "epoch": 0.55, "learning_rate": 0.0002925255077490933, "loss": 0.0246, "step": 2699 }, { "epoch": 0.55, "learning_rate": 0.00029251946351848345, "loss": 0.0329, "step": 2700 }, { "epoch": 0.55, "learning_rate": 0.0002925134169075296, "loss": 0.0197, "step": 2701 }, { "epoch": 0.55, "learning_rate": 0.00029250736791633256, "loss": 0.0333, "step": 2702 }, { "epoch": 0.55, "learning_rate": 0.0002925013165449936, "loss": 0.0304, "step": 2703 }, { "epoch": 0.55, "learning_rate": 0.0002924952627936136, "loss": 0.0024, "step": 2704 }, { "epoch": 0.55, "learning_rate": 0.0002924892066622937, "loss": 0.0462, "step": 2705 }, { "epoch": 0.55, "learning_rate": 0.0002924831481511352, "loss": 0.0181, "step": 2706 }, { "epoch": 0.55, "learning_rate": 0.0002924770872602391, "loss": 0.0192, "step": 2707 }, { "epoch": 0.55, "learning_rate": 0.0002924710239897067, "loss": 0.018, "step": 2708 }, { "epoch": 0.55, "learning_rate": 0.0002924649583396393, "loss": 0.0304, "step": 2709 }, { "epoch": 0.55, "learning_rate": 0.0002924588903101381, "loss": 0.0145, "step": 2710 }, { "epoch": 0.55, "learning_rate": 0.0002924528199013045, "loss": 0.0094, "step": 2711 }, { "epoch": 0.55, "learning_rate": 0.00029244674711324, "loss": 0.0299, "step": 2712 }, { "epoch": 0.55, "learning_rate": 0.00029244067194604594, "loss": 0.0142, "step": 2713 }, { "epoch": 0.55, "learning_rate": 0.00029243459439982374, "loss": 0.0118, "step": 2714 }, { "epoch": 0.55, "learning_rate": 0.00029242851447467495, "loss": 0.0414, "step": 2715 }, { "epoch": 0.55, "learning_rate": 0.0002924224321707011, "loss": 0.0181, "step": 2716 }, { "epoch": 0.55, "learning_rate": 0.00029241634748800385, "loss": 0.0304, "step": 2717 }, { "epoch": 0.55, "learning_rate": 0.0002924102604266847, "loss": 0.0305, "step": 2718 }, { "epoch": 0.55, "learning_rate": 0.00029240417098684547, "loss": 0.0108, "step": 2719 }, { "epoch": 0.55, "learning_rate": 0.0002923980791685877, "loss": 0.0159, "step": 2720 }, { "epoch": 0.55, "learning_rate": 0.0002923919849720132, "loss": 0.0272, "step": 2721 }, { "epoch": 0.55, "learning_rate": 0.00029238588839722383, "loss": 0.0145, "step": 2722 }, { "epoch": 0.55, "learning_rate": 0.00029237978944432133, "loss": 0.021, "step": 2723 }, { "epoch": 0.55, "learning_rate": 0.0002923736881134076, "loss": 0.0385, "step": 2724 }, { "epoch": 0.55, "learning_rate": 0.0002923675844045845, "loss": 0.0102, "step": 2725 }, { "epoch": 0.56, "learning_rate": 0.000292361478317954, "loss": 0.033, "step": 2726 }, { "epoch": 0.56, "learning_rate": 0.00029235536985361806, "loss": 0.0144, "step": 2727 }, { "epoch": 0.56, "learning_rate": 0.00029234925901167877, "loss": 0.0283, "step": 2728 }, { "epoch": 0.56, "learning_rate": 0.0002923431457922382, "loss": 0.0101, "step": 2729 }, { "epoch": 0.56, "learning_rate": 0.0002923370301953983, "loss": 0.0139, "step": 2730 }, { "epoch": 0.56, "learning_rate": 0.0002923309122212614, "loss": 0.0072, "step": 2731 }, { "epoch": 0.56, "learning_rate": 0.00029232479186992955, "loss": 0.0103, "step": 2732 }, { "epoch": 0.56, "learning_rate": 0.000292318669141505, "loss": 0.0368, "step": 2733 }, { "epoch": 0.56, "learning_rate": 0.0002923125440360901, "loss": 0.014, "step": 2734 }, { "epoch": 0.56, "learning_rate": 0.000292306416553787, "loss": 0.0302, "step": 2735 }, { "epoch": 0.56, "learning_rate": 0.00029230028669469815, "loss": 0.0507, "step": 2736 }, { "epoch": 0.56, "learning_rate": 0.00029229415445892597, "loss": 0.0446, "step": 2737 }, { "epoch": 0.56, "learning_rate": 0.0002922880198465727, "loss": 0.0378, "step": 2738 }, { "epoch": 0.56, "learning_rate": 0.000292281882857741, "loss": 0.0243, "step": 2739 }, { "epoch": 0.56, "learning_rate": 0.00029227574349253326, "loss": 0.0254, "step": 2740 }, { "epoch": 0.56, "learning_rate": 0.000292269601751052, "loss": 0.0243, "step": 2741 }, { "epoch": 0.56, "learning_rate": 0.0002922634576333999, "loss": 0.038, "step": 2742 }, { "epoch": 0.56, "learning_rate": 0.00029225731113967943, "loss": 0.0109, "step": 2743 }, { "epoch": 0.56, "learning_rate": 0.0002922511622699934, "loss": 0.0098, "step": 2744 }, { "epoch": 0.56, "learning_rate": 0.00029224501102444444, "loss": 0.017, "step": 2745 }, { "epoch": 0.56, "learning_rate": 0.00029223885740313526, "loss": 0.0035, "step": 2746 }, { "epoch": 0.56, "learning_rate": 0.0002922327014061687, "loss": 0.0198, "step": 2747 }, { "epoch": 0.56, "learning_rate": 0.00029222654303364754, "loss": 0.007, "step": 2748 }, { "epoch": 0.56, "learning_rate": 0.00029222038228567457, "loss": 0.0105, "step": 2749 }, { "epoch": 0.56, "learning_rate": 0.0002922142191623528, "loss": 0.0137, "step": 2750 }, { "epoch": 0.56, "learning_rate": 0.0002922080536637852, "loss": 0.017, "step": 2751 }, { "epoch": 0.56, "learning_rate": 0.00029220188579007455, "loss": 0.0686, "step": 2752 }, { "epoch": 0.56, "learning_rate": 0.0002921957155413241, "loss": 0.0359, "step": 2753 }, { "epoch": 0.56, "learning_rate": 0.0002921895429176367, "loss": 0.0351, "step": 2754 }, { "epoch": 0.56, "learning_rate": 0.0002921833679191155, "loss": 0.0314, "step": 2755 }, { "epoch": 0.56, "learning_rate": 0.0002921771905458637, "loss": 0.0164, "step": 2756 }, { "epoch": 0.56, "learning_rate": 0.0002921710107979845, "loss": 0.0134, "step": 2757 }, { "epoch": 0.56, "learning_rate": 0.000292164828675581, "loss": 0.0193, "step": 2758 }, { "epoch": 0.56, "learning_rate": 0.0002921586441787565, "loss": 0.0143, "step": 2759 }, { "epoch": 0.56, "learning_rate": 0.0002921524573076143, "loss": 0.0054, "step": 2760 }, { "epoch": 0.56, "learning_rate": 0.00029214626806225774, "loss": 0.021, "step": 2761 }, { "epoch": 0.56, "learning_rate": 0.0002921400764427902, "loss": 0.0171, "step": 2762 }, { "epoch": 0.56, "learning_rate": 0.0002921338824493151, "loss": 0.0175, "step": 2763 }, { "epoch": 0.56, "learning_rate": 0.0002921276860819358, "loss": 0.0448, "step": 2764 }, { "epoch": 0.56, "learning_rate": 0.00029212148734075586, "loss": 0.0141, "step": 2765 }, { "epoch": 0.56, "learning_rate": 0.00029211528622587885, "loss": 0.0118, "step": 2766 }, { "epoch": 0.56, "learning_rate": 0.0002921090827374083, "loss": 0.0101, "step": 2767 }, { "epoch": 0.56, "learning_rate": 0.00029210287687544777, "loss": 0.0433, "step": 2768 }, { "epoch": 0.56, "learning_rate": 0.000292096668640101, "loss": 0.0121, "step": 2769 }, { "epoch": 0.56, "learning_rate": 0.00029209045803147164, "loss": 0.0187, "step": 2770 }, { "epoch": 0.56, "learning_rate": 0.00029208424504966336, "loss": 0.0473, "step": 2771 }, { "epoch": 0.56, "learning_rate": 0.0002920780296947801, "loss": 0.0124, "step": 2772 }, { "epoch": 0.56, "learning_rate": 0.0002920718119669254, "loss": 0.0189, "step": 2773 }, { "epoch": 0.56, "learning_rate": 0.0002920655918662034, "loss": 0.0191, "step": 2774 }, { "epoch": 0.57, "learning_rate": 0.00029205936939271775, "loss": 0.0417, "step": 2775 }, { "epoch": 0.57, "learning_rate": 0.00029205314454657254, "loss": 0.0479, "step": 2776 }, { "epoch": 0.57, "learning_rate": 0.0002920469173278716, "loss": 0.0239, "step": 2777 }, { "epoch": 0.57, "learning_rate": 0.0002920406877367191, "loss": 0.0411, "step": 2778 }, { "epoch": 0.57, "learning_rate": 0.0002920344557732189, "loss": 0.0077, "step": 2779 }, { "epoch": 0.57, "learning_rate": 0.00029202822143747524, "loss": 0.028, "step": 2780 }, { "epoch": 0.57, "learning_rate": 0.0002920219847295922, "loss": 0.0144, "step": 2781 }, { "epoch": 0.57, "learning_rate": 0.0002920157456496739, "loss": 0.0268, "step": 2782 }, { "epoch": 0.57, "learning_rate": 0.0002920095041978245, "loss": 0.0504, "step": 2783 }, { "epoch": 0.57, "learning_rate": 0.00029200326037414845, "loss": 0.0465, "step": 2784 }, { "epoch": 0.57, "learning_rate": 0.00029199701417874987, "loss": 0.0163, "step": 2785 }, { "epoch": 0.57, "learning_rate": 0.0002919907656117331, "loss": 0.0221, "step": 2786 }, { "epoch": 0.57, "learning_rate": 0.00029198451467320245, "loss": 0.0393, "step": 2787 }, { "epoch": 0.57, "learning_rate": 0.0002919782613632625, "loss": 0.0123, "step": 2788 }, { "epoch": 0.57, "learning_rate": 0.0002919720056820175, "loss": 0.0217, "step": 2789 }, { "epoch": 0.57, "learning_rate": 0.000291965747629572, "loss": 0.0305, "step": 2790 }, { "epoch": 0.57, "learning_rate": 0.0002919594872060306, "loss": 0.0116, "step": 2791 }, { "epoch": 0.57, "learning_rate": 0.0002919532244114978, "loss": 0.0295, "step": 2792 }, { "epoch": 0.57, "learning_rate": 0.00029194695924607814, "loss": 0.0268, "step": 2793 }, { "epoch": 0.57, "learning_rate": 0.00029194069170987636, "loss": 0.0085, "step": 2794 }, { "epoch": 0.57, "learning_rate": 0.0002919344218029971, "loss": 0.0198, "step": 2795 }, { "epoch": 0.57, "learning_rate": 0.00029192814952554505, "loss": 0.014, "step": 2796 }, { "epoch": 0.57, "learning_rate": 0.00029192187487762504, "loss": 0.0183, "step": 2797 }, { "epoch": 0.57, "learning_rate": 0.00029191559785934174, "loss": 0.0282, "step": 2798 }, { "epoch": 0.57, "learning_rate": 0.0002919093184708001, "loss": 0.0159, "step": 2799 }, { "epoch": 0.57, "learning_rate": 0.000291903036712105, "loss": 0.0184, "step": 2800 }, { "epoch": 0.57, "learning_rate": 0.00029189675258336134, "loss": 0.0186, "step": 2801 }, { "epoch": 0.57, "learning_rate": 0.000291890466084674, "loss": 0.0224, "step": 2802 }, { "epoch": 0.57, "learning_rate": 0.00029188417721614813, "loss": 0.0122, "step": 2803 }, { "epoch": 0.57, "learning_rate": 0.00029187788597788856, "loss": 0.0251, "step": 2804 }, { "epoch": 0.57, "learning_rate": 0.00029187159237000057, "loss": 0.0255, "step": 2805 }, { "epoch": 0.57, "learning_rate": 0.00029186529639258917, "loss": 0.0209, "step": 2806 }, { "epoch": 0.57, "learning_rate": 0.0002918589980457595, "loss": 0.0161, "step": 2807 }, { "epoch": 0.57, "learning_rate": 0.0002918526973296168, "loss": 0.026, "step": 2808 }, { "epoch": 0.57, "learning_rate": 0.00029184639424426626, "loss": 0.0345, "step": 2809 }, { "epoch": 0.57, "learning_rate": 0.00029184008878981325, "loss": 0.0161, "step": 2810 }, { "epoch": 0.57, "learning_rate": 0.000291833780966363, "loss": 0.0081, "step": 2811 }, { "epoch": 0.57, "learning_rate": 0.0002918274707740208, "loss": 0.0081, "step": 2812 }, { "epoch": 0.57, "learning_rate": 0.0002918211582128922, "loss": 0.0211, "step": 2813 }, { "epoch": 0.57, "learning_rate": 0.0002918148432830825, "loss": 0.013, "step": 2814 }, { "epoch": 0.57, "learning_rate": 0.00029180852598469727, "loss": 0.032, "step": 2815 }, { "epoch": 0.57, "learning_rate": 0.00029180220631784196, "loss": 0.0332, "step": 2816 }, { "epoch": 0.57, "learning_rate": 0.00029179588428262214, "loss": 0.0163, "step": 2817 }, { "epoch": 0.57, "learning_rate": 0.0002917895598791434, "loss": 0.0206, "step": 2818 }, { "epoch": 0.57, "learning_rate": 0.0002917832331075113, "loss": 0.0362, "step": 2819 }, { "epoch": 0.57, "learning_rate": 0.0002917769039678316, "loss": 0.0336, "step": 2820 }, { "epoch": 0.57, "learning_rate": 0.00029177057246021005, "loss": 0.016, "step": 2821 }, { "epoch": 0.57, "learning_rate": 0.0002917642385847523, "loss": 0.014, "step": 2822 }, { "epoch": 0.57, "learning_rate": 0.0002917579023415641, "loss": 0.0702, "step": 2823 }, { "epoch": 0.58, "learning_rate": 0.00029175156373075135, "loss": 0.0261, "step": 2824 }, { "epoch": 0.58, "learning_rate": 0.00029174522275241996, "loss": 0.0199, "step": 2825 }, { "epoch": 0.58, "learning_rate": 0.00029173887940667583, "loss": 0.0124, "step": 2826 }, { "epoch": 0.58, "learning_rate": 0.0002917325336936248, "loss": 0.0096, "step": 2827 }, { "epoch": 0.58, "learning_rate": 0.0002917261856133729, "loss": 0.0269, "step": 2828 }, { "epoch": 0.58, "learning_rate": 0.0002917198351660262, "loss": 0.0068, "step": 2829 }, { "epoch": 0.58, "learning_rate": 0.00029171348235169074, "loss": 0.0097, "step": 2830 }, { "epoch": 0.58, "learning_rate": 0.0002917071271704726, "loss": 0.0127, "step": 2831 }, { "epoch": 0.58, "learning_rate": 0.000291700769622478, "loss": 0.027, "step": 2832 }, { "epoch": 0.58, "learning_rate": 0.000291694409707813, "loss": 0.0105, "step": 2833 }, { "epoch": 0.58, "learning_rate": 0.00029168804742658394, "loss": 0.0457, "step": 2834 }, { "epoch": 0.58, "learning_rate": 0.00029168168277889697, "loss": 0.0162, "step": 2835 }, { "epoch": 0.58, "learning_rate": 0.0002916753157648585, "loss": 0.0957, "step": 2836 }, { "epoch": 0.58, "learning_rate": 0.00029166894638457485, "loss": 0.0051, "step": 2837 }, { "epoch": 0.58, "learning_rate": 0.00029166257463815237, "loss": 0.1087, "step": 2838 }, { "epoch": 0.58, "learning_rate": 0.00029165620052569745, "loss": 0.026, "step": 2839 }, { "epoch": 0.58, "learning_rate": 0.0002916498240473166, "loss": 0.0133, "step": 2840 }, { "epoch": 0.58, "learning_rate": 0.0002916434452031163, "loss": 0.0391, "step": 2841 }, { "epoch": 0.58, "learning_rate": 0.0002916370639932031, "loss": 0.0102, "step": 2842 }, { "epoch": 0.58, "learning_rate": 0.0002916306804176836, "loss": 0.0175, "step": 2843 }, { "epoch": 0.58, "learning_rate": 0.0002916242944766644, "loss": 0.0191, "step": 2844 }, { "epoch": 0.58, "learning_rate": 0.00029161790617025205, "loss": 0.0119, "step": 2845 }, { "epoch": 0.58, "learning_rate": 0.0002916115154985534, "loss": 0.01, "step": 2846 }, { "epoch": 0.58, "learning_rate": 0.00029160512246167514, "loss": 0.014, "step": 2847 }, { "epoch": 0.58, "learning_rate": 0.00029159872705972407, "loss": 0.0068, "step": 2848 }, { "epoch": 0.58, "learning_rate": 0.0002915923292928069, "loss": 0.0419, "step": 2849 }, { "epoch": 0.58, "learning_rate": 0.00029158592916103064, "loss": 0.0491, "step": 2850 }, { "epoch": 0.58, "learning_rate": 0.00029157952666450203, "loss": 0.0129, "step": 2851 }, { "epoch": 0.58, "learning_rate": 0.0002915731218033281, "loss": 0.0147, "step": 2852 }, { "epoch": 0.58, "learning_rate": 0.00029156671457761577, "loss": 0.0174, "step": 2853 }, { "epoch": 0.58, "learning_rate": 0.00029156030498747213, "loss": 0.0347, "step": 2854 }, { "epoch": 0.58, "learning_rate": 0.00029155389303300416, "loss": 0.0397, "step": 2855 }, { "epoch": 0.58, "learning_rate": 0.00029154747871431896, "loss": 0.0497, "step": 2856 }, { "epoch": 0.58, "learning_rate": 0.0002915410620315237, "loss": 0.003, "step": 2857 }, { "epoch": 0.58, "learning_rate": 0.0002915346429847255, "loss": 0.0093, "step": 2858 }, { "epoch": 0.58, "learning_rate": 0.00029152822157403163, "loss": 0.0431, "step": 2859 }, { "epoch": 0.58, "learning_rate": 0.0002915217977995493, "loss": 0.0113, "step": 2860 }, { "epoch": 0.58, "learning_rate": 0.00029151537166138575, "loss": 0.0113, "step": 2861 }, { "epoch": 0.58, "learning_rate": 0.0002915089431596484, "loss": 0.0899, "step": 2862 }, { "epoch": 0.58, "learning_rate": 0.00029150251229444457, "loss": 0.0156, "step": 2863 }, { "epoch": 0.58, "learning_rate": 0.00029149607906588175, "loss": 0.0222, "step": 2864 }, { "epoch": 0.58, "learning_rate": 0.00029148964347406724, "loss": 0.0086, "step": 2865 }, { "epoch": 0.58, "learning_rate": 0.00029148320551910866, "loss": 0.021, "step": 2866 }, { "epoch": 0.58, "learning_rate": 0.00029147676520111345, "loss": 0.0175, "step": 2867 }, { "epoch": 0.58, "learning_rate": 0.0002914703225201892, "loss": 0.0152, "step": 2868 }, { "epoch": 0.58, "learning_rate": 0.0002914638774764435, "loss": 0.0286, "step": 2869 }, { "epoch": 0.58, "learning_rate": 0.00029145743006998403, "loss": 0.0165, "step": 2870 }, { "epoch": 0.58, "learning_rate": 0.00029145098030091847, "loss": 0.0192, "step": 2871 }, { "epoch": 0.58, "learning_rate": 0.0002914445281693545, "loss": 0.0265, "step": 2872 }, { "epoch": 0.58, "learning_rate": 0.00029143807367539997, "loss": 0.0256, "step": 2873 }, { "epoch": 0.59, "learning_rate": 0.0002914316168191626, "loss": 0.0402, "step": 2874 }, { "epoch": 0.59, "learning_rate": 0.00029142515760075026, "loss": 0.0456, "step": 2875 }, { "epoch": 0.59, "learning_rate": 0.0002914186960202708, "loss": 0.0279, "step": 2876 }, { "epoch": 0.59, "learning_rate": 0.0002914122320778322, "loss": 0.0203, "step": 2877 }, { "epoch": 0.59, "learning_rate": 0.0002914057657735424, "loss": 0.0468, "step": 2878 }, { "epoch": 0.59, "learning_rate": 0.00029139929710750935, "loss": 0.0429, "step": 2879 }, { "epoch": 0.59, "learning_rate": 0.00029139282607984116, "loss": 0.0237, "step": 2880 }, { "epoch": 0.59, "learning_rate": 0.00029138635269064587, "loss": 0.0151, "step": 2881 }, { "epoch": 0.59, "learning_rate": 0.00029137987694003163, "loss": 0.0472, "step": 2882 }, { "epoch": 0.59, "learning_rate": 0.00029137339882810654, "loss": 0.0388, "step": 2883 }, { "epoch": 0.59, "learning_rate": 0.0002913669183549788, "loss": 0.0182, "step": 2884 }, { "epoch": 0.59, "learning_rate": 0.0002913604355207567, "loss": 0.0134, "step": 2885 }, { "epoch": 0.59, "learning_rate": 0.00029135395032554856, "loss": 0.007, "step": 2886 }, { "epoch": 0.59, "learning_rate": 0.0002913474627694625, "loss": 0.0274, "step": 2887 }, { "epoch": 0.59, "learning_rate": 0.0002913409728526071, "loss": 0.0238, "step": 2888 }, { "epoch": 0.59, "learning_rate": 0.0002913344805750906, "loss": 0.0194, "step": 2889 }, { "epoch": 0.59, "learning_rate": 0.00029132798593702145, "loss": 0.0155, "step": 2890 }, { "epoch": 0.59, "learning_rate": 0.00029132148893850826, "loss": 0.0394, "step": 2891 }, { "epoch": 0.59, "learning_rate": 0.00029131498957965936, "loss": 0.0208, "step": 2892 }, { "epoch": 0.59, "learning_rate": 0.00029130848786058347, "loss": 0.0248, "step": 2893 }, { "epoch": 0.59, "learning_rate": 0.00029130198378138903, "loss": 0.009, "step": 2894 }, { "epoch": 0.59, "learning_rate": 0.0002912954773421847, "loss": 0.0138, "step": 2895 }, { "epoch": 0.59, "learning_rate": 0.00029128896854307924, "loss": 0.0316, "step": 2896 }, { "epoch": 0.59, "learning_rate": 0.00029128245738418133, "loss": 0.0201, "step": 2897 }, { "epoch": 0.59, "learning_rate": 0.00029127594386559963, "loss": 0.0188, "step": 2898 }, { "epoch": 0.59, "learning_rate": 0.000291269427987443, "loss": 0.0448, "step": 2899 }, { "epoch": 0.59, "learning_rate": 0.0002912629097498203, "loss": 0.0563, "step": 2900 }, { "epoch": 0.59, "learning_rate": 0.0002912563891528403, "loss": 0.0319, "step": 2901 }, { "epoch": 0.59, "learning_rate": 0.000291249866196612, "loss": 0.0149, "step": 2902 }, { "epoch": 0.59, "learning_rate": 0.0002912433408812443, "loss": 0.0439, "step": 2903 }, { "epoch": 0.59, "learning_rate": 0.00029123681320684616, "loss": 0.0026, "step": 2904 }, { "epoch": 0.59, "learning_rate": 0.0002912302831735267, "loss": 0.0309, "step": 2905 }, { "epoch": 0.59, "learning_rate": 0.00029122375078139486, "loss": 0.027, "step": 2906 }, { "epoch": 0.59, "learning_rate": 0.00029121721603055984, "loss": 0.0173, "step": 2907 }, { "epoch": 0.59, "learning_rate": 0.0002912106789211307, "loss": 0.0127, "step": 2908 }, { "epoch": 0.59, "learning_rate": 0.0002912041394532167, "loss": 0.0042, "step": 2909 }, { "epoch": 0.59, "learning_rate": 0.00029119759762692704, "loss": 0.0128, "step": 2910 }, { "epoch": 0.59, "learning_rate": 0.00029119105344237097, "loss": 0.0189, "step": 2911 }, { "epoch": 0.59, "learning_rate": 0.00029118450689965777, "loss": 0.0306, "step": 2912 }, { "epoch": 0.59, "learning_rate": 0.0002911779579988968, "loss": 0.0092, "step": 2913 }, { "epoch": 0.59, "learning_rate": 0.00029117140674019747, "loss": 0.0135, "step": 2914 }, { "epoch": 0.59, "learning_rate": 0.0002911648531236691, "loss": 0.0108, "step": 2915 }, { "epoch": 0.59, "learning_rate": 0.00029115829714942125, "loss": 0.0181, "step": 2916 }, { "epoch": 0.59, "learning_rate": 0.0002911517388175634, "loss": 0.0285, "step": 2917 }, { "epoch": 0.59, "learning_rate": 0.0002911451781282051, "loss": 0.0316, "step": 2918 }, { "epoch": 0.59, "learning_rate": 0.00029113861508145585, "loss": 0.0279, "step": 2919 }, { "epoch": 0.59, "learning_rate": 0.0002911320496774253, "loss": 0.0117, "step": 2920 }, { "epoch": 0.59, "learning_rate": 0.00029112548191622317, "loss": 0.01, "step": 2921 }, { "epoch": 0.59, "learning_rate": 0.000291118911797959, "loss": 0.017, "step": 2922 }, { "epoch": 0.6, "learning_rate": 0.00029111233932274276, "loss": 0.007, "step": 2923 }, { "epoch": 0.6, "learning_rate": 0.00029110576449068397, "loss": 0.0657, "step": 2924 }, { "epoch": 0.6, "learning_rate": 0.0002910991873018926, "loss": 0.0554, "step": 2925 }, { "epoch": 0.6, "learning_rate": 0.00029109260775647846, "loss": 0.0371, "step": 2926 }, { "epoch": 0.6, "learning_rate": 0.00029108602585455143, "loss": 0.0396, "step": 2927 }, { "epoch": 0.6, "learning_rate": 0.0002910794415962214, "loss": 0.0055, "step": 2928 }, { "epoch": 0.6, "learning_rate": 0.0002910728549815985, "loss": 0.0238, "step": 2929 }, { "epoch": 0.6, "learning_rate": 0.00029106626601079253, "loss": 0.0162, "step": 2930 }, { "epoch": 0.6, "learning_rate": 0.0002910596746839137, "loss": 0.0085, "step": 2931 }, { "epoch": 0.6, "learning_rate": 0.000291053081001072, "loss": 0.0094, "step": 2932 }, { "epoch": 0.6, "learning_rate": 0.0002910464849623776, "loss": 0.0296, "step": 2933 }, { "epoch": 0.6, "learning_rate": 0.00029103988656794063, "loss": 0.0431, "step": 2934 }, { "epoch": 0.6, "learning_rate": 0.00029103328581787133, "loss": 0.0188, "step": 2935 }, { "epoch": 0.6, "learning_rate": 0.00029102668271228, "loss": 0.015, "step": 2936 }, { "epoch": 0.6, "learning_rate": 0.0002910200772512768, "loss": 0.0189, "step": 2937 }, { "epoch": 0.6, "learning_rate": 0.00029101346943497214, "loss": 0.0067, "step": 2938 }, { "epoch": 0.6, "learning_rate": 0.00029100685926347636, "loss": 0.005, "step": 2939 }, { "epoch": 0.6, "learning_rate": 0.00029100024673689987, "loss": 0.0291, "step": 2940 }, { "epoch": 0.6, "learning_rate": 0.0002909936318553531, "loss": 0.0186, "step": 2941 }, { "epoch": 0.6, "learning_rate": 0.00029098701461894645, "loss": 0.0077, "step": 2942 }, { "epoch": 0.6, "learning_rate": 0.0002909803950277906, "loss": 0.0325, "step": 2943 }, { "epoch": 0.6, "learning_rate": 0.0002909737730819961, "loss": 0.0479, "step": 2944 }, { "epoch": 0.6, "learning_rate": 0.0002909671487816734, "loss": 0.0362, "step": 2945 }, { "epoch": 0.6, "learning_rate": 0.0002909605221269332, "loss": 0.0425, "step": 2946 }, { "epoch": 0.6, "learning_rate": 0.0002909538931178862, "loss": 0.0163, "step": 2947 }, { "epoch": 0.6, "learning_rate": 0.0002909472617546432, "loss": 0.0154, "step": 2948 }, { "epoch": 0.6, "learning_rate": 0.0002909406280373148, "loss": 0.0151, "step": 2949 }, { "epoch": 0.6, "learning_rate": 0.0002909339919660119, "loss": 0.0571, "step": 2950 }, { "epoch": 0.6, "learning_rate": 0.00029092735354084527, "loss": 0.0428, "step": 2951 }, { "epoch": 0.6, "learning_rate": 0.0002909207127619259, "loss": 0.0141, "step": 2952 }, { "epoch": 0.6, "learning_rate": 0.0002909140696293645, "loss": 0.024, "step": 2953 }, { "epoch": 0.6, "learning_rate": 0.0002909074241432722, "loss": 0.0259, "step": 2954 }, { "epoch": 0.6, "learning_rate": 0.0002909007763037599, "loss": 0.0159, "step": 2955 }, { "epoch": 0.6, "learning_rate": 0.0002908941261109387, "loss": 0.0348, "step": 2956 }, { "epoch": 0.6, "learning_rate": 0.00029088747356491963, "loss": 0.0213, "step": 2957 }, { "epoch": 0.6, "learning_rate": 0.00029088081866581383, "loss": 0.0143, "step": 2958 }, { "epoch": 0.6, "learning_rate": 0.0002908741614137324, "loss": 0.0315, "step": 2959 }, { "epoch": 0.6, "learning_rate": 0.0002908675018087866, "loss": 0.0597, "step": 2960 }, { "epoch": 0.6, "learning_rate": 0.0002908608398510876, "loss": 0.0103, "step": 2961 }, { "epoch": 0.6, "learning_rate": 0.0002908541755407466, "loss": 0.0255, "step": 2962 }, { "epoch": 0.6, "learning_rate": 0.00029084750887787506, "loss": 0.0228, "step": 2963 }, { "epoch": 0.6, "learning_rate": 0.00029084083986258426, "loss": 0.0246, "step": 2964 }, { "epoch": 0.6, "learning_rate": 0.00029083416849498556, "loss": 0.0129, "step": 2965 }, { "epoch": 0.6, "learning_rate": 0.0002908274947751904, "loss": 0.0165, "step": 2966 }, { "epoch": 0.6, "learning_rate": 0.0002908208187033103, "loss": 0.0096, "step": 2967 }, { "epoch": 0.6, "learning_rate": 0.0002908141402794566, "loss": 0.0124, "step": 2968 }, { "epoch": 0.6, "learning_rate": 0.000290807459503741, "loss": 0.0327, "step": 2969 }, { "epoch": 0.6, "learning_rate": 0.00029080077637627503, "loss": 0.0241, "step": 2970 }, { "epoch": 0.6, "learning_rate": 0.00029079409089717036, "loss": 0.0234, "step": 2971 }, { "epoch": 0.61, "learning_rate": 0.00029078740306653857, "loss": 0.015, "step": 2972 }, { "epoch": 0.61, "learning_rate": 0.0002907807128844914, "loss": 0.0166, "step": 2973 }, { "epoch": 0.61, "learning_rate": 0.0002907740203511406, "loss": 0.0084, "step": 2974 }, { "epoch": 0.61, "learning_rate": 0.0002907673254665979, "loss": 0.0213, "step": 2975 }, { "epoch": 0.61, "learning_rate": 0.00029076062823097515, "loss": 0.0575, "step": 2976 }, { "epoch": 0.61, "learning_rate": 0.0002907539286443842, "loss": 0.0092, "step": 2977 }, { "epoch": 0.61, "learning_rate": 0.00029074722670693697, "loss": 0.0483, "step": 2978 }, { "epoch": 0.61, "learning_rate": 0.00029074052241874536, "loss": 0.0283, "step": 2979 }, { "epoch": 0.61, "learning_rate": 0.00029073381577992137, "loss": 0.0211, "step": 2980 }, { "epoch": 0.61, "learning_rate": 0.000290727106790577, "loss": 0.0238, "step": 2981 }, { "epoch": 0.61, "learning_rate": 0.0002907203954508243, "loss": 0.0277, "step": 2982 }, { "epoch": 0.61, "learning_rate": 0.0002907136817607754, "loss": 0.0094, "step": 2983 }, { "epoch": 0.61, "learning_rate": 0.00029070696572054233, "loss": 0.0161, "step": 2984 }, { "epoch": 0.61, "learning_rate": 0.00029070024733023736, "loss": 0.0129, "step": 2985 }, { "epoch": 0.61, "learning_rate": 0.0002906935265899727, "loss": 0.0189, "step": 2986 }, { "epoch": 0.61, "learning_rate": 0.0002906868034998606, "loss": 0.0132, "step": 2987 }, { "epoch": 0.61, "learning_rate": 0.0002906800780600132, "loss": 0.0172, "step": 2988 }, { "epoch": 0.61, "learning_rate": 0.000290673350270543, "loss": 0.0281, "step": 2989 }, { "epoch": 0.61, "learning_rate": 0.00029066662013156234, "loss": 0.0247, "step": 2990 }, { "epoch": 0.61, "learning_rate": 0.00029065988764318353, "loss": 0.009, "step": 2991 }, { "epoch": 0.61, "learning_rate": 0.00029065315280551914, "loss": 0.0121, "step": 2992 }, { "epoch": 0.61, "learning_rate": 0.0002906464156186816, "loss": 0.0118, "step": 2993 }, { "epoch": 0.61, "learning_rate": 0.0002906396760827834, "loss": 0.0375, "step": 2994 }, { "epoch": 0.61, "learning_rate": 0.00029063293419793714, "loss": 0.0147, "step": 2995 }, { "epoch": 0.61, "learning_rate": 0.0002906261899642554, "loss": 0.0331, "step": 2996 }, { "epoch": 0.61, "learning_rate": 0.00029061944338185086, "loss": 0.0143, "step": 2997 }, { "epoch": 0.61, "learning_rate": 0.0002906126944508362, "loss": 0.0071, "step": 2998 }, { "epoch": 0.61, "learning_rate": 0.00029060594317132407, "loss": 0.0135, "step": 2999 }, { "epoch": 0.61, "learning_rate": 0.0002905991895434273, "loss": 0.0219, "step": 3000 }, { "epoch": 0.61, "learning_rate": 0.00029059243356725865, "loss": 0.0141, "step": 3001 }, { "epoch": 0.61, "learning_rate": 0.000290585675242931, "loss": 0.0215, "step": 3002 }, { "epoch": 0.61, "learning_rate": 0.0002905789145705572, "loss": 0.0212, "step": 3003 }, { "epoch": 0.61, "learning_rate": 0.00029057215155025017, "loss": 0.0483, "step": 3004 }, { "epoch": 0.61, "learning_rate": 0.0002905653861821228, "loss": 0.0504, "step": 3005 }, { "epoch": 0.61, "learning_rate": 0.00029055861846628817, "loss": 0.1316, "step": 3006 }, { "epoch": 0.61, "learning_rate": 0.0002905518484028593, "loss": 0.0184, "step": 3007 }, { "epoch": 0.61, "learning_rate": 0.0002905450759919493, "loss": 0.0347, "step": 3008 }, { "epoch": 0.61, "learning_rate": 0.00029053830123367116, "loss": 0.0112, "step": 3009 }, { "epoch": 0.61, "learning_rate": 0.00029053152412813815, "loss": 0.0318, "step": 3010 }, { "epoch": 0.61, "learning_rate": 0.0002905247446754634, "loss": 0.0673, "step": 3011 }, { "epoch": 0.61, "learning_rate": 0.00029051796287576015, "loss": 0.0099, "step": 3012 }, { "epoch": 0.61, "learning_rate": 0.0002905111787291417, "loss": 0.0365, "step": 3013 }, { "epoch": 0.61, "learning_rate": 0.0002905043922357213, "loss": 0.0116, "step": 3014 }, { "epoch": 0.61, "learning_rate": 0.0002904976033956123, "loss": 0.0509, "step": 3015 }, { "epoch": 0.61, "learning_rate": 0.00029049081220892817, "loss": 0.0159, "step": 3016 }, { "epoch": 0.61, "learning_rate": 0.00029048401867578225, "loss": 0.0346, "step": 3017 }, { "epoch": 0.61, "learning_rate": 0.00029047722279628807, "loss": 0.0216, "step": 3018 }, { "epoch": 0.61, "learning_rate": 0.0002904704245705591, "loss": 0.0192, "step": 3019 }, { "epoch": 0.61, "learning_rate": 0.0002904636239987088, "loss": 0.015, "step": 3020 }, { "epoch": 0.62, "learning_rate": 0.0002904568210808509, "loss": 0.0135, "step": 3021 }, { "epoch": 0.62, "learning_rate": 0.00029045001581709897, "loss": 0.0152, "step": 3022 }, { "epoch": 0.62, "learning_rate": 0.0002904432082075666, "loss": 0.0149, "step": 3023 }, { "epoch": 0.62, "learning_rate": 0.00029043639825236764, "loss": 0.0732, "step": 3024 }, { "epoch": 0.62, "learning_rate": 0.00029042958595161566, "loss": 0.0508, "step": 3025 }, { "epoch": 0.62, "learning_rate": 0.00029042277130542456, "loss": 0.007, "step": 3026 }, { "epoch": 0.62, "learning_rate": 0.0002904159543139081, "loss": 0.0442, "step": 3027 }, { "epoch": 0.62, "learning_rate": 0.00029040913497718014, "loss": 0.0252, "step": 3028 }, { "epoch": 0.62, "learning_rate": 0.00029040231329535455, "loss": 0.0413, "step": 3029 }, { "epoch": 0.62, "learning_rate": 0.00029039548926854537, "loss": 0.0268, "step": 3030 }, { "epoch": 0.62, "learning_rate": 0.0002903886628968665, "loss": 0.0255, "step": 3031 }, { "epoch": 0.62, "learning_rate": 0.0002903818341804319, "loss": 0.0329, "step": 3032 }, { "epoch": 0.62, "learning_rate": 0.0002903750031193557, "loss": 0.0059, "step": 3033 }, { "epoch": 0.62, "learning_rate": 0.000290368169713752, "loss": 0.0361, "step": 3034 }, { "epoch": 0.62, "learning_rate": 0.00029036133396373486, "loss": 0.0128, "step": 3035 }, { "epoch": 0.62, "learning_rate": 0.00029035449586941854, "loss": 0.0292, "step": 3036 }, { "epoch": 0.62, "learning_rate": 0.00029034765543091716, "loss": 0.0099, "step": 3037 }, { "epoch": 0.62, "learning_rate": 0.000290340812648345, "loss": 0.0369, "step": 3038 }, { "epoch": 0.62, "learning_rate": 0.0002903339675218164, "loss": 0.0276, "step": 3039 }, { "epoch": 0.62, "learning_rate": 0.0002903271200514456, "loss": 0.0171, "step": 3040 }, { "epoch": 0.62, "learning_rate": 0.00029032027023734704, "loss": 0.017, "step": 3041 }, { "epoch": 0.62, "learning_rate": 0.0002903134180796351, "loss": 0.0058, "step": 3042 }, { "epoch": 0.62, "learning_rate": 0.0002903065635784242, "loss": 0.0349, "step": 3043 }, { "epoch": 0.62, "learning_rate": 0.00029029970673382884, "loss": 0.0074, "step": 3044 }, { "epoch": 0.62, "learning_rate": 0.0002902928475459635, "loss": 0.0143, "step": 3045 }, { "epoch": 0.62, "learning_rate": 0.00029028598601494286, "loss": 0.0402, "step": 3046 }, { "epoch": 0.62, "learning_rate": 0.00029027912214088145, "loss": 0.015, "step": 3047 }, { "epoch": 0.62, "learning_rate": 0.0002902722559238939, "loss": 0.0229, "step": 3048 }, { "epoch": 0.62, "learning_rate": 0.0002902653873640948, "loss": 0.016, "step": 3049 }, { "epoch": 0.62, "learning_rate": 0.00029025851646159907, "loss": 0.0396, "step": 3050 }, { "epoch": 0.62, "learning_rate": 0.0002902516432165213, "loss": 0.0177, "step": 3051 }, { "epoch": 0.62, "learning_rate": 0.00029024476762897633, "loss": 0.0377, "step": 3052 }, { "epoch": 0.62, "learning_rate": 0.00029023788969907905, "loss": 0.0042, "step": 3053 }, { "epoch": 0.62, "learning_rate": 0.00029023100942694426, "loss": 0.0443, "step": 3054 }, { "epoch": 0.62, "learning_rate": 0.000290224126812687, "loss": 0.0166, "step": 3055 }, { "epoch": 0.62, "learning_rate": 0.00029021724185642205, "loss": 0.0256, "step": 3056 }, { "epoch": 0.62, "learning_rate": 0.0002902103545582645, "loss": 0.0253, "step": 3057 }, { "epoch": 0.62, "learning_rate": 0.0002902034649183293, "loss": 0.0131, "step": 3058 }, { "epoch": 0.62, "learning_rate": 0.00029019657293673164, "loss": 0.0416, "step": 3059 }, { "epoch": 0.62, "learning_rate": 0.0002901896786135866, "loss": 0.0162, "step": 3060 }, { "epoch": 0.62, "learning_rate": 0.0002901827819490093, "loss": 0.0115, "step": 3061 }, { "epoch": 0.62, "learning_rate": 0.00029017588294311483, "loss": 0.0715, "step": 3062 }, { "epoch": 0.62, "learning_rate": 0.00029016898159601865, "loss": 0.0698, "step": 3063 }, { "epoch": 0.62, "learning_rate": 0.0002901620779078358, "loss": 0.0402, "step": 3064 }, { "epoch": 0.62, "learning_rate": 0.0002901551718786817, "loss": 0.0321, "step": 3065 }, { "epoch": 0.62, "learning_rate": 0.00029014826350867164, "loss": 0.0178, "step": 3066 }, { "epoch": 0.62, "learning_rate": 0.0002901413527979211, "loss": 0.0297, "step": 3067 }, { "epoch": 0.62, "learning_rate": 0.0002901344397465454, "loss": 0.0267, "step": 3068 }, { "epoch": 0.62, "learning_rate": 0.00029012752435466, "loss": 0.0173, "step": 3069 }, { "epoch": 0.63, "learning_rate": 0.00029012060662238047, "loss": 0.0152, "step": 3070 }, { "epoch": 0.63, "learning_rate": 0.0002901136865498223, "loss": 0.0532, "step": 3071 }, { "epoch": 0.63, "learning_rate": 0.000290106764137101, "loss": 0.0113, "step": 3072 }, { "epoch": 0.63, "learning_rate": 0.00029009983938433243, "loss": 0.0264, "step": 3073 }, { "epoch": 0.63, "learning_rate": 0.000290092912291632, "loss": 0.0678, "step": 3074 }, { "epoch": 0.63, "learning_rate": 0.0002900859828591155, "loss": 0.0223, "step": 3075 }, { "epoch": 0.63, "learning_rate": 0.00029007905108689865, "loss": 0.0273, "step": 3076 }, { "epoch": 0.63, "learning_rate": 0.00029007211697509725, "loss": 0.0485, "step": 3077 }, { "epoch": 0.63, "learning_rate": 0.000290065180523827, "loss": 0.047, "step": 3078 }, { "epoch": 0.63, "learning_rate": 0.0002900582417332039, "loss": 0.0339, "step": 3079 }, { "epoch": 0.63, "learning_rate": 0.0002900513006033438, "loss": 0.0207, "step": 3080 }, { "epoch": 0.63, "learning_rate": 0.00029004435713436265, "loss": 0.0299, "step": 3081 }, { "epoch": 0.63, "learning_rate": 0.0002900374113263763, "loss": 0.0162, "step": 3082 }, { "epoch": 0.63, "learning_rate": 0.000290030463179501, "loss": 0.0287, "step": 3083 }, { "epoch": 0.63, "learning_rate": 0.00029002351269385247, "loss": 0.0451, "step": 3084 }, { "epoch": 0.63, "learning_rate": 0.00029001655986954703, "loss": 0.0629, "step": 3085 }, { "epoch": 0.63, "learning_rate": 0.0002900096047067007, "loss": 0.0286, "step": 3086 }, { "epoch": 0.63, "learning_rate": 0.00029000264720542974, "loss": 0.0537, "step": 3087 }, { "epoch": 0.63, "learning_rate": 0.0002899956873658503, "loss": 0.0044, "step": 3088 }, { "epoch": 0.63, "learning_rate": 0.00028998872518807856, "loss": 0.0574, "step": 3089 }, { "epoch": 0.63, "learning_rate": 0.0002899817606722309, "loss": 0.0082, "step": 3090 }, { "epoch": 0.63, "learning_rate": 0.0002899747938184236, "loss": 0.0194, "step": 3091 }, { "epoch": 0.63, "learning_rate": 0.0002899678246267731, "loss": 0.0197, "step": 3092 }, { "epoch": 0.63, "learning_rate": 0.0002899608530973956, "loss": 0.0095, "step": 3093 }, { "epoch": 0.63, "learning_rate": 0.0002899538792304077, "loss": 0.0134, "step": 3094 }, { "epoch": 0.63, "learning_rate": 0.0002899469030259258, "loss": 0.0114, "step": 3095 }, { "epoch": 0.63, "learning_rate": 0.0002899399244840665, "loss": 0.0372, "step": 3096 }, { "epoch": 0.63, "learning_rate": 0.00028993294360494626, "loss": 0.0084, "step": 3097 }, { "epoch": 0.63, "learning_rate": 0.0002899259603886818, "loss": 0.0954, "step": 3098 }, { "epoch": 0.63, "learning_rate": 0.0002899189748353896, "loss": 0.01, "step": 3099 }, { "epoch": 0.63, "learning_rate": 0.00028991198694518645, "loss": 0.01, "step": 3100 }, { "epoch": 0.63, "learning_rate": 0.00028990499671818895, "loss": 0.0165, "step": 3101 }, { "epoch": 0.63, "learning_rate": 0.000289898004154514, "loss": 0.0311, "step": 3102 }, { "epoch": 0.63, "learning_rate": 0.00028989100925427825, "loss": 0.0078, "step": 3103 }, { "epoch": 0.63, "learning_rate": 0.00028988401201759863, "loss": 0.018, "step": 3104 }, { "epoch": 0.63, "learning_rate": 0.00028987701244459187, "loss": 0.0192, "step": 3105 }, { "epoch": 0.63, "learning_rate": 0.00028987001053537505, "loss": 0.0311, "step": 3106 }, { "epoch": 0.63, "learning_rate": 0.000289863006290065, "loss": 0.011, "step": 3107 }, { "epoch": 0.63, "learning_rate": 0.00028985599970877875, "loss": 0.0264, "step": 3108 }, { "epoch": 0.63, "learning_rate": 0.0002898489907916333, "loss": 0.0184, "step": 3109 }, { "epoch": 0.63, "learning_rate": 0.00028984197953874573, "loss": 0.0113, "step": 3110 }, { "epoch": 0.63, "learning_rate": 0.00028983496595023315, "loss": 0.0244, "step": 3111 }, { "epoch": 0.63, "learning_rate": 0.00028982795002621263, "loss": 0.0568, "step": 3112 }, { "epoch": 0.63, "learning_rate": 0.0002898209317668014, "loss": 0.0224, "step": 3113 }, { "epoch": 0.63, "learning_rate": 0.0002898139111721167, "loss": 0.0727, "step": 3114 }, { "epoch": 0.63, "learning_rate": 0.0002898068882422757, "loss": 0.0464, "step": 3115 }, { "epoch": 0.63, "learning_rate": 0.0002897998629773959, "loss": 0.0111, "step": 3116 }, { "epoch": 0.63, "learning_rate": 0.0002897928353775944, "loss": 0.0196, "step": 3117 }, { "epoch": 0.63, "learning_rate": 0.0002897858054429887, "loss": 0.0126, "step": 3118 }, { "epoch": 0.64, "learning_rate": 0.00028977877317369616, "loss": 0.0146, "step": 3119 }, { "epoch": 0.64, "learning_rate": 0.0002897717385698343, "loss": 0.0364, "step": 3120 }, { "epoch": 0.64, "learning_rate": 0.00028976470163152054, "loss": 0.0364, "step": 3121 }, { "epoch": 0.64, "learning_rate": 0.0002897576623588724, "loss": 0.0241, "step": 3122 }, { "epoch": 0.64, "learning_rate": 0.00028975062075200754, "loss": 0.0342, "step": 3123 }, { "epoch": 0.64, "learning_rate": 0.0002897435768110435, "loss": 0.0253, "step": 3124 }, { "epoch": 0.64, "learning_rate": 0.000289736530536098, "loss": 0.0117, "step": 3125 }, { "epoch": 0.64, "learning_rate": 0.0002897294819272886, "loss": 0.0093, "step": 3126 }, { "epoch": 0.64, "learning_rate": 0.0002897224309847331, "loss": 0.0373, "step": 3127 }, { "epoch": 0.64, "learning_rate": 0.0002897153777085493, "loss": 0.0122, "step": 3128 }, { "epoch": 0.64, "learning_rate": 0.0002897083220988549, "loss": 0.0232, "step": 3129 }, { "epoch": 0.64, "learning_rate": 0.00028970126415576785, "loss": 0.0447, "step": 3130 }, { "epoch": 0.64, "learning_rate": 0.000289694203879406, "loss": 0.0219, "step": 3131 }, { "epoch": 0.64, "learning_rate": 0.0002896871412698872, "loss": 0.0104, "step": 3132 }, { "epoch": 0.64, "learning_rate": 0.00028968007632732944, "loss": 0.0567, "step": 3133 }, { "epoch": 0.64, "learning_rate": 0.0002896730090518508, "loss": 0.0317, "step": 3134 }, { "epoch": 0.64, "learning_rate": 0.00028966593944356925, "loss": 0.0153, "step": 3135 }, { "epoch": 0.64, "learning_rate": 0.00028965886750260283, "loss": 0.0517, "step": 3136 }, { "epoch": 0.64, "learning_rate": 0.00028965179322906976, "loss": 0.034, "step": 3137 }, { "epoch": 0.64, "learning_rate": 0.0002896447166230881, "loss": 0.0411, "step": 3138 }, { "epoch": 0.64, "learning_rate": 0.00028963763768477606, "loss": 0.0072, "step": 3139 }, { "epoch": 0.64, "learning_rate": 0.00028963055641425194, "loss": 0.0287, "step": 3140 }, { "epoch": 0.64, "learning_rate": 0.0002896234728116339, "loss": 0.0126, "step": 3141 }, { "epoch": 0.64, "learning_rate": 0.0002896163868770403, "loss": 0.0057, "step": 3142 }, { "epoch": 0.64, "learning_rate": 0.00028960929861058957, "loss": 0.042, "step": 3143 }, { "epoch": 0.64, "learning_rate": 0.00028960220801239997, "loss": 0.0142, "step": 3144 }, { "epoch": 0.64, "learning_rate": 0.00028959511508258996, "loss": 0.0125, "step": 3145 }, { "epoch": 0.64, "learning_rate": 0.00028958801982127805, "loss": 0.042, "step": 3146 }, { "epoch": 0.64, "learning_rate": 0.0002895809222285827, "loss": 0.034, "step": 3147 }, { "epoch": 0.64, "learning_rate": 0.00028957382230462245, "loss": 0.0203, "step": 3148 }, { "epoch": 0.64, "learning_rate": 0.000289566720049516, "loss": 0.015, "step": 3149 }, { "epoch": 0.64, "learning_rate": 0.00028955961546338175, "loss": 0.0106, "step": 3150 }, { "epoch": 0.64, "learning_rate": 0.00028955250854633855, "loss": 0.0119, "step": 3151 }, { "epoch": 0.64, "learning_rate": 0.00028954539929850506, "loss": 0.0107, "step": 3152 }, { "epoch": 0.64, "learning_rate": 0.00028953828772, "loss": 0.0357, "step": 3153 }, { "epoch": 0.64, "learning_rate": 0.00028953117381094203, "loss": 0.0199, "step": 3154 }, { "epoch": 0.64, "learning_rate": 0.00028952405757145015, "loss": 0.0257, "step": 3155 }, { "epoch": 0.64, "learning_rate": 0.0002895169390016431, "loss": 0.0315, "step": 3156 }, { "epoch": 0.64, "learning_rate": 0.0002895098181016399, "loss": 0.0195, "step": 3157 }, { "epoch": 0.64, "learning_rate": 0.00028950269487155935, "loss": 0.0496, "step": 3158 }, { "epoch": 0.64, "learning_rate": 0.0002894955693115204, "loss": 0.036, "step": 3159 }, { "epoch": 0.64, "learning_rate": 0.0002894884414216422, "loss": 0.0244, "step": 3160 }, { "epoch": 0.64, "learning_rate": 0.0002894813112020437, "loss": 0.0186, "step": 3161 }, { "epoch": 0.64, "learning_rate": 0.000289474178652844, "loss": 0.0096, "step": 3162 }, { "epoch": 0.64, "learning_rate": 0.00028946704377416226, "loss": 0.0199, "step": 3163 }, { "epoch": 0.64, "learning_rate": 0.00028945990656611763, "loss": 0.0544, "step": 3164 }, { "epoch": 0.64, "learning_rate": 0.00028945276702882933, "loss": 0.0235, "step": 3165 }, { "epoch": 0.64, "learning_rate": 0.00028944562516241656, "loss": 0.0126, "step": 3166 }, { "epoch": 0.64, "learning_rate": 0.00028943848096699864, "loss": 0.0433, "step": 3167 }, { "epoch": 0.65, "learning_rate": 0.0002894313344426948, "loss": 0.0126, "step": 3168 }, { "epoch": 0.65, "learning_rate": 0.00028942418558962455, "loss": 0.017, "step": 3169 }, { "epoch": 0.65, "learning_rate": 0.0002894170344079072, "loss": 0.0247, "step": 3170 }, { "epoch": 0.65, "learning_rate": 0.0002894098808976623, "loss": 0.0365, "step": 3171 }, { "epoch": 0.65, "learning_rate": 0.0002894027250590091, "loss": 0.0306, "step": 3172 }, { "epoch": 0.65, "learning_rate": 0.0002893955668920673, "loss": 0.0558, "step": 3173 }, { "epoch": 0.65, "learning_rate": 0.0002893884063969564, "loss": 0.0386, "step": 3174 }, { "epoch": 0.65, "learning_rate": 0.000289381243573796, "loss": 0.0162, "step": 3175 }, { "epoch": 0.65, "learning_rate": 0.0002893740784227058, "loss": 0.015, "step": 3176 }, { "epoch": 0.65, "learning_rate": 0.0002893669109438053, "loss": 0.0206, "step": 3177 }, { "epoch": 0.65, "learning_rate": 0.00028935974113721436, "loss": 0.034, "step": 3178 }, { "epoch": 0.65, "learning_rate": 0.00028935256900305273, "loss": 0.007, "step": 3179 }, { "epoch": 0.65, "learning_rate": 0.0002893453945414401, "loss": 0.0231, "step": 3180 }, { "epoch": 0.65, "learning_rate": 0.0002893382177524963, "loss": 0.0144, "step": 3181 }, { "epoch": 0.65, "learning_rate": 0.0002893310386363413, "loss": 0.0316, "step": 3182 }, { "epoch": 0.65, "learning_rate": 0.00028932385719309496, "loss": 0.0454, "step": 3183 }, { "epoch": 0.65, "learning_rate": 0.00028931667342287716, "loss": 0.0188, "step": 3184 }, { "epoch": 0.65, "learning_rate": 0.000289309487325808, "loss": 0.0036, "step": 3185 }, { "epoch": 0.65, "learning_rate": 0.0002893022989020074, "loss": 0.036, "step": 3186 }, { "epoch": 0.65, "learning_rate": 0.00028929510815159544, "loss": 0.0337, "step": 3187 }, { "epoch": 0.65, "learning_rate": 0.0002892879150746923, "loss": 0.0112, "step": 3188 }, { "epoch": 0.65, "learning_rate": 0.000289280719671418, "loss": 0.0275, "step": 3189 }, { "epoch": 0.65, "learning_rate": 0.0002892735219418928, "loss": 0.029, "step": 3190 }, { "epoch": 0.65, "learning_rate": 0.00028926632188623684, "loss": 0.0075, "step": 3191 }, { "epoch": 0.65, "learning_rate": 0.00028925911950457045, "loss": 0.025, "step": 3192 }, { "epoch": 0.65, "learning_rate": 0.0002892519147970139, "loss": 0.0435, "step": 3193 }, { "epoch": 0.65, "learning_rate": 0.0002892447077636875, "loss": 0.027, "step": 3194 }, { "epoch": 0.65, "learning_rate": 0.0002892374984047116, "loss": 0.0072, "step": 3195 }, { "epoch": 0.65, "learning_rate": 0.00028923028672020673, "loss": 0.034, "step": 3196 }, { "epoch": 0.65, "learning_rate": 0.0002892230727102932, "loss": 0.0175, "step": 3197 }, { "epoch": 0.65, "learning_rate": 0.0002892158563750916, "loss": 0.0152, "step": 3198 }, { "epoch": 0.65, "learning_rate": 0.0002892086377147224, "loss": 0.0144, "step": 3199 }, { "epoch": 0.65, "learning_rate": 0.00028920141672930617, "loss": 0.0476, "step": 3200 }, { "epoch": 0.65, "learning_rate": 0.0002891941934189635, "loss": 0.0161, "step": 3201 }, { "epoch": 0.65, "learning_rate": 0.00028918696778381503, "loss": 0.0315, "step": 3202 }, { "epoch": 0.65, "learning_rate": 0.0002891797398239815, "loss": 0.0385, "step": 3203 }, { "epoch": 0.65, "learning_rate": 0.0002891725095395836, "loss": 0.011, "step": 3204 }, { "epoch": 0.65, "learning_rate": 0.0002891652769307421, "loss": 0.0158, "step": 3205 }, { "epoch": 0.65, "learning_rate": 0.00028915804199757775, "loss": 0.0195, "step": 3206 }, { "epoch": 0.65, "learning_rate": 0.0002891508047402114, "loss": 0.0207, "step": 3207 }, { "epoch": 0.65, "learning_rate": 0.000289143565158764, "loss": 0.0525, "step": 3208 }, { "epoch": 0.65, "learning_rate": 0.0002891363232533564, "loss": 0.0121, "step": 3209 }, { "epoch": 0.65, "learning_rate": 0.00028912907902410947, "loss": 0.0389, "step": 3210 }, { "epoch": 0.65, "learning_rate": 0.0002891218324711444, "loss": 0.0159, "step": 3211 }, { "epoch": 0.65, "learning_rate": 0.00028911458359458204, "loss": 0.0228, "step": 3212 }, { "epoch": 0.65, "learning_rate": 0.0002891073323945436, "loss": 0.0496, "step": 3213 }, { "epoch": 0.65, "learning_rate": 0.0002891000788711501, "loss": 0.0294, "step": 3214 }, { "epoch": 0.65, "learning_rate": 0.00028909282302452274, "loss": 0.0091, "step": 3215 }, { "epoch": 0.65, "learning_rate": 0.00028908556485478265, "loss": 0.0462, "step": 3216 }, { "epoch": 0.66, "learning_rate": 0.00028907830436205115, "loss": 0.0139, "step": 3217 }, { "epoch": 0.66, "learning_rate": 0.00028907104154644934, "loss": 0.0271, "step": 3218 }, { "epoch": 0.66, "learning_rate": 0.00028906377640809867, "loss": 0.0237, "step": 3219 }, { "epoch": 0.66, "learning_rate": 0.0002890565089471204, "loss": 0.0382, "step": 3220 }, { "epoch": 0.66, "learning_rate": 0.000289049239163636, "loss": 0.0225, "step": 3221 }, { "epoch": 0.66, "learning_rate": 0.0002890419670577668, "loss": 0.0255, "step": 3222 }, { "epoch": 0.66, "learning_rate": 0.0002890346926296343, "loss": 0.025, "step": 3223 }, { "epoch": 0.66, "learning_rate": 0.00028902741587935994, "loss": 0.043, "step": 3224 }, { "epoch": 0.66, "learning_rate": 0.0002890201368070653, "loss": 0.0148, "step": 3225 }, { "epoch": 0.66, "learning_rate": 0.00028901285541287205, "loss": 0.0475, "step": 3226 }, { "epoch": 0.66, "learning_rate": 0.0002890055716969016, "loss": 0.0174, "step": 3227 }, { "epoch": 0.66, "learning_rate": 0.0002889982856592758, "loss": 0.0088, "step": 3228 }, { "epoch": 0.66, "learning_rate": 0.0002889909973001162, "loss": 0.0548, "step": 3229 }, { "epoch": 0.66, "learning_rate": 0.0002889837066195446, "loss": 0.0299, "step": 3230 }, { "epoch": 0.66, "learning_rate": 0.0002889764136176827, "loss": 0.0044, "step": 3231 }, { "epoch": 0.66, "learning_rate": 0.0002889691182946525, "loss": 0.0326, "step": 3232 }, { "epoch": 0.66, "learning_rate": 0.00028896182065057556, "loss": 0.0088, "step": 3233 }, { "epoch": 0.66, "learning_rate": 0.00028895452068557393, "loss": 0.0066, "step": 3234 }, { "epoch": 0.66, "learning_rate": 0.0002889472183997696, "loss": 0.0298, "step": 3235 }, { "epoch": 0.66, "learning_rate": 0.0002889399137932843, "loss": 0.0069, "step": 3236 }, { "epoch": 0.66, "learning_rate": 0.00028893260686624025, "loss": 0.0525, "step": 3237 }, { "epoch": 0.66, "learning_rate": 0.0002889252976187594, "loss": 0.0324, "step": 3238 }, { "epoch": 0.66, "learning_rate": 0.00028891798605096383, "loss": 0.0306, "step": 3239 }, { "epoch": 0.66, "learning_rate": 0.0002889106721629757, "loss": 0.0465, "step": 3240 }, { "epoch": 0.66, "learning_rate": 0.00028890335595491715, "loss": 0.0207, "step": 3241 }, { "epoch": 0.66, "learning_rate": 0.0002888960374269103, "loss": 0.009, "step": 3242 }, { "epoch": 0.66, "learning_rate": 0.00028888871657907744, "loss": 0.0399, "step": 3243 }, { "epoch": 0.66, "learning_rate": 0.00028888139341154087, "loss": 0.0386, "step": 3244 }, { "epoch": 0.66, "learning_rate": 0.00028887406792442287, "loss": 0.0082, "step": 3245 }, { "epoch": 0.66, "learning_rate": 0.0002888667401178458, "loss": 0.0191, "step": 3246 }, { "epoch": 0.66, "learning_rate": 0.000288859409991932, "loss": 0.0256, "step": 3247 }, { "epoch": 0.66, "learning_rate": 0.00028885207754680397, "loss": 0.0436, "step": 3248 }, { "epoch": 0.66, "learning_rate": 0.00028884474278258415, "loss": 0.0431, "step": 3249 }, { "epoch": 0.66, "learning_rate": 0.000288837405699395, "loss": 0.0357, "step": 3250 }, { "epoch": 0.66, "learning_rate": 0.00028883006629735916, "loss": 0.0113, "step": 3251 }, { "epoch": 0.66, "learning_rate": 0.0002888227245765991, "loss": 0.0112, "step": 3252 }, { "epoch": 0.66, "learning_rate": 0.0002888153805372375, "loss": 0.0095, "step": 3253 }, { "epoch": 0.66, "learning_rate": 0.00028880803417939704, "loss": 0.0104, "step": 3254 }, { "epoch": 0.66, "learning_rate": 0.0002888006855032004, "loss": 0.0137, "step": 3255 }, { "epoch": 0.66, "learning_rate": 0.00028879333450877026, "loss": 0.0389, "step": 3256 }, { "epoch": 0.66, "learning_rate": 0.0002887859811962294, "loss": 0.0298, "step": 3257 }, { "epoch": 0.66, "learning_rate": 0.0002887786255657008, "loss": 0.0242, "step": 3258 }, { "epoch": 0.66, "learning_rate": 0.0002887712676173071, "loss": 0.0072, "step": 3259 }, { "epoch": 0.66, "learning_rate": 0.00028876390735117134, "loss": 0.0137, "step": 3260 }, { "epoch": 0.66, "learning_rate": 0.0002887565447674164, "loss": 0.0258, "step": 3261 }, { "epoch": 0.66, "learning_rate": 0.0002887491798661652, "loss": 0.0241, "step": 3262 }, { "epoch": 0.66, "learning_rate": 0.00028874181264754075, "loss": 0.0165, "step": 3263 }, { "epoch": 0.66, "learning_rate": 0.0002887344431116662, "loss": 0.0435, "step": 3264 }, { "epoch": 0.66, "learning_rate": 0.00028872707125866457, "loss": 0.0186, "step": 3265 }, { "epoch": 0.67, "learning_rate": 0.00028871969708865893, "loss": 0.0461, "step": 3266 }, { "epoch": 0.67, "learning_rate": 0.0002887123206017725, "loss": 0.0331, "step": 3267 }, { "epoch": 0.67, "learning_rate": 0.0002887049417981285, "loss": 0.0171, "step": 3268 }, { "epoch": 0.67, "learning_rate": 0.0002886975606778502, "loss": 0.019, "step": 3269 }, { "epoch": 0.67, "learning_rate": 0.0002886901772410608, "loss": 0.0225, "step": 3270 }, { "epoch": 0.67, "learning_rate": 0.0002886827914878836, "loss": 0.0143, "step": 3271 }, { "epoch": 0.67, "learning_rate": 0.00028867540341844205, "loss": 0.0211, "step": 3272 }, { "epoch": 0.67, "learning_rate": 0.00028866801303285947, "loss": 0.0299, "step": 3273 }, { "epoch": 0.67, "learning_rate": 0.00028866062033125933, "loss": 0.0116, "step": 3274 }, { "epoch": 0.67, "learning_rate": 0.00028865322531376503, "loss": 0.0243, "step": 3275 }, { "epoch": 0.67, "learning_rate": 0.0002886458279805002, "loss": 0.0292, "step": 3276 }, { "epoch": 0.67, "learning_rate": 0.0002886384283315883, "loss": 0.037, "step": 3277 }, { "epoch": 0.67, "learning_rate": 0.000288631026367153, "loss": 0.0231, "step": 3278 }, { "epoch": 0.67, "learning_rate": 0.00028862362208731786, "loss": 0.0157, "step": 3279 }, { "epoch": 0.67, "learning_rate": 0.0002886162154922065, "loss": 0.0099, "step": 3280 }, { "epoch": 0.67, "learning_rate": 0.00028860880658194277, "loss": 0.0284, "step": 3281 }, { "epoch": 0.67, "learning_rate": 0.00028860139535665023, "loss": 0.027, "step": 3282 }, { "epoch": 0.67, "learning_rate": 0.00028859398181645287, "loss": 0.0381, "step": 3283 }, { "epoch": 0.67, "learning_rate": 0.0002885865659614743, "loss": 0.0151, "step": 3284 }, { "epoch": 0.67, "learning_rate": 0.0002885791477918385, "loss": 0.0661, "step": 3285 }, { "epoch": 0.67, "learning_rate": 0.0002885717273076694, "loss": 0.0441, "step": 3286 }, { "epoch": 0.67, "learning_rate": 0.00028856430450909085, "loss": 0.0101, "step": 3287 }, { "epoch": 0.67, "learning_rate": 0.0002885568793962268, "loss": 0.0172, "step": 3288 }, { "epoch": 0.67, "learning_rate": 0.0002885494519692014, "loss": 0.0318, "step": 3289 }, { "epoch": 0.67, "learning_rate": 0.00028854202222813863, "loss": 0.018, "step": 3290 }, { "epoch": 0.67, "learning_rate": 0.0002885345901731625, "loss": 0.0338, "step": 3291 }, { "epoch": 0.67, "learning_rate": 0.0002885271558043973, "loss": 0.0721, "step": 3292 }, { "epoch": 0.67, "learning_rate": 0.000288519719121967, "loss": 0.0119, "step": 3293 }, { "epoch": 0.67, "learning_rate": 0.000288512280125996, "loss": 0.045, "step": 3294 }, { "epoch": 0.67, "learning_rate": 0.00028850483881660843, "loss": 0.0184, "step": 3295 }, { "epoch": 0.67, "learning_rate": 0.0002884973951939286, "loss": 0.0192, "step": 3296 }, { "epoch": 0.67, "learning_rate": 0.0002884899492580809, "loss": 0.0291, "step": 3297 }, { "epoch": 0.67, "learning_rate": 0.00028848250100918955, "loss": 0.0417, "step": 3298 }, { "epoch": 0.67, "learning_rate": 0.000288475050447379, "loss": 0.0296, "step": 3299 }, { "epoch": 0.67, "learning_rate": 0.0002884675975727738, "loss": 0.0263, "step": 3300 }, { "epoch": 0.67, "learning_rate": 0.00028846014238549834, "loss": 0.0124, "step": 3301 }, { "epoch": 0.67, "learning_rate": 0.0002884526848856771, "loss": 0.0101, "step": 3302 }, { "epoch": 0.67, "learning_rate": 0.0002884452250734347, "loss": 0.045, "step": 3303 }, { "epoch": 0.67, "learning_rate": 0.0002884377629488957, "loss": 0.0144, "step": 3304 }, { "epoch": 0.67, "learning_rate": 0.00028843029851218475, "loss": 0.0238, "step": 3305 }, { "epoch": 0.67, "learning_rate": 0.0002884228317634265, "loss": 0.048, "step": 3306 }, { "epoch": 0.67, "learning_rate": 0.00028841536270274564, "loss": 0.037, "step": 3307 }, { "epoch": 0.67, "learning_rate": 0.000288407891330267, "loss": 0.0333, "step": 3308 }, { "epoch": 0.67, "learning_rate": 0.0002884004176461153, "loss": 0.008, "step": 3309 }, { "epoch": 0.67, "learning_rate": 0.00028839294165041536, "loss": 0.0157, "step": 3310 }, { "epoch": 0.67, "learning_rate": 0.000288385463343292, "loss": 0.0455, "step": 3311 }, { "epoch": 0.67, "learning_rate": 0.00028837798272487026, "loss": 0.0224, "step": 3312 }, { "epoch": 0.67, "learning_rate": 0.000288370499795275, "loss": 0.0386, "step": 3313 }, { "epoch": 0.67, "learning_rate": 0.0002883630145546312, "loss": 0.0497, "step": 3314 }, { "epoch": 0.67, "learning_rate": 0.00028835552700306387, "loss": 0.0189, "step": 3315 }, { "epoch": 0.68, "learning_rate": 0.000288348037140698, "loss": 0.0287, "step": 3316 }, { "epoch": 0.68, "learning_rate": 0.0002883405449676589, "loss": 0.0126, "step": 3317 }, { "epoch": 0.68, "learning_rate": 0.00028833305048407145, "loss": 0.0318, "step": 3318 }, { "epoch": 0.68, "learning_rate": 0.00028832555369006095, "loss": 0.0134, "step": 3319 }, { "epoch": 0.68, "learning_rate": 0.0002883180545857526, "loss": 0.0528, "step": 3320 }, { "epoch": 0.68, "learning_rate": 0.0002883105531712717, "loss": 0.0276, "step": 3321 }, { "epoch": 0.68, "learning_rate": 0.0002883030494467435, "loss": 0.0226, "step": 3322 }, { "epoch": 0.68, "learning_rate": 0.0002882955434122932, "loss": 0.0125, "step": 3323 }, { "epoch": 0.68, "learning_rate": 0.00028828803506804633, "loss": 0.0212, "step": 3324 }, { "epoch": 0.68, "learning_rate": 0.0002882805244141282, "loss": 0.0126, "step": 3325 }, { "epoch": 0.68, "learning_rate": 0.00028827301145066433, "loss": 0.0256, "step": 3326 }, { "epoch": 0.68, "learning_rate": 0.0002882654961777802, "loss": 0.0282, "step": 3327 }, { "epoch": 0.68, "learning_rate": 0.0002882579785956012, "loss": 0.0063, "step": 3328 }, { "epoch": 0.68, "learning_rate": 0.000288250458704253, "loss": 0.0377, "step": 3329 }, { "epoch": 0.68, "learning_rate": 0.0002882429365038612, "loss": 0.0112, "step": 3330 }, { "epoch": 0.68, "learning_rate": 0.0002882354119945514, "loss": 0.0236, "step": 3331 }, { "epoch": 0.68, "learning_rate": 0.0002882278851764493, "loss": 0.0298, "step": 3332 }, { "epoch": 0.68, "learning_rate": 0.00028822035604968057, "loss": 0.0493, "step": 3333 }, { "epoch": 0.68, "learning_rate": 0.000288212824614371, "loss": 0.029, "step": 3334 }, { "epoch": 0.68, "learning_rate": 0.00028820529087064634, "loss": 0.0333, "step": 3335 }, { "epoch": 0.68, "learning_rate": 0.0002881977548186325, "loss": 0.0217, "step": 3336 }, { "epoch": 0.68, "learning_rate": 0.0002881902164584552, "loss": 0.0378, "step": 3337 }, { "epoch": 0.68, "learning_rate": 0.00028818267579024044, "loss": 0.0131, "step": 3338 }, { "epoch": 0.68, "learning_rate": 0.0002881751328141142, "loss": 0.0064, "step": 3339 }, { "epoch": 0.68, "learning_rate": 0.0002881675875302024, "loss": 0.0075, "step": 3340 }, { "epoch": 0.68, "learning_rate": 0.00028816003993863116, "loss": 0.0314, "step": 3341 }, { "epoch": 0.68, "learning_rate": 0.00028815249003952633, "loss": 0.0084, "step": 3342 }, { "epoch": 0.68, "learning_rate": 0.0002881449378330142, "loss": 0.016, "step": 3343 }, { "epoch": 0.68, "learning_rate": 0.0002881373833192208, "loss": 0.0385, "step": 3344 }, { "epoch": 0.68, "learning_rate": 0.0002881298264982724, "loss": 0.0116, "step": 3345 }, { "epoch": 0.68, "learning_rate": 0.00028812226737029515, "loss": 0.0148, "step": 3346 }, { "epoch": 0.68, "learning_rate": 0.0002881147059354153, "loss": 0.0259, "step": 3347 }, { "epoch": 0.68, "learning_rate": 0.00028810714219375917, "loss": 0.0233, "step": 3348 }, { "epoch": 0.68, "learning_rate": 0.000288099576145453, "loss": 0.0068, "step": 3349 }, { "epoch": 0.68, "learning_rate": 0.00028809200779062334, "loss": 0.0226, "step": 3350 }, { "epoch": 0.68, "learning_rate": 0.0002880844371293964, "loss": 0.0444, "step": 3351 }, { "epoch": 0.68, "learning_rate": 0.0002880768641618987, "loss": 0.0265, "step": 3352 }, { "epoch": 0.68, "learning_rate": 0.00028806928888825675, "loss": 0.0436, "step": 3353 }, { "epoch": 0.68, "learning_rate": 0.00028806171130859703, "loss": 0.0088, "step": 3354 }, { "epoch": 0.68, "learning_rate": 0.0002880541314230462, "loss": 0.0166, "step": 3355 }, { "epoch": 0.68, "learning_rate": 0.0002880465492317307, "loss": 0.0151, "step": 3356 }, { "epoch": 0.68, "learning_rate": 0.00028803896473477726, "loss": 0.0188, "step": 3357 }, { "epoch": 0.68, "learning_rate": 0.00028803137793231257, "loss": 0.0121, "step": 3358 }, { "epoch": 0.68, "learning_rate": 0.0002880237888244633, "loss": 0.0367, "step": 3359 }, { "epoch": 0.68, "learning_rate": 0.00028801619741135624, "loss": 0.0167, "step": 3360 }, { "epoch": 0.68, "learning_rate": 0.0002880086036931181, "loss": 0.0192, "step": 3361 }, { "epoch": 0.68, "learning_rate": 0.0002880010076698758, "loss": 0.0136, "step": 3362 }, { "epoch": 0.68, "learning_rate": 0.0002879934093417562, "loss": 0.0205, "step": 3363 }, { "epoch": 0.68, "learning_rate": 0.0002879858087088862, "loss": 0.0184, "step": 3364 }, { "epoch": 0.69, "learning_rate": 0.0002879782057713927, "loss": 0.0027, "step": 3365 }, { "epoch": 0.69, "learning_rate": 0.0002879706005294027, "loss": 0.0185, "step": 3366 }, { "epoch": 0.69, "learning_rate": 0.00028796299298304324, "loss": 0.0763, "step": 3367 }, { "epoch": 0.69, "learning_rate": 0.00028795538313244136, "loss": 0.0107, "step": 3368 }, { "epoch": 0.69, "learning_rate": 0.0002879477709777242, "loss": 0.0089, "step": 3369 }, { "epoch": 0.69, "learning_rate": 0.00028794015651901887, "loss": 0.0438, "step": 3370 }, { "epoch": 0.69, "learning_rate": 0.0002879325397564525, "loss": 0.0259, "step": 3371 }, { "epoch": 0.69, "learning_rate": 0.0002879249206901524, "loss": 0.0086, "step": 3372 }, { "epoch": 0.69, "learning_rate": 0.00028791729932024573, "loss": 0.0162, "step": 3373 }, { "epoch": 0.69, "learning_rate": 0.00028790967564685984, "loss": 0.0309, "step": 3374 }, { "epoch": 0.69, "learning_rate": 0.00028790204967012206, "loss": 0.0196, "step": 3375 }, { "epoch": 0.69, "learning_rate": 0.0002878944213901597, "loss": 0.0658, "step": 3376 }, { "epoch": 0.69, "learning_rate": 0.0002878867908071003, "loss": 0.0288, "step": 3377 }, { "epoch": 0.69, "learning_rate": 0.00028787915792107113, "loss": 0.0155, "step": 3378 }, { "epoch": 0.69, "learning_rate": 0.0002878715227321998, "loss": 0.0074, "step": 3379 }, { "epoch": 0.69, "learning_rate": 0.00028786388524061374, "loss": 0.0048, "step": 3380 }, { "epoch": 0.69, "learning_rate": 0.0002878562454464406, "loss": 0.0148, "step": 3381 }, { "epoch": 0.69, "learning_rate": 0.00028784860334980794, "loss": 0.047, "step": 3382 }, { "epoch": 0.69, "learning_rate": 0.00028784095895084336, "loss": 0.0145, "step": 3383 }, { "epoch": 0.69, "learning_rate": 0.00028783331224967466, "loss": 0.0322, "step": 3384 }, { "epoch": 0.69, "learning_rate": 0.0002878256632464294, "loss": 0.0238, "step": 3385 }, { "epoch": 0.69, "learning_rate": 0.0002878180119412354, "loss": 0.0366, "step": 3386 }, { "epoch": 0.69, "learning_rate": 0.0002878103583342205, "loss": 0.0726, "step": 3387 }, { "epoch": 0.69, "learning_rate": 0.0002878027024255124, "loss": 0.0489, "step": 3388 }, { "epoch": 0.69, "learning_rate": 0.0002877950442152391, "loss": 0.0065, "step": 3389 }, { "epoch": 0.69, "learning_rate": 0.0002877873837035284, "loss": 0.0244, "step": 3390 }, { "epoch": 0.69, "learning_rate": 0.0002877797208905083, "loss": 0.0332, "step": 3391 }, { "epoch": 0.69, "learning_rate": 0.00028777205577630685, "loss": 0.048, "step": 3392 }, { "epoch": 0.69, "learning_rate": 0.000287764388361052, "loss": 0.0485, "step": 3393 }, { "epoch": 0.69, "learning_rate": 0.00028775671864487176, "loss": 0.027, "step": 3394 }, { "epoch": 0.69, "learning_rate": 0.0002877490466278943, "loss": 0.0067, "step": 3395 }, { "epoch": 0.69, "learning_rate": 0.00028774137231024784, "loss": 0.0304, "step": 3396 }, { "epoch": 0.69, "learning_rate": 0.00028773369569206036, "loss": 0.0167, "step": 3397 }, { "epoch": 0.69, "learning_rate": 0.0002877260167734602, "loss": 0.0322, "step": 3398 }, { "epoch": 0.69, "learning_rate": 0.00028771833555457557, "loss": 0.0365, "step": 3399 }, { "epoch": 0.69, "learning_rate": 0.00028771065203553477, "loss": 0.0105, "step": 3400 }, { "epoch": 0.69, "learning_rate": 0.00028770296621646613, "loss": 0.0451, "step": 3401 }, { "epoch": 0.69, "learning_rate": 0.000287695278097498, "loss": 0.0106, "step": 3402 }, { "epoch": 0.69, "learning_rate": 0.00028768758767875886, "loss": 0.0618, "step": 3403 }, { "epoch": 0.69, "learning_rate": 0.0002876798949603771, "loss": 0.0254, "step": 3404 }, { "epoch": 0.69, "learning_rate": 0.0002876721999424812, "loss": 0.0127, "step": 3405 }, { "epoch": 0.69, "learning_rate": 0.00028766450262519963, "loss": 0.0307, "step": 3406 }, { "epoch": 0.69, "learning_rate": 0.0002876568030086611, "loss": 0.0225, "step": 3407 }, { "epoch": 0.69, "learning_rate": 0.000287649101092994, "loss": 0.0117, "step": 3408 }, { "epoch": 0.69, "learning_rate": 0.0002876413968783272, "loss": 0.0411, "step": 3409 }, { "epoch": 0.69, "learning_rate": 0.0002876336903647892, "loss": 0.0187, "step": 3410 }, { "epoch": 0.69, "learning_rate": 0.0002876259815525087, "loss": 0.0092, "step": 3411 }, { "epoch": 0.69, "learning_rate": 0.00028761827044161464, "loss": 0.0094, "step": 3412 }, { "epoch": 0.69, "learning_rate": 0.00028761055703223565, "loss": 0.0563, "step": 3413 }, { "epoch": 0.7, "learning_rate": 0.0002876028413245006, "loss": 0.0251, "step": 3414 }, { "epoch": 0.7, "learning_rate": 0.0002875951233185383, "loss": 0.0101, "step": 3415 }, { "epoch": 0.7, "learning_rate": 0.00028758740301447776, "loss": 0.0242, "step": 3416 }, { "epoch": 0.7, "learning_rate": 0.0002875796804124479, "loss": 0.0246, "step": 3417 }, { "epoch": 0.7, "learning_rate": 0.00028757195551257767, "loss": 0.0108, "step": 3418 }, { "epoch": 0.7, "learning_rate": 0.00028756422831499606, "loss": 0.0235, "step": 3419 }, { "epoch": 0.7, "learning_rate": 0.0002875564988198322, "loss": 0.0184, "step": 3420 }, { "epoch": 0.7, "learning_rate": 0.0002875487670272151, "loss": 0.0374, "step": 3421 }, { "epoch": 0.7, "learning_rate": 0.000287541032937274, "loss": 0.0298, "step": 3422 }, { "epoch": 0.7, "learning_rate": 0.000287533296550138, "loss": 0.0242, "step": 3423 }, { "epoch": 0.7, "learning_rate": 0.00028752555786593634, "loss": 0.0341, "step": 3424 }, { "epoch": 0.7, "learning_rate": 0.0002875178168847983, "loss": 0.0117, "step": 3425 }, { "epoch": 0.7, "learning_rate": 0.0002875100736068531, "loss": 0.0525, "step": 3426 }, { "epoch": 0.7, "learning_rate": 0.0002875023280322301, "loss": 0.0484, "step": 3427 }, { "epoch": 0.7, "learning_rate": 0.00028749458016105863, "loss": 0.0184, "step": 3428 }, { "epoch": 0.7, "learning_rate": 0.0002874868299934682, "loss": 0.0402, "step": 3429 }, { "epoch": 0.7, "learning_rate": 0.00028747907752958815, "loss": 0.0243, "step": 3430 }, { "epoch": 0.7, "learning_rate": 0.00028747132276954804, "loss": 0.0127, "step": 3431 }, { "epoch": 0.7, "learning_rate": 0.00028746356571347727, "loss": 0.0194, "step": 3432 }, { "epoch": 0.7, "learning_rate": 0.0002874558063615055, "loss": 0.0284, "step": 3433 }, { "epoch": 0.7, "learning_rate": 0.0002874480447137623, "loss": 0.0192, "step": 3434 }, { "epoch": 0.7, "learning_rate": 0.00028744028077037735, "loss": 0.0166, "step": 3435 }, { "epoch": 0.7, "learning_rate": 0.0002874325145314802, "loss": 0.0541, "step": 3436 }, { "epoch": 0.7, "learning_rate": 0.0002874247459972007, "loss": 0.0302, "step": 3437 }, { "epoch": 0.7, "learning_rate": 0.0002874169751676685, "loss": 0.0371, "step": 3438 }, { "epoch": 0.7, "learning_rate": 0.0002874092020430134, "loss": 0.0184, "step": 3439 }, { "epoch": 0.7, "learning_rate": 0.0002874014266233653, "loss": 0.0311, "step": 3440 }, { "epoch": 0.7, "learning_rate": 0.00028739364890885394, "loss": 0.0384, "step": 3441 }, { "epoch": 0.7, "learning_rate": 0.0002873858688996094, "loss": 0.0712, "step": 3442 }, { "epoch": 0.7, "learning_rate": 0.00028737808659576146, "loss": 0.0169, "step": 3443 }, { "epoch": 0.7, "learning_rate": 0.00028737030199744014, "loss": 0.0264, "step": 3444 }, { "epoch": 0.7, "learning_rate": 0.0002873625151047755, "loss": 0.0497, "step": 3445 }, { "epoch": 0.7, "learning_rate": 0.00028735472591789754, "loss": 0.0118, "step": 3446 }, { "epoch": 0.7, "learning_rate": 0.00028734693443693637, "loss": 0.0455, "step": 3447 }, { "epoch": 0.7, "learning_rate": 0.00028733914066202213, "loss": 0.0213, "step": 3448 }, { "epoch": 0.7, "learning_rate": 0.000287331344593285, "loss": 0.0189, "step": 3449 }, { "epoch": 0.7, "learning_rate": 0.0002873235462308552, "loss": 0.0122, "step": 3450 }, { "epoch": 0.7, "learning_rate": 0.000287315745574863, "loss": 0.0064, "step": 3451 }, { "epoch": 0.7, "learning_rate": 0.0002873079426254386, "loss": 0.023, "step": 3452 }, { "epoch": 0.7, "learning_rate": 0.0002873001373827124, "loss": 0.0232, "step": 3453 }, { "epoch": 0.7, "learning_rate": 0.0002872923298468147, "loss": 0.0334, "step": 3454 }, { "epoch": 0.7, "learning_rate": 0.00028728452001787594, "loss": 0.0318, "step": 3455 }, { "epoch": 0.7, "learning_rate": 0.00028727670789602657, "loss": 0.0321, "step": 3456 }, { "epoch": 0.7, "learning_rate": 0.000287268893481397, "loss": 0.0495, "step": 3457 }, { "epoch": 0.7, "learning_rate": 0.0002872610767741179, "loss": 0.0131, "step": 3458 }, { "epoch": 0.7, "learning_rate": 0.00028725325777431964, "loss": 0.0117, "step": 3459 }, { "epoch": 0.7, "learning_rate": 0.0002872454364821329, "loss": 0.0504, "step": 3460 }, { "epoch": 0.7, "learning_rate": 0.0002872376128976883, "loss": 0.0153, "step": 3461 }, { "epoch": 0.7, "learning_rate": 0.00028722978702111653, "loss": 0.0157, "step": 3462 }, { "epoch": 0.71, "learning_rate": 0.0002872219588525483, "loss": 0.0387, "step": 3463 }, { "epoch": 0.71, "learning_rate": 0.00028721412839211426, "loss": 0.024, "step": 3464 }, { "epoch": 0.71, "learning_rate": 0.00028720629563994533, "loss": 0.0519, "step": 3465 }, { "epoch": 0.71, "learning_rate": 0.0002871984605961722, "loss": 0.0148, "step": 3466 }, { "epoch": 0.71, "learning_rate": 0.0002871906232609259, "loss": 0.0201, "step": 3467 }, { "epoch": 0.71, "learning_rate": 0.00028718278363433714, "loss": 0.0035, "step": 3468 }, { "epoch": 0.71, "learning_rate": 0.00028717494171653696, "loss": 0.0122, "step": 3469 }, { "epoch": 0.71, "learning_rate": 0.0002871670975076563, "loss": 0.0394, "step": 3470 }, { "epoch": 0.71, "learning_rate": 0.0002871592510078262, "loss": 0.0121, "step": 3471 }, { "epoch": 0.71, "learning_rate": 0.0002871514022171778, "loss": 0.0073, "step": 3472 }, { "epoch": 0.71, "learning_rate": 0.000287143551135842, "loss": 0.0368, "step": 3473 }, { "epoch": 0.71, "learning_rate": 0.00028713569776395, "loss": 0.0228, "step": 3474 }, { "epoch": 0.71, "learning_rate": 0.00028712784210163303, "loss": 0.0268, "step": 3475 }, { "epoch": 0.71, "learning_rate": 0.0002871199841490222, "loss": 0.06, "step": 3476 }, { "epoch": 0.71, "learning_rate": 0.0002871121239062489, "loss": 0.0228, "step": 3477 }, { "epoch": 0.71, "learning_rate": 0.0002871042613734442, "loss": 0.016, "step": 3478 }, { "epoch": 0.71, "learning_rate": 0.0002870963965507396, "loss": 0.0589, "step": 3479 }, { "epoch": 0.71, "learning_rate": 0.00028708852943826635, "loss": 0.0064, "step": 3480 }, { "epoch": 0.71, "learning_rate": 0.00028708066003615593, "loss": 0.0474, "step": 3481 }, { "epoch": 0.71, "learning_rate": 0.00028707278834453975, "loss": 0.0071, "step": 3482 }, { "epoch": 0.71, "learning_rate": 0.0002870649143635492, "loss": 0.024, "step": 3483 }, { "epoch": 0.71, "learning_rate": 0.00028705703809331584, "loss": 0.025, "step": 3484 }, { "epoch": 0.71, "learning_rate": 0.00028704915953397126, "loss": 0.0223, "step": 3485 }, { "epoch": 0.71, "learning_rate": 0.000287041278685647, "loss": 0.0076, "step": 3486 }, { "epoch": 0.71, "learning_rate": 0.00028703339554847474, "loss": 0.0261, "step": 3487 }, { "epoch": 0.71, "learning_rate": 0.0002870255101225861, "loss": 0.0181, "step": 3488 }, { "epoch": 0.71, "learning_rate": 0.00028701762240811277, "loss": 0.0997, "step": 3489 }, { "epoch": 0.71, "learning_rate": 0.0002870097324051865, "loss": 0.0172, "step": 3490 }, { "epoch": 0.71, "learning_rate": 0.0002870018401139391, "loss": 0.0437, "step": 3491 }, { "epoch": 0.71, "learning_rate": 0.00028699394553450235, "loss": 0.0112, "step": 3492 }, { "epoch": 0.71, "learning_rate": 0.00028698604866700807, "loss": 0.0527, "step": 3493 }, { "epoch": 0.71, "learning_rate": 0.00028697814951158824, "loss": 0.0286, "step": 3494 }, { "epoch": 0.71, "learning_rate": 0.00028697024806837476, "loss": 0.011, "step": 3495 }, { "epoch": 0.71, "learning_rate": 0.0002869623443374996, "loss": 0.0113, "step": 3496 }, { "epoch": 0.71, "learning_rate": 0.00028695443831909474, "loss": 0.0125, "step": 3497 }, { "epoch": 0.71, "learning_rate": 0.00028694653001329215, "loss": 0.0268, "step": 3498 }, { "epoch": 0.71, "learning_rate": 0.00028693861942022413, "loss": 0.0227, "step": 3499 }, { "epoch": 0.71, "learning_rate": 0.00028693070654002263, "loss": 0.0228, "step": 3500 }, { "epoch": 0.71, "learning_rate": 0.0002869227913728198, "loss": 0.0535, "step": 3501 }, { "epoch": 0.71, "learning_rate": 0.000286914873918748, "loss": 0.0084, "step": 3502 }, { "epoch": 0.71, "learning_rate": 0.0002869069541779393, "loss": 0.0097, "step": 3503 }, { "epoch": 0.71, "learning_rate": 0.0002868990321505261, "loss": 0.0087, "step": 3504 }, { "epoch": 0.71, "learning_rate": 0.00028689110783664055, "loss": 0.0126, "step": 3505 }, { "epoch": 0.71, "learning_rate": 0.00028688318123641513, "loss": 0.0426, "step": 3506 }, { "epoch": 0.71, "learning_rate": 0.00028687525234998224, "loss": 0.0291, "step": 3507 }, { "epoch": 0.71, "learning_rate": 0.0002868673211774742, "loss": 0.0082, "step": 3508 }, { "epoch": 0.71, "learning_rate": 0.0002868593877190236, "loss": 0.0155, "step": 3509 }, { "epoch": 0.71, "learning_rate": 0.00028685145197476287, "loss": 0.0198, "step": 3510 }, { "epoch": 0.71, "learning_rate": 0.00028684351394482453, "loss": 0.0131, "step": 3511 }, { "epoch": 0.72, "learning_rate": 0.0002868355736293412, "loss": 0.017, "step": 3512 }, { "epoch": 0.72, "learning_rate": 0.00028682763102844556, "loss": 0.0284, "step": 3513 }, { "epoch": 0.72, "learning_rate": 0.0002868196861422701, "loss": 0.0348, "step": 3514 }, { "epoch": 0.72, "learning_rate": 0.0002868117389709477, "loss": 0.0199, "step": 3515 }, { "epoch": 0.72, "learning_rate": 0.000286803789514611, "loss": 0.0174, "step": 3516 }, { "epoch": 0.72, "learning_rate": 0.00028679583777339277, "loss": 0.0401, "step": 3517 }, { "epoch": 0.72, "learning_rate": 0.00028678788374742576, "loss": 0.0112, "step": 3518 }, { "epoch": 0.72, "learning_rate": 0.000286779927436843, "loss": 0.0136, "step": 3519 }, { "epoch": 0.72, "learning_rate": 0.0002867719688417772, "loss": 0.014, "step": 3520 }, { "epoch": 0.72, "learning_rate": 0.00028676400796236136, "loss": 0.0337, "step": 3521 }, { "epoch": 0.72, "learning_rate": 0.0002867560447987284, "loss": 0.0189, "step": 3522 }, { "epoch": 0.72, "learning_rate": 0.00028674807935101136, "loss": 0.0047, "step": 3523 }, { "epoch": 0.72, "learning_rate": 0.0002867401116193433, "loss": 0.0152, "step": 3524 }, { "epoch": 0.72, "learning_rate": 0.0002867321416038572, "loss": 0.0314, "step": 3525 }, { "epoch": 0.72, "learning_rate": 0.0002867241693046863, "loss": 0.0139, "step": 3526 }, { "epoch": 0.72, "learning_rate": 0.0002867161947219636, "loss": 0.0215, "step": 3527 }, { "epoch": 0.72, "learning_rate": 0.00028670821785582246, "loss": 0.0325, "step": 3528 }, { "epoch": 0.72, "learning_rate": 0.00028670023870639604, "loss": 0.0211, "step": 3529 }, { "epoch": 0.72, "learning_rate": 0.00028669225727381755, "loss": 0.0253, "step": 3530 }, { "epoch": 0.72, "learning_rate": 0.00028668427355822034, "loss": 0.0134, "step": 3531 }, { "epoch": 0.72, "learning_rate": 0.0002866762875597377, "loss": 0.0178, "step": 3532 }, { "epoch": 0.72, "learning_rate": 0.00028666829927850314, "loss": 0.014, "step": 3533 }, { "epoch": 0.72, "learning_rate": 0.00028666030871465003, "loss": 0.0152, "step": 3534 }, { "epoch": 0.72, "learning_rate": 0.0002866523158683117, "loss": 0.0209, "step": 3535 }, { "epoch": 0.72, "learning_rate": 0.0002866443207396218, "loss": 0.0497, "step": 3536 }, { "epoch": 0.72, "learning_rate": 0.00028663632332871384, "loss": 0.0384, "step": 3537 }, { "epoch": 0.72, "learning_rate": 0.00028662832363572134, "loss": 0.0285, "step": 3538 }, { "epoch": 0.72, "learning_rate": 0.00028662032166077784, "loss": 0.0169, "step": 3539 }, { "epoch": 0.72, "learning_rate": 0.0002866123174040172, "loss": 0.0034, "step": 3540 }, { "epoch": 0.72, "learning_rate": 0.00028660431086557296, "loss": 0.0388, "step": 3541 }, { "epoch": 0.72, "learning_rate": 0.00028659630204557883, "loss": 0.0159, "step": 3542 }, { "epoch": 0.72, "learning_rate": 0.0002865882909441686, "loss": 0.0268, "step": 3543 }, { "epoch": 0.72, "learning_rate": 0.0002865802775614761, "loss": 0.0534, "step": 3544 }, { "epoch": 0.72, "learning_rate": 0.0002865722618976352, "loss": 0.0176, "step": 3545 }, { "epoch": 0.72, "learning_rate": 0.00028656424395277975, "loss": 0.0117, "step": 3546 }, { "epoch": 0.72, "learning_rate": 0.0002865562237270435, "loss": 0.021, "step": 3547 }, { "epoch": 0.72, "learning_rate": 0.00028654820122056064, "loss": 0.0173, "step": 3548 }, { "epoch": 0.72, "learning_rate": 0.0002865401764334651, "loss": 0.0189, "step": 3549 }, { "epoch": 0.72, "learning_rate": 0.00028653214936589084, "loss": 0.0144, "step": 3550 }, { "epoch": 0.72, "learning_rate": 0.00028652412001797193, "loss": 0.0222, "step": 3551 }, { "epoch": 0.72, "learning_rate": 0.00028651608838984254, "loss": 0.052, "step": 3552 }, { "epoch": 0.72, "learning_rate": 0.0002865080544816368, "loss": 0.0288, "step": 3553 }, { "epoch": 0.72, "learning_rate": 0.0002865000182934889, "loss": 0.0194, "step": 3554 }, { "epoch": 0.72, "learning_rate": 0.00028649197982553293, "loss": 0.0394, "step": 3555 }, { "epoch": 0.72, "learning_rate": 0.0002864839390779033, "loss": 0.0102, "step": 3556 }, { "epoch": 0.72, "learning_rate": 0.0002864758960507342, "loss": 0.0294, "step": 3557 }, { "epoch": 0.72, "learning_rate": 0.0002864678507441601, "loss": 0.0459, "step": 3558 }, { "epoch": 0.72, "learning_rate": 0.00028645980315831533, "loss": 0.0176, "step": 3559 }, { "epoch": 0.72, "learning_rate": 0.0002864517532933342, "loss": 0.042, "step": 3560 }, { "epoch": 0.73, "learning_rate": 0.0002864437011493512, "loss": 0.0099, "step": 3561 }, { "epoch": 0.73, "learning_rate": 0.00028643564672650083, "loss": 0.028, "step": 3562 }, { "epoch": 0.73, "learning_rate": 0.00028642759002491766, "loss": 0.0322, "step": 3563 }, { "epoch": 0.73, "learning_rate": 0.0002864195310447362, "loss": 0.036, "step": 3564 }, { "epoch": 0.73, "learning_rate": 0.00028641146978609103, "loss": 0.0388, "step": 3565 }, { "epoch": 0.73, "learning_rate": 0.00028640340624911683, "loss": 0.0118, "step": 3566 }, { "epoch": 0.73, "learning_rate": 0.0002863953404339483, "loss": 0.0123, "step": 3567 }, { "epoch": 0.73, "learning_rate": 0.0002863872723407201, "loss": 0.0121, "step": 3568 }, { "epoch": 0.73, "learning_rate": 0.000286379201969567, "loss": 0.021, "step": 3569 }, { "epoch": 0.73, "learning_rate": 0.0002863711293206238, "loss": 0.0459, "step": 3570 }, { "epoch": 0.73, "learning_rate": 0.0002863630543940253, "loss": 0.0385, "step": 3571 }, { "epoch": 0.73, "learning_rate": 0.0002863549771899064, "loss": 0.0169, "step": 3572 }, { "epoch": 0.73, "learning_rate": 0.000286346897708402, "loss": 0.009, "step": 3573 }, { "epoch": 0.73, "learning_rate": 0.00028633881594964706, "loss": 0.0336, "step": 3574 }, { "epoch": 0.73, "learning_rate": 0.00028633073191377655, "loss": 0.0496, "step": 3575 }, { "epoch": 0.73, "learning_rate": 0.0002863226456009254, "loss": 0.0175, "step": 3576 }, { "epoch": 0.73, "learning_rate": 0.0002863145570112288, "loss": 0.0109, "step": 3577 }, { "epoch": 0.73, "learning_rate": 0.00028630646614482175, "loss": 0.0205, "step": 3578 }, { "epoch": 0.73, "learning_rate": 0.0002862983730018394, "loss": 0.0183, "step": 3579 }, { "epoch": 0.73, "learning_rate": 0.000286290277582417, "loss": 0.0149, "step": 3580 }, { "epoch": 0.73, "learning_rate": 0.0002862821798866897, "loss": 0.0174, "step": 3581 }, { "epoch": 0.73, "learning_rate": 0.0002862740799147927, "loss": 0.0107, "step": 3582 }, { "epoch": 0.73, "learning_rate": 0.0002862659776668613, "loss": 0.009, "step": 3583 }, { "epoch": 0.73, "learning_rate": 0.00028625787314303096, "loss": 0.0284, "step": 3584 }, { "epoch": 0.73, "learning_rate": 0.00028624976634343687, "loss": 0.0253, "step": 3585 }, { "epoch": 0.73, "learning_rate": 0.0002862416572682145, "loss": 0.0184, "step": 3586 }, { "epoch": 0.73, "learning_rate": 0.00028623354591749924, "loss": 0.0368, "step": 3587 }, { "epoch": 0.73, "learning_rate": 0.00028622543229142665, "loss": 0.0063, "step": 3588 }, { "epoch": 0.73, "learning_rate": 0.00028621731639013215, "loss": 0.0094, "step": 3589 }, { "epoch": 0.73, "learning_rate": 0.0002862091982137514, "loss": 0.0162, "step": 3590 }, { "epoch": 0.73, "learning_rate": 0.00028620107776241986, "loss": 0.0221, "step": 3591 }, { "epoch": 0.73, "learning_rate": 0.0002861929550362733, "loss": 0.0089, "step": 3592 }, { "epoch": 0.73, "learning_rate": 0.00028618483003544726, "loss": 0.0488, "step": 3593 }, { "epoch": 0.73, "learning_rate": 0.0002861767027600775, "loss": 0.0599, "step": 3594 }, { "epoch": 0.73, "learning_rate": 0.00028616857321029976, "loss": 0.0232, "step": 3595 }, { "epoch": 0.73, "learning_rate": 0.0002861604413862498, "loss": 0.0382, "step": 3596 }, { "epoch": 0.73, "learning_rate": 0.00028615230728806345, "loss": 0.0961, "step": 3597 }, { "epoch": 0.73, "learning_rate": 0.00028614417091587656, "loss": 0.0846, "step": 3598 }, { "epoch": 0.73, "learning_rate": 0.00028613603226982504, "loss": 0.0154, "step": 3599 }, { "epoch": 0.73, "learning_rate": 0.0002861278913500448, "loss": 0.022, "step": 3600 }, { "epoch": 0.73, "learning_rate": 0.0002861197481566718, "loss": 0.0665, "step": 3601 }, { "epoch": 0.73, "learning_rate": 0.00028611160268984207, "loss": 0.0128, "step": 3602 }, { "epoch": 0.73, "learning_rate": 0.00028610345494969164, "loss": 0.0342, "step": 3603 }, { "epoch": 0.73, "learning_rate": 0.00028609530493635665, "loss": 0.0401, "step": 3604 }, { "epoch": 0.73, "learning_rate": 0.0002860871526499731, "loss": 0.0418, "step": 3605 }, { "epoch": 0.73, "learning_rate": 0.00028607899809067727, "loss": 0.0148, "step": 3606 }, { "epoch": 0.73, "learning_rate": 0.0002860708412586053, "loss": 0.02, "step": 3607 }, { "epoch": 0.73, "learning_rate": 0.0002860626821538934, "loss": 0.01, "step": 3608 }, { "epoch": 0.73, "learning_rate": 0.00028605452077667785, "loss": 0.0196, "step": 3609 }, { "epoch": 0.74, "learning_rate": 0.000286046357127095, "loss": 0.0526, "step": 3610 }, { "epoch": 0.74, "learning_rate": 0.0002860381912052812, "loss": 0.0233, "step": 3611 }, { "epoch": 0.74, "learning_rate": 0.0002860300230113728, "loss": 0.0459, "step": 3612 }, { "epoch": 0.74, "learning_rate": 0.00028602185254550627, "loss": 0.0463, "step": 3613 }, { "epoch": 0.74, "learning_rate": 0.00028601367980781806, "loss": 0.0534, "step": 3614 }, { "epoch": 0.74, "learning_rate": 0.0002860055047984446, "loss": 0.0292, "step": 3615 }, { "epoch": 0.74, "learning_rate": 0.00028599732751752245, "loss": 0.028, "step": 3616 }, { "epoch": 0.74, "learning_rate": 0.0002859891479651883, "loss": 0.0352, "step": 3617 }, { "epoch": 0.74, "learning_rate": 0.00028598096614157866, "loss": 0.0526, "step": 3618 }, { "epoch": 0.74, "learning_rate": 0.0002859727820468302, "loss": 0.0236, "step": 3619 }, { "epoch": 0.74, "learning_rate": 0.0002859645956810796, "loss": 0.0175, "step": 3620 }, { "epoch": 0.74, "learning_rate": 0.0002859564070444636, "loss": 0.0358, "step": 3621 }, { "epoch": 0.74, "learning_rate": 0.00028594821613711895, "loss": 0.0064, "step": 3622 }, { "epoch": 0.74, "learning_rate": 0.0002859400229591825, "loss": 0.0137, "step": 3623 }, { "epoch": 0.74, "learning_rate": 0.000285931827510791, "loss": 0.0404, "step": 3624 }, { "epoch": 0.74, "learning_rate": 0.0002859236297920815, "loss": 0.0131, "step": 3625 }, { "epoch": 0.74, "learning_rate": 0.00028591542980319073, "loss": 0.0285, "step": 3626 }, { "epoch": 0.74, "learning_rate": 0.00028590722754425575, "loss": 0.0133, "step": 3627 }, { "epoch": 0.74, "learning_rate": 0.0002858990230154135, "loss": 0.0141, "step": 3628 }, { "epoch": 0.74, "learning_rate": 0.0002858908162168011, "loss": 0.0268, "step": 3629 }, { "epoch": 0.74, "learning_rate": 0.0002858826071485555, "loss": 0.0078, "step": 3630 }, { "epoch": 0.74, "learning_rate": 0.0002858743958108139, "loss": 0.055, "step": 3631 }, { "epoch": 0.74, "learning_rate": 0.00028586618220371334, "loss": 0.0169, "step": 3632 }, { "epoch": 0.74, "learning_rate": 0.00028585796632739114, "loss": 0.0441, "step": 3633 }, { "epoch": 0.74, "learning_rate": 0.00028584974818198443, "loss": 0.0097, "step": 3634 }, { "epoch": 0.74, "learning_rate": 0.0002858415277676305, "loss": 0.0233, "step": 3635 }, { "epoch": 0.74, "learning_rate": 0.0002858333050844666, "loss": 0.0096, "step": 3636 }, { "epoch": 0.74, "learning_rate": 0.00028582508013263015, "loss": 0.0212, "step": 3637 }, { "epoch": 0.74, "learning_rate": 0.00028581685291225844, "loss": 0.0149, "step": 3638 }, { "epoch": 0.74, "learning_rate": 0.00028580862342348896, "loss": 0.0096, "step": 3639 }, { "epoch": 0.74, "learning_rate": 0.0002858003916664591, "loss": 0.0374, "step": 3640 }, { "epoch": 0.74, "learning_rate": 0.0002857921576413063, "loss": 0.0322, "step": 3641 }, { "epoch": 0.74, "learning_rate": 0.00028578392134816823, "loss": 0.0156, "step": 3642 }, { "epoch": 0.74, "learning_rate": 0.0002857756827871823, "loss": 0.0235, "step": 3643 }, { "epoch": 0.74, "learning_rate": 0.0002857674419584862, "loss": 0.0376, "step": 3644 }, { "epoch": 0.74, "learning_rate": 0.0002857591988622175, "loss": 0.0261, "step": 3645 }, { "epoch": 0.74, "learning_rate": 0.00028575095349851396, "loss": 0.0173, "step": 3646 }, { "epoch": 0.74, "learning_rate": 0.0002857427058675132, "loss": 0.03, "step": 3647 }, { "epoch": 0.74, "learning_rate": 0.0002857344559693531, "loss": 0.0074, "step": 3648 }, { "epoch": 0.74, "learning_rate": 0.00028572620380417133, "loss": 0.0423, "step": 3649 }, { "epoch": 0.74, "learning_rate": 0.0002857179493721057, "loss": 0.0162, "step": 3650 }, { "epoch": 0.74, "learning_rate": 0.0002857096926732942, "loss": 0.0137, "step": 3651 }, { "epoch": 0.74, "learning_rate": 0.00028570143370787465, "loss": 0.0192, "step": 3652 }, { "epoch": 0.74, "learning_rate": 0.00028569317247598494, "loss": 0.0117, "step": 3653 }, { "epoch": 0.74, "learning_rate": 0.00028568490897776315, "loss": 0.0183, "step": 3654 }, { "epoch": 0.74, "learning_rate": 0.00028567664321334734, "loss": 0.025, "step": 3655 }, { "epoch": 0.74, "learning_rate": 0.00028566837518287537, "loss": 0.014, "step": 3656 }, { "epoch": 0.74, "learning_rate": 0.0002856601048864855, "loss": 0.0211, "step": 3657 }, { "epoch": 0.74, "learning_rate": 0.00028565183232431574, "loss": 0.0219, "step": 3658 }, { "epoch": 0.75, "learning_rate": 0.0002856435574965044, "loss": 0.0156, "step": 3659 }, { "epoch": 0.75, "learning_rate": 0.0002856352804031895, "loss": 0.0042, "step": 3660 }, { "epoch": 0.75, "learning_rate": 0.00028562700104450947, "loss": 0.0177, "step": 3661 }, { "epoch": 0.75, "learning_rate": 0.0002856187194206025, "loss": 0.0168, "step": 3662 }, { "epoch": 0.75, "learning_rate": 0.0002856104355316069, "loss": 0.0183, "step": 3663 }, { "epoch": 0.75, "learning_rate": 0.0002856021493776611, "loss": 0.0432, "step": 3664 }, { "epoch": 0.75, "learning_rate": 0.00028559386095890335, "loss": 0.0163, "step": 3665 }, { "epoch": 0.75, "learning_rate": 0.00028558557027547223, "loss": 0.0083, "step": 3666 }, { "epoch": 0.75, "learning_rate": 0.00028557727732750614, "loss": 0.0117, "step": 3667 }, { "epoch": 0.75, "learning_rate": 0.0002855689821151436, "loss": 0.01, "step": 3668 }, { "epoch": 0.75, "learning_rate": 0.0002855606846385231, "loss": 0.0353, "step": 3669 }, { "epoch": 0.75, "learning_rate": 0.00028555238489778336, "loss": 0.0194, "step": 3670 }, { "epoch": 0.75, "learning_rate": 0.0002855440828930629, "loss": 0.0287, "step": 3671 }, { "epoch": 0.75, "learning_rate": 0.00028553577862450033, "loss": 0.0236, "step": 3672 }, { "epoch": 0.75, "learning_rate": 0.0002855274720922345, "loss": 0.0114, "step": 3673 }, { "epoch": 0.75, "learning_rate": 0.000285519163296404, "loss": 0.0481, "step": 3674 }, { "epoch": 0.75, "learning_rate": 0.0002855108522371477, "loss": 0.0203, "step": 3675 }, { "epoch": 0.75, "learning_rate": 0.0002855025389146043, "loss": 0.009, "step": 3676 }, { "epoch": 0.75, "learning_rate": 0.00028549422332891283, "loss": 0.0256, "step": 3677 }, { "epoch": 0.75, "learning_rate": 0.000285485905480212, "loss": 0.0399, "step": 3678 }, { "epoch": 0.75, "learning_rate": 0.00028547758536864084, "loss": 0.0319, "step": 3679 }, { "epoch": 0.75, "learning_rate": 0.0002854692629943382, "loss": 0.0357, "step": 3680 }, { "epoch": 0.75, "learning_rate": 0.00028546093835744326, "loss": 0.0166, "step": 3681 }, { "epoch": 0.75, "learning_rate": 0.0002854526114580949, "loss": 0.0401, "step": 3682 }, { "epoch": 0.75, "learning_rate": 0.0002854442822964322, "loss": 0.0169, "step": 3683 }, { "epoch": 0.75, "learning_rate": 0.0002854359508725943, "loss": 0.0346, "step": 3684 }, { "epoch": 0.75, "learning_rate": 0.0002854276171867205, "loss": 0.0354, "step": 3685 }, { "epoch": 0.75, "learning_rate": 0.00028541928123894974, "loss": 0.0119, "step": 3686 }, { "epoch": 0.75, "learning_rate": 0.0002854109430294214, "loss": 0.0191, "step": 3687 }, { "epoch": 0.75, "learning_rate": 0.0002854026025582747, "loss": 0.0585, "step": 3688 }, { "epoch": 0.75, "learning_rate": 0.00028539425982564896, "loss": 0.0073, "step": 3689 }, { "epoch": 0.75, "learning_rate": 0.0002853859148316835, "loss": 0.0291, "step": 3690 }, { "epoch": 0.75, "learning_rate": 0.0002853775675765177, "loss": 0.014, "step": 3691 }, { "epoch": 0.75, "learning_rate": 0.00028536921806029096, "loss": 0.055, "step": 3692 }, { "epoch": 0.75, "learning_rate": 0.00028536086628314273, "loss": 0.0142, "step": 3693 }, { "epoch": 0.75, "learning_rate": 0.00028535251224521256, "loss": 0.0373, "step": 3694 }, { "epoch": 0.75, "learning_rate": 0.00028534415594663997, "loss": 0.0133, "step": 3695 }, { "epoch": 0.75, "learning_rate": 0.00028533579738756446, "loss": 0.0572, "step": 3696 }, { "epoch": 0.75, "learning_rate": 0.0002853274365681256, "loss": 0.0078, "step": 3697 }, { "epoch": 0.75, "learning_rate": 0.0002853190734884632, "loss": 0.0665, "step": 3698 }, { "epoch": 0.75, "learning_rate": 0.00028531070814871685, "loss": 0.0099, "step": 3699 }, { "epoch": 0.75, "learning_rate": 0.0002853023405490262, "loss": 0.0201, "step": 3700 }, { "epoch": 0.75, "learning_rate": 0.0002852939706895311, "loss": 0.0363, "step": 3701 }, { "epoch": 0.75, "learning_rate": 0.00028528559857037125, "loss": 0.004, "step": 3702 }, { "epoch": 0.75, "learning_rate": 0.00028527722419168655, "loss": 0.0101, "step": 3703 }, { "epoch": 0.75, "learning_rate": 0.0002852688475536169, "loss": 0.0579, "step": 3704 }, { "epoch": 0.75, "learning_rate": 0.0002852604686563021, "loss": 0.0454, "step": 3705 }, { "epoch": 0.75, "learning_rate": 0.0002852520874998822, "loss": 0.0382, "step": 3706 }, { "epoch": 0.75, "learning_rate": 0.0002852437040844971, "loss": 0.0454, "step": 3707 }, { "epoch": 0.76, "learning_rate": 0.00028523531841028685, "loss": 0.0254, "step": 3708 }, { "epoch": 0.76, "learning_rate": 0.0002852269304773915, "loss": 0.0248, "step": 3709 }, { "epoch": 0.76, "learning_rate": 0.0002852185402859512, "loss": 0.0164, "step": 3710 }, { "epoch": 0.76, "learning_rate": 0.000285210147836106, "loss": 0.0102, "step": 3711 }, { "epoch": 0.76, "learning_rate": 0.0002852017531279961, "loss": 0.0137, "step": 3712 }, { "epoch": 0.76, "learning_rate": 0.0002851933561617617, "loss": 0.0067, "step": 3713 }, { "epoch": 0.76, "learning_rate": 0.0002851849569375431, "loss": 0.021, "step": 3714 }, { "epoch": 0.76, "learning_rate": 0.00028517655545548054, "loss": 0.015, "step": 3715 }, { "epoch": 0.76, "learning_rate": 0.0002851681517157143, "loss": 0.017, "step": 3716 }, { "epoch": 0.76, "learning_rate": 0.0002851597457183848, "loss": 0.014, "step": 3717 }, { "epoch": 0.76, "learning_rate": 0.0002851513374636324, "loss": 0.0258, "step": 3718 }, { "epoch": 0.76, "learning_rate": 0.00028514292695159757, "loss": 0.0212, "step": 3719 }, { "epoch": 0.76, "learning_rate": 0.00028513451418242075, "loss": 0.0066, "step": 3720 }, { "epoch": 0.76, "learning_rate": 0.00028512609915624243, "loss": 0.0315, "step": 3721 }, { "epoch": 0.76, "learning_rate": 0.00028511768187320323, "loss": 0.0262, "step": 3722 }, { "epoch": 0.76, "learning_rate": 0.0002851092623334436, "loss": 0.0283, "step": 3723 }, { "epoch": 0.76, "learning_rate": 0.00028510084053710443, "loss": 0.0358, "step": 3724 }, { "epoch": 0.76, "learning_rate": 0.00028509241648432606, "loss": 0.0135, "step": 3725 }, { "epoch": 0.76, "learning_rate": 0.00028508399017524935, "loss": 0.0312, "step": 3726 }, { "epoch": 0.76, "learning_rate": 0.00028507556161001503, "loss": 0.0113, "step": 3727 }, { "epoch": 0.76, "learning_rate": 0.0002850671307887639, "loss": 0.0199, "step": 3728 }, { "epoch": 0.76, "learning_rate": 0.00028505869771163666, "loss": 0.0181, "step": 3729 }, { "epoch": 0.76, "learning_rate": 0.00028505026237877427, "loss": 0.0322, "step": 3730 }, { "epoch": 0.76, "learning_rate": 0.0002850418247903175, "loss": 0.025, "step": 3731 }, { "epoch": 0.76, "learning_rate": 0.00028503338494640745, "loss": 0.029, "step": 3732 }, { "epoch": 0.76, "learning_rate": 0.0002850249428471849, "loss": 0.006, "step": 3733 }, { "epoch": 0.76, "learning_rate": 0.00028501649849279096, "loss": 0.0151, "step": 3734 }, { "epoch": 0.76, "learning_rate": 0.00028500805188336664, "loss": 0.027, "step": 3735 }, { "epoch": 0.76, "learning_rate": 0.000284999603019053, "loss": 0.0164, "step": 3736 }, { "epoch": 0.76, "learning_rate": 0.00028499115189999113, "loss": 0.0318, "step": 3737 }, { "epoch": 0.76, "learning_rate": 0.0002849826985263223, "loss": 0.032, "step": 3738 }, { "epoch": 0.76, "learning_rate": 0.0002849742428981875, "loss": 0.0194, "step": 3739 }, { "epoch": 0.76, "learning_rate": 0.00028496578501572813, "loss": 0.0167, "step": 3740 }, { "epoch": 0.76, "learning_rate": 0.0002849573248790854, "loss": 0.0071, "step": 3741 }, { "epoch": 0.76, "learning_rate": 0.0002849488624884005, "loss": 0.0155, "step": 3742 }, { "epoch": 0.76, "learning_rate": 0.00028494039784381493, "loss": 0.0361, "step": 3743 }, { "epoch": 0.76, "learning_rate": 0.00028493193094547, "loss": 0.0578, "step": 3744 }, { "epoch": 0.76, "learning_rate": 0.0002849234617935071, "loss": 0.0114, "step": 3745 }, { "epoch": 0.76, "learning_rate": 0.00028491499038806766, "loss": 0.0217, "step": 3746 }, { "epoch": 0.76, "learning_rate": 0.0002849065167292933, "loss": 0.0506, "step": 3747 }, { "epoch": 0.76, "learning_rate": 0.0002848980408173254, "loss": 0.0277, "step": 3748 }, { "epoch": 0.76, "learning_rate": 0.00028488956265230564, "loss": 0.0386, "step": 3749 }, { "epoch": 0.76, "learning_rate": 0.0002848810822343755, "loss": 0.0071, "step": 3750 }, { "epoch": 0.76, "learning_rate": 0.0002848725995636767, "loss": 0.0421, "step": 3751 }, { "epoch": 0.76, "learning_rate": 0.0002848641146403509, "loss": 0.024, "step": 3752 }, { "epoch": 0.76, "learning_rate": 0.0002848556274645398, "loss": 0.0091, "step": 3753 }, { "epoch": 0.76, "learning_rate": 0.00028484713803638513, "loss": 0.0241, "step": 3754 }, { "epoch": 0.76, "learning_rate": 0.0002848386463560288, "loss": 0.0176, "step": 3755 }, { "epoch": 0.76, "learning_rate": 0.0002848301524236125, "loss": 0.0231, "step": 3756 }, { "epoch": 0.76, "learning_rate": 0.00028482165623927813, "loss": 0.0313, "step": 3757 }, { "epoch": 0.77, "learning_rate": 0.00028481315780316764, "loss": 0.0239, "step": 3758 }, { "epoch": 0.77, "learning_rate": 0.00028480465711542294, "loss": 0.0538, "step": 3759 }, { "epoch": 0.77, "learning_rate": 0.00028479615417618595, "loss": 0.0427, "step": 3760 }, { "epoch": 0.77, "learning_rate": 0.0002847876489855988, "loss": 0.0302, "step": 3761 }, { "epoch": 0.77, "learning_rate": 0.00028477914154380346, "loss": 0.0088, "step": 3762 }, { "epoch": 0.77, "learning_rate": 0.000284770631850942, "loss": 0.0424, "step": 3763 }, { "epoch": 0.77, "learning_rate": 0.00028476211990715667, "loss": 0.018, "step": 3764 }, { "epoch": 0.77, "learning_rate": 0.0002847536057125895, "loss": 0.0079, "step": 3765 }, { "epoch": 0.77, "learning_rate": 0.00028474508926738275, "loss": 0.047, "step": 3766 }, { "epoch": 0.77, "learning_rate": 0.00028473657057167867, "loss": 0.0094, "step": 3767 }, { "epoch": 0.77, "learning_rate": 0.0002847280496256196, "loss": 0.0191, "step": 3768 }, { "epoch": 0.77, "learning_rate": 0.00028471952642934766, "loss": 0.0315, "step": 3769 }, { "epoch": 0.77, "learning_rate": 0.0002847110009830054, "loss": 0.0312, "step": 3770 }, { "epoch": 0.77, "learning_rate": 0.0002847024732867351, "loss": 0.0167, "step": 3771 }, { "epoch": 0.77, "learning_rate": 0.00028469394334067926, "loss": 0.0091, "step": 3772 }, { "epoch": 0.77, "learning_rate": 0.0002846854111449803, "loss": 0.0237, "step": 3773 }, { "epoch": 0.77, "learning_rate": 0.00028467687669978073, "loss": 0.0171, "step": 3774 }, { "epoch": 0.77, "learning_rate": 0.00028466834000522316, "loss": 0.0114, "step": 3775 }, { "epoch": 0.77, "learning_rate": 0.00028465980106145, "loss": 0.0106, "step": 3776 }, { "epoch": 0.77, "learning_rate": 0.00028465125986860403, "loss": 0.0325, "step": 3777 }, { "epoch": 0.77, "learning_rate": 0.0002846427164268279, "loss": 0.0193, "step": 3778 }, { "epoch": 0.77, "learning_rate": 0.00028463417073626413, "loss": 0.0146, "step": 3779 }, { "epoch": 0.77, "learning_rate": 0.0002846256227970557, "loss": 0.041, "step": 3780 }, { "epoch": 0.77, "learning_rate": 0.00028461707260934516, "loss": 0.0185, "step": 3781 }, { "epoch": 0.77, "learning_rate": 0.00028460852017327544, "loss": 0.0186, "step": 3782 }, { "epoch": 0.77, "learning_rate": 0.00028459996548898934, "loss": 0.0194, "step": 3783 }, { "epoch": 0.77, "learning_rate": 0.0002845914085566297, "loss": 0.015, "step": 3784 }, { "epoch": 0.77, "learning_rate": 0.00028458284937633947, "loss": 0.0308, "step": 3785 }, { "epoch": 0.77, "learning_rate": 0.00028457428794826165, "loss": 0.0177, "step": 3786 }, { "epoch": 0.77, "learning_rate": 0.0002845657242725392, "loss": 0.0311, "step": 3787 }, { "epoch": 0.77, "learning_rate": 0.00028455715834931517, "loss": 0.0251, "step": 3788 }, { "epoch": 0.77, "learning_rate": 0.00028454859017873257, "loss": 0.0042, "step": 3789 }, { "epoch": 0.77, "learning_rate": 0.0002845400197609345, "loss": 0.0235, "step": 3790 }, { "epoch": 0.77, "learning_rate": 0.0002845314470960642, "loss": 0.0121, "step": 3791 }, { "epoch": 0.77, "learning_rate": 0.0002845228721842647, "loss": 0.0368, "step": 3792 }, { "epoch": 0.77, "learning_rate": 0.0002845142950256794, "loss": 0.0433, "step": 3793 }, { "epoch": 0.77, "learning_rate": 0.0002845057156204514, "loss": 0.0305, "step": 3794 }, { "epoch": 0.77, "learning_rate": 0.00028449713396872406, "loss": 0.0351, "step": 3795 }, { "epoch": 0.77, "learning_rate": 0.00028448855007064073, "loss": 0.0144, "step": 3796 }, { "epoch": 0.77, "learning_rate": 0.00028447996392634475, "loss": 0.0214, "step": 3797 }, { "epoch": 0.77, "learning_rate": 0.0002844713755359795, "loss": 0.0193, "step": 3798 }, { "epoch": 0.77, "learning_rate": 0.0002844627848996884, "loss": 0.0108, "step": 3799 }, { "epoch": 0.77, "learning_rate": 0.00028445419201761504, "loss": 0.0247, "step": 3800 }, { "epoch": 0.77, "learning_rate": 0.0002844455968899029, "loss": 0.0118, "step": 3801 }, { "epoch": 0.77, "learning_rate": 0.00028443699951669543, "loss": 0.0086, "step": 3802 }, { "epoch": 0.77, "learning_rate": 0.00028442839989813634, "loss": 0.0441, "step": 3803 }, { "epoch": 0.77, "learning_rate": 0.0002844197980343692, "loss": 0.0471, "step": 3804 }, { "epoch": 0.77, "learning_rate": 0.0002844111939255377, "loss": 0.0208, "step": 3805 }, { "epoch": 0.77, "learning_rate": 0.0002844025875717856, "loss": 0.0156, "step": 3806 }, { "epoch": 0.78, "learning_rate": 0.00028439397897325654, "loss": 0.0208, "step": 3807 }, { "epoch": 0.78, "learning_rate": 0.00028438536813009434, "loss": 0.0212, "step": 3808 }, { "epoch": 0.78, "learning_rate": 0.0002843767550424428, "loss": 0.0294, "step": 3809 }, { "epoch": 0.78, "learning_rate": 0.0002843681397104458, "loss": 0.0242, "step": 3810 }, { "epoch": 0.78, "learning_rate": 0.0002843595221342473, "loss": 0.0237, "step": 3811 }, { "epoch": 0.78, "learning_rate": 0.0002843509023139911, "loss": 0.0019, "step": 3812 }, { "epoch": 0.78, "learning_rate": 0.00028434228024982127, "loss": 0.0077, "step": 3813 }, { "epoch": 0.78, "learning_rate": 0.0002843336559418817, "loss": 0.0179, "step": 3814 }, { "epoch": 0.78, "learning_rate": 0.0002843250293903166, "loss": 0.0154, "step": 3815 }, { "epoch": 0.78, "learning_rate": 0.00028431640059526985, "loss": 0.0267, "step": 3816 }, { "epoch": 0.78, "learning_rate": 0.00028430776955688575, "loss": 0.0152, "step": 3817 }, { "epoch": 0.78, "learning_rate": 0.0002842991362753083, "loss": 0.029, "step": 3818 }, { "epoch": 0.78, "learning_rate": 0.00028429050075068184, "loss": 0.012, "step": 3819 }, { "epoch": 0.78, "learning_rate": 0.00028428186298315043, "loss": 0.0301, "step": 3820 }, { "epoch": 0.78, "learning_rate": 0.00028427322297285853, "loss": 0.038, "step": 3821 }, { "epoch": 0.78, "learning_rate": 0.0002842645807199503, "loss": 0.0148, "step": 3822 }, { "epoch": 0.78, "learning_rate": 0.00028425593622457017, "loss": 0.0302, "step": 3823 }, { "epoch": 0.78, "learning_rate": 0.00028424728948686244, "loss": 0.0342, "step": 3824 }, { "epoch": 0.78, "learning_rate": 0.00028423864050697154, "loss": 0.0119, "step": 3825 }, { "epoch": 0.78, "learning_rate": 0.000284229989285042, "loss": 0.0319, "step": 3826 }, { "epoch": 0.78, "learning_rate": 0.0002842213358212183, "loss": 0.0189, "step": 3827 }, { "epoch": 0.78, "learning_rate": 0.00028421268011564484, "loss": 0.0124, "step": 3828 }, { "epoch": 0.78, "learning_rate": 0.0002842040221684663, "loss": 0.0459, "step": 3829 }, { "epoch": 0.78, "learning_rate": 0.00028419536197982735, "loss": 0.0686, "step": 3830 }, { "epoch": 0.78, "learning_rate": 0.0002841866995498725, "loss": 0.0168, "step": 3831 }, { "epoch": 0.78, "learning_rate": 0.0002841780348787464, "loss": 0.0107, "step": 3832 }, { "epoch": 0.78, "learning_rate": 0.00028416936796659385, "loss": 0.0169, "step": 3833 }, { "epoch": 0.78, "learning_rate": 0.00028416069881355963, "loss": 0.0647, "step": 3834 }, { "epoch": 0.78, "learning_rate": 0.0002841520274197885, "loss": 0.0187, "step": 3835 }, { "epoch": 0.78, "learning_rate": 0.0002841433537854253, "loss": 0.0211, "step": 3836 }, { "epoch": 0.78, "learning_rate": 0.0002841346779106148, "loss": 0.0242, "step": 3837 }, { "epoch": 0.78, "learning_rate": 0.00028412599979550207, "loss": 0.0109, "step": 3838 }, { "epoch": 0.78, "learning_rate": 0.0002841173194402319, "loss": 0.0183, "step": 3839 }, { "epoch": 0.78, "learning_rate": 0.00028410863684494937, "loss": 0.0312, "step": 3840 }, { "epoch": 0.78, "learning_rate": 0.00028409995200979945, "loss": 0.0044, "step": 3841 }, { "epoch": 0.78, "learning_rate": 0.0002840912649349272, "loss": 0.0076, "step": 3842 }, { "epoch": 0.78, "learning_rate": 0.00028408257562047767, "loss": 0.0202, "step": 3843 }, { "epoch": 0.78, "learning_rate": 0.00028407388406659606, "loss": 0.0297, "step": 3844 }, { "epoch": 0.78, "learning_rate": 0.0002840651902734275, "loss": 0.0333, "step": 3845 }, { "epoch": 0.78, "learning_rate": 0.0002840564942411172, "loss": 0.0343, "step": 3846 }, { "epoch": 0.78, "learning_rate": 0.0002840477959698104, "loss": 0.0343, "step": 3847 }, { "epoch": 0.78, "learning_rate": 0.00028403909545965237, "loss": 0.0182, "step": 3848 }, { "epoch": 0.78, "learning_rate": 0.0002840303927107885, "loss": 0.0156, "step": 3849 }, { "epoch": 0.78, "learning_rate": 0.00028402168772336396, "loss": 0.014, "step": 3850 }, { "epoch": 0.78, "learning_rate": 0.0002840129804975243, "loss": 0.0339, "step": 3851 }, { "epoch": 0.78, "learning_rate": 0.00028400427103341487, "loss": 0.0136, "step": 3852 }, { "epoch": 0.78, "learning_rate": 0.0002839955593311812, "loss": 0.0333, "step": 3853 }, { "epoch": 0.78, "learning_rate": 0.0002839868453909687, "loss": 0.016, "step": 3854 }, { "epoch": 0.78, "learning_rate": 0.000283978129212923, "loss": 0.0296, "step": 3855 }, { "epoch": 0.79, "learning_rate": 0.0002839694107971897, "loss": 0.0495, "step": 3856 }, { "epoch": 0.79, "learning_rate": 0.0002839606901439143, "loss": 0.0364, "step": 3857 }, { "epoch": 0.79, "learning_rate": 0.00028395196725324246, "loss": 0.0252, "step": 3858 }, { "epoch": 0.79, "learning_rate": 0.00028394324212531994, "loss": 0.0235, "step": 3859 }, { "epoch": 0.79, "learning_rate": 0.0002839345147602925, "loss": 0.0148, "step": 3860 }, { "epoch": 0.79, "learning_rate": 0.0002839257851583058, "loss": 0.0601, "step": 3861 }, { "epoch": 0.79, "learning_rate": 0.00028391705331950567, "loss": 0.018, "step": 3862 }, { "epoch": 0.79, "learning_rate": 0.00028390831924403803, "loss": 0.0096, "step": 3863 }, { "epoch": 0.79, "learning_rate": 0.0002838995829320486, "loss": 0.0223, "step": 3864 }, { "epoch": 0.79, "learning_rate": 0.00028389084438368344, "loss": 0.007, "step": 3865 }, { "epoch": 0.79, "learning_rate": 0.0002838821035990884, "loss": 0.0246, "step": 3866 }, { "epoch": 0.79, "learning_rate": 0.00028387336057840955, "loss": 0.0177, "step": 3867 }, { "epoch": 0.79, "learning_rate": 0.00028386461532179286, "loss": 0.0194, "step": 3868 }, { "epoch": 0.79, "learning_rate": 0.00028385586782938443, "loss": 0.0456, "step": 3869 }, { "epoch": 0.79, "learning_rate": 0.0002838471181013303, "loss": 0.023, "step": 3870 }, { "epoch": 0.79, "learning_rate": 0.00028383836613777663, "loss": 0.0178, "step": 3871 }, { "epoch": 0.79, "learning_rate": 0.0002838296119388697, "loss": 0.0177, "step": 3872 }, { "epoch": 0.79, "learning_rate": 0.0002838208555047555, "loss": 0.0363, "step": 3873 }, { "epoch": 0.79, "learning_rate": 0.00028381209683558045, "loss": 0.011, "step": 3874 }, { "epoch": 0.79, "learning_rate": 0.00028380333593149086, "loss": 0.0126, "step": 3875 }, { "epoch": 0.79, "learning_rate": 0.0002837945727926329, "loss": 0.0217, "step": 3876 }, { "epoch": 0.79, "learning_rate": 0.00028378580741915307, "loss": 0.0294, "step": 3877 }, { "epoch": 0.79, "learning_rate": 0.0002837770398111977, "loss": 0.0121, "step": 3878 }, { "epoch": 0.79, "learning_rate": 0.00028376826996891327, "loss": 0.0207, "step": 3879 }, { "epoch": 0.79, "learning_rate": 0.00028375949789244626, "loss": 0.0771, "step": 3880 }, { "epoch": 0.79, "learning_rate": 0.00028375072358194305, "loss": 0.056, "step": 3881 }, { "epoch": 0.79, "learning_rate": 0.00028374194703755033, "loss": 0.028, "step": 3882 }, { "epoch": 0.79, "learning_rate": 0.00028373316825941464, "loss": 0.0595, "step": 3883 }, { "epoch": 0.79, "learning_rate": 0.0002837243872476826, "loss": 0.0251, "step": 3884 }, { "epoch": 0.79, "learning_rate": 0.0002837156040025009, "loss": 0.0249, "step": 3885 }, { "epoch": 0.79, "learning_rate": 0.0002837068185240161, "loss": 0.0181, "step": 3886 }, { "epoch": 0.79, "learning_rate": 0.00028369803081237515, "loss": 0.0381, "step": 3887 }, { "epoch": 0.79, "learning_rate": 0.0002836892408677247, "loss": 0.0183, "step": 3888 }, { "epoch": 0.79, "learning_rate": 0.0002836804486902115, "loss": 0.016, "step": 3889 }, { "epoch": 0.79, "learning_rate": 0.00028367165427998256, "loss": 0.0061, "step": 3890 }, { "epoch": 0.79, "learning_rate": 0.0002836628576371846, "loss": 0.0107, "step": 3891 }, { "epoch": 0.79, "learning_rate": 0.00028365405876196463, "loss": 0.0092, "step": 3892 }, { "epoch": 0.79, "learning_rate": 0.00028364525765446966, "loss": 0.0166, "step": 3893 }, { "epoch": 0.79, "learning_rate": 0.0002836364543148465, "loss": 0.0247, "step": 3894 }, { "epoch": 0.79, "learning_rate": 0.00028362764874324234, "loss": 0.0336, "step": 3895 }, { "epoch": 0.79, "learning_rate": 0.00028361884093980425, "loss": 0.016, "step": 3896 }, { "epoch": 0.79, "learning_rate": 0.00028361003090467926, "loss": 0.0203, "step": 3897 }, { "epoch": 0.79, "learning_rate": 0.0002836012186380145, "loss": 0.0217, "step": 3898 }, { "epoch": 0.79, "learning_rate": 0.0002835924041399573, "loss": 0.0116, "step": 3899 }, { "epoch": 0.79, "learning_rate": 0.0002835835874106547, "loss": 0.0176, "step": 3900 }, { "epoch": 0.79, "learning_rate": 0.00028357476845025404, "loss": 0.0213, "step": 3901 }, { "epoch": 0.79, "learning_rate": 0.0002835659472589026, "loss": 0.0081, "step": 3902 }, { "epoch": 0.79, "learning_rate": 0.00028355712383674775, "loss": 0.0207, "step": 3903 }, { "epoch": 0.79, "learning_rate": 0.0002835482981839368, "loss": 0.0156, "step": 3904 }, { "epoch": 0.8, "learning_rate": 0.0002835394703006172, "loss": 0.0365, "step": 3905 }, { "epoch": 0.8, "learning_rate": 0.0002835306401869364, "loss": 0.0306, "step": 3906 }, { "epoch": 0.8, "learning_rate": 0.00028352180784304177, "loss": 0.0098, "step": 3907 }, { "epoch": 0.8, "learning_rate": 0.000283512973269081, "loss": 0.0178, "step": 3908 }, { "epoch": 0.8, "learning_rate": 0.0002835041364652015, "loss": 0.0138, "step": 3909 }, { "epoch": 0.8, "learning_rate": 0.0002834952974315509, "loss": 0.0098, "step": 3910 }, { "epoch": 0.8, "learning_rate": 0.0002834864561682769, "loss": 0.0046, "step": 3911 }, { "epoch": 0.8, "learning_rate": 0.00028347761267552703, "loss": 0.0062, "step": 3912 }, { "epoch": 0.8, "learning_rate": 0.00028346876695344914, "loss": 0.0243, "step": 3913 }, { "epoch": 0.8, "learning_rate": 0.00028345991900219087, "loss": 0.0232, "step": 3914 }, { "epoch": 0.8, "learning_rate": 0.0002834510688219, "loss": 0.009, "step": 3915 }, { "epoch": 0.8, "learning_rate": 0.0002834422164127244, "loss": 0.0126, "step": 3916 }, { "epoch": 0.8, "learning_rate": 0.0002834333617748119, "loss": 0.0193, "step": 3917 }, { "epoch": 0.8, "learning_rate": 0.0002834245049083104, "loss": 0.0172, "step": 3918 }, { "epoch": 0.8, "learning_rate": 0.0002834156458133678, "loss": 0.0158, "step": 3919 }, { "epoch": 0.8, "learning_rate": 0.0002834067844901321, "loss": 0.0429, "step": 3920 }, { "epoch": 0.8, "learning_rate": 0.00028339792093875127, "loss": 0.0275, "step": 3921 }, { "epoch": 0.8, "learning_rate": 0.0002833890551593733, "loss": 0.0149, "step": 3922 }, { "epoch": 0.8, "learning_rate": 0.0002833801871521464, "loss": 0.0372, "step": 3923 }, { "epoch": 0.8, "learning_rate": 0.0002833713169172185, "loss": 0.0112, "step": 3924 }, { "epoch": 0.8, "learning_rate": 0.00028336244445473794, "loss": 0.0141, "step": 3925 }, { "epoch": 0.8, "learning_rate": 0.0002833535697648528, "loss": 0.0231, "step": 3926 }, { "epoch": 0.8, "learning_rate": 0.0002833446928477113, "loss": 0.0533, "step": 3927 }, { "epoch": 0.8, "learning_rate": 0.0002833358137034617, "loss": 0.0268, "step": 3928 }, { "epoch": 0.8, "learning_rate": 0.0002833269323322524, "loss": 0.0105, "step": 3929 }, { "epoch": 0.8, "learning_rate": 0.00028331804873423156, "loss": 0.0509, "step": 3930 }, { "epoch": 0.8, "learning_rate": 0.0002833091629095477, "loss": 0.0082, "step": 3931 }, { "epoch": 0.8, "learning_rate": 0.00028330027485834924, "loss": 0.0213, "step": 3932 }, { "epoch": 0.8, "learning_rate": 0.0002832913845807845, "loss": 0.0162, "step": 3933 }, { "epoch": 0.8, "learning_rate": 0.000283282492077002, "loss": 0.0242, "step": 3934 }, { "epoch": 0.8, "learning_rate": 0.0002832735973471504, "loss": 0.0166, "step": 3935 }, { "epoch": 0.8, "learning_rate": 0.00028326470039137806, "loss": 0.0252, "step": 3936 }, { "epoch": 0.8, "learning_rate": 0.0002832558012098337, "loss": 0.019, "step": 3937 }, { "epoch": 0.8, "learning_rate": 0.0002832468998026659, "loss": 0.0165, "step": 3938 }, { "epoch": 0.8, "learning_rate": 0.0002832379961700234, "loss": 0.0095, "step": 3939 }, { "epoch": 0.8, "learning_rate": 0.00028322909031205484, "loss": 0.0238, "step": 3940 }, { "epoch": 0.8, "learning_rate": 0.000283220182228909, "loss": 0.0097, "step": 3941 }, { "epoch": 0.8, "learning_rate": 0.0002832112719207346, "loss": 0.026, "step": 3942 }, { "epoch": 0.8, "learning_rate": 0.0002832023593876805, "loss": 0.0118, "step": 3943 }, { "epoch": 0.8, "learning_rate": 0.00028319344462989556, "loss": 0.0248, "step": 3944 }, { "epoch": 0.8, "learning_rate": 0.0002831845276475287, "loss": 0.0185, "step": 3945 }, { "epoch": 0.8, "learning_rate": 0.0002831756084407289, "loss": 0.0154, "step": 3946 }, { "epoch": 0.8, "learning_rate": 0.0002831666870096449, "loss": 0.0236, "step": 3947 }, { "epoch": 0.8, "learning_rate": 0.000283157763354426, "loss": 0.0055, "step": 3948 }, { "epoch": 0.8, "learning_rate": 0.000283148837475221, "loss": 0.0217, "step": 3949 }, { "epoch": 0.8, "learning_rate": 0.00028313990937217914, "loss": 0.0155, "step": 3950 }, { "epoch": 0.8, "learning_rate": 0.0002831309790454494, "loss": 0.0234, "step": 3951 }, { "epoch": 0.8, "learning_rate": 0.0002831220464951811, "loss": 0.0293, "step": 3952 }, { "epoch": 0.8, "learning_rate": 0.00028311311172152324, "loss": 0.0183, "step": 3953 }, { "epoch": 0.81, "learning_rate": 0.00028310417472462524, "loss": 0.019, "step": 3954 }, { "epoch": 0.81, "learning_rate": 0.0002830952355046362, "loss": 0.022, "step": 3955 }, { "epoch": 0.81, "learning_rate": 0.00028308629406170553, "loss": 0.015, "step": 3956 }, { "epoch": 0.81, "learning_rate": 0.00028307735039598253, "loss": 0.0065, "step": 3957 }, { "epoch": 0.81, "learning_rate": 0.00028306840450761657, "loss": 0.0464, "step": 3958 }, { "epoch": 0.81, "learning_rate": 0.00028305945639675703, "loss": 0.02, "step": 3959 }, { "epoch": 0.81, "learning_rate": 0.00028305050606355344, "loss": 0.022, "step": 3960 }, { "epoch": 0.81, "learning_rate": 0.0002830415535081552, "loss": 0.0116, "step": 3961 }, { "epoch": 0.81, "learning_rate": 0.000283032598730712, "loss": 0.0216, "step": 3962 }, { "epoch": 0.81, "learning_rate": 0.00028302364173137315, "loss": 0.0363, "step": 3963 }, { "epoch": 0.81, "learning_rate": 0.0002830146825102885, "loss": 0.0088, "step": 3964 }, { "epoch": 0.81, "learning_rate": 0.0002830057210676075, "loss": 0.0128, "step": 3965 }, { "epoch": 0.81, "learning_rate": 0.00028299675740347987, "loss": 0.0123, "step": 3966 }, { "epoch": 0.81, "learning_rate": 0.0002829877915180554, "loss": 0.0168, "step": 3967 }, { "epoch": 0.81, "learning_rate": 0.00028297882341148377, "loss": 0.0146, "step": 3968 }, { "epoch": 0.81, "learning_rate": 0.00028296985308391476, "loss": 0.0316, "step": 3969 }, { "epoch": 0.81, "learning_rate": 0.0002829608805354982, "loss": 0.013, "step": 3970 }, { "epoch": 0.81, "learning_rate": 0.00028295190576638397, "loss": 0.0211, "step": 3971 }, { "epoch": 0.81, "learning_rate": 0.00028294292877672193, "loss": 0.0162, "step": 3972 }, { "epoch": 0.81, "learning_rate": 0.00028293394956666203, "loss": 0.0044, "step": 3973 }, { "epoch": 0.81, "learning_rate": 0.0002829249681363543, "loss": 0.047, "step": 3974 }, { "epoch": 0.81, "learning_rate": 0.0002829159844859486, "loss": 0.0164, "step": 3975 }, { "epoch": 0.81, "learning_rate": 0.00028290699861559514, "loss": 0.0094, "step": 3976 }, { "epoch": 0.81, "learning_rate": 0.0002828980105254439, "loss": 0.0345, "step": 3977 }, { "epoch": 0.81, "learning_rate": 0.000282889020215645, "loss": 0.0599, "step": 3978 }, { "epoch": 0.81, "learning_rate": 0.0002828800276863486, "loss": 0.0208, "step": 3979 }, { "epoch": 0.81, "learning_rate": 0.00028287103293770494, "loss": 0.0109, "step": 3980 }, { "epoch": 0.81, "learning_rate": 0.00028286203596986423, "loss": 0.0079, "step": 3981 }, { "epoch": 0.81, "learning_rate": 0.0002828530367829767, "loss": 0.0231, "step": 3982 }, { "epoch": 0.81, "learning_rate": 0.0002828440353771927, "loss": 0.0047, "step": 3983 }, { "epoch": 0.81, "learning_rate": 0.0002828350317526625, "loss": 0.0188, "step": 3984 }, { "epoch": 0.81, "learning_rate": 0.0002828260259095366, "loss": 0.0132, "step": 3985 }, { "epoch": 0.81, "learning_rate": 0.0002828170178479653, "loss": 0.0254, "step": 3986 }, { "epoch": 0.81, "learning_rate": 0.0002828080075680991, "loss": 0.0224, "step": 3987 }, { "epoch": 0.81, "learning_rate": 0.00028279899507008846, "loss": 0.0259, "step": 3988 }, { "epoch": 0.81, "learning_rate": 0.0002827899803540839, "loss": 0.0248, "step": 3989 }, { "epoch": 0.81, "learning_rate": 0.00028278096342023606, "loss": 0.0272, "step": 3990 }, { "epoch": 0.81, "learning_rate": 0.0002827719442686955, "loss": 0.0315, "step": 3991 }, { "epoch": 0.81, "learning_rate": 0.00028276292289961284, "loss": 0.0229, "step": 3992 }, { "epoch": 0.81, "learning_rate": 0.0002827538993131387, "loss": 0.0164, "step": 3993 }, { "epoch": 0.81, "learning_rate": 0.0002827448735094239, "loss": 0.0598, "step": 3994 }, { "epoch": 0.81, "learning_rate": 0.00028273584548861916, "loss": 0.0118, "step": 3995 }, { "epoch": 0.81, "learning_rate": 0.0002827268152508752, "loss": 0.0422, "step": 3996 }, { "epoch": 0.81, "learning_rate": 0.0002827177827963429, "loss": 0.0367, "step": 3997 }, { "epoch": 0.81, "learning_rate": 0.0002827087481251731, "loss": 0.0108, "step": 3998 }, { "epoch": 0.81, "learning_rate": 0.0002826997112375167, "loss": 0.025, "step": 3999 }, { "epoch": 0.81, "learning_rate": 0.00028269067213352466, "loss": 0.0224, "step": 4000 }, { "epoch": 0.81, "learning_rate": 0.0002826816308133479, "loss": 0.0262, "step": 4001 }, { "epoch": 0.81, "learning_rate": 0.00028267258727713744, "loss": 0.0303, "step": 4002 }, { "epoch": 0.82, "learning_rate": 0.00028266354152504437, "loss": 0.0164, "step": 4003 }, { "epoch": 0.82, "learning_rate": 0.00028265449355721975, "loss": 0.0348, "step": 4004 }, { "epoch": 0.82, "learning_rate": 0.0002826454433738146, "loss": 0.0277, "step": 4005 }, { "epoch": 0.82, "learning_rate": 0.00028263639097498026, "loss": 0.0136, "step": 4006 }, { "epoch": 0.82, "learning_rate": 0.00028262733636086774, "loss": 0.0141, "step": 4007 }, { "epoch": 0.82, "learning_rate": 0.00028261827953162836, "loss": 0.0206, "step": 4008 }, { "epoch": 0.82, "learning_rate": 0.0002826092204874134, "loss": 0.0193, "step": 4009 }, { "epoch": 0.82, "learning_rate": 0.0002826001592283742, "loss": 0.0303, "step": 4010 }, { "epoch": 0.82, "learning_rate": 0.00028259109575466196, "loss": 0.0089, "step": 4011 }, { "epoch": 0.82, "learning_rate": 0.00028258203006642816, "loss": 0.0243, "step": 4012 }, { "epoch": 0.82, "learning_rate": 0.0002825729621638242, "loss": 0.0028, "step": 4013 }, { "epoch": 0.82, "learning_rate": 0.00028256389204700153, "loss": 0.0152, "step": 4014 }, { "epoch": 0.82, "learning_rate": 0.0002825548197161116, "loss": 0.0072, "step": 4015 }, { "epoch": 0.82, "learning_rate": 0.00028254574517130594, "loss": 0.0387, "step": 4016 }, { "epoch": 0.82, "learning_rate": 0.0002825366684127362, "loss": 0.0193, "step": 4017 }, { "epoch": 0.82, "learning_rate": 0.0002825275894405539, "loss": 0.0204, "step": 4018 }, { "epoch": 0.82, "learning_rate": 0.0002825185082549107, "loss": 0.0214, "step": 4019 }, { "epoch": 0.82, "learning_rate": 0.00028250942485595826, "loss": 0.0261, "step": 4020 }, { "epoch": 0.82, "learning_rate": 0.00028250033924384827, "loss": 0.0147, "step": 4021 }, { "epoch": 0.82, "learning_rate": 0.00028249125141873257, "loss": 0.0209, "step": 4022 }, { "epoch": 0.82, "learning_rate": 0.0002824821613807628, "loss": 0.0154, "step": 4023 }, { "epoch": 0.82, "learning_rate": 0.00028247306913009086, "loss": 0.015, "step": 4024 }, { "epoch": 0.82, "learning_rate": 0.00028246397466686864, "loss": 0.0202, "step": 4025 }, { "epoch": 0.82, "learning_rate": 0.00028245487799124797, "loss": 0.0097, "step": 4026 }, { "epoch": 0.82, "learning_rate": 0.00028244577910338086, "loss": 0.0133, "step": 4027 }, { "epoch": 0.82, "learning_rate": 0.0002824366780034192, "loss": 0.0084, "step": 4028 }, { "epoch": 0.82, "learning_rate": 0.000282427574691515, "loss": 0.0218, "step": 4029 }, { "epoch": 0.82, "learning_rate": 0.00028241846916782036, "loss": 0.0849, "step": 4030 }, { "epoch": 0.82, "learning_rate": 0.0002824093614324873, "loss": 0.0154, "step": 4031 }, { "epoch": 0.82, "learning_rate": 0.000282400251485668, "loss": 0.0192, "step": 4032 }, { "epoch": 0.82, "learning_rate": 0.0002823911393275146, "loss": 0.0203, "step": 4033 }, { "epoch": 0.82, "learning_rate": 0.0002823820249581792, "loss": 0.0586, "step": 4034 }, { "epoch": 0.82, "learning_rate": 0.00028237290837781413, "loss": 0.025, "step": 4035 }, { "epoch": 0.82, "learning_rate": 0.0002823637895865716, "loss": 0.0154, "step": 4036 }, { "epoch": 0.82, "learning_rate": 0.000282354668584604, "loss": 0.0294, "step": 4037 }, { "epoch": 0.82, "learning_rate": 0.0002823455453720635, "loss": 0.0245, "step": 4038 }, { "epoch": 0.82, "learning_rate": 0.00028233641994910257, "loss": 0.012, "step": 4039 }, { "epoch": 0.82, "learning_rate": 0.00028232729231587373, "loss": 0.0278, "step": 4040 }, { "epoch": 0.82, "learning_rate": 0.00028231816247252924, "loss": 0.013, "step": 4041 }, { "epoch": 0.82, "learning_rate": 0.0002823090304192217, "loss": 0.0124, "step": 4042 }, { "epoch": 0.82, "learning_rate": 0.0002822998961561036, "loss": 0.0749, "step": 4043 }, { "epoch": 0.82, "learning_rate": 0.00028229075968332746, "loss": 0.006, "step": 4044 }, { "epoch": 0.82, "learning_rate": 0.00028228162100104595, "loss": 0.0252, "step": 4045 }, { "epoch": 0.82, "learning_rate": 0.00028227248010941167, "loss": 0.0256, "step": 4046 }, { "epoch": 0.82, "learning_rate": 0.0002822633370085773, "loss": 0.0183, "step": 4047 }, { "epoch": 0.82, "learning_rate": 0.0002822541916986955, "loss": 0.0164, "step": 4048 }, { "epoch": 0.82, "learning_rate": 0.0002822450441799191, "loss": 0.0151, "step": 4049 }, { "epoch": 0.82, "learning_rate": 0.0002822358944524008, "loss": 0.0232, "step": 4050 }, { "epoch": 0.82, "learning_rate": 0.0002822267425162934, "loss": 0.0103, "step": 4051 }, { "epoch": 0.83, "learning_rate": 0.0002822175883717499, "loss": 0.0248, "step": 4052 }, { "epoch": 0.83, "learning_rate": 0.00028220843201892307, "loss": 0.0259, "step": 4053 }, { "epoch": 0.83, "learning_rate": 0.0002821992734579658, "loss": 0.0105, "step": 4054 }, { "epoch": 0.83, "learning_rate": 0.0002821901126890312, "loss": 0.0118, "step": 4055 }, { "epoch": 0.83, "learning_rate": 0.0002821809497122722, "loss": 0.011, "step": 4056 }, { "epoch": 0.83, "learning_rate": 0.0002821717845278418, "loss": 0.0274, "step": 4057 }, { "epoch": 0.83, "learning_rate": 0.0002821626171358931, "loss": 0.0375, "step": 4058 }, { "epoch": 0.83, "learning_rate": 0.00028215344753657913, "loss": 0.0124, "step": 4059 }, { "epoch": 0.83, "learning_rate": 0.0002821442757300533, "loss": 0.0397, "step": 4060 }, { "epoch": 0.83, "learning_rate": 0.0002821351017164685, "loss": 0.0285, "step": 4061 }, { "epoch": 0.83, "learning_rate": 0.0002821259254959781, "loss": 0.0192, "step": 4062 }, { "epoch": 0.83, "learning_rate": 0.0002821167470687354, "loss": 0.0253, "step": 4063 }, { "epoch": 0.83, "learning_rate": 0.0002821075664348936, "loss": 0.0236, "step": 4064 }, { "epoch": 0.83, "learning_rate": 0.00028209838359460605, "loss": 0.008, "step": 4065 }, { "epoch": 0.83, "learning_rate": 0.0002820891985480262, "loss": 0.009, "step": 4066 }, { "epoch": 0.83, "learning_rate": 0.0002820800112953073, "loss": 0.0191, "step": 4067 }, { "epoch": 0.83, "learning_rate": 0.00028207082183660294, "loss": 0.0194, "step": 4068 }, { "epoch": 0.83, "learning_rate": 0.00028206163017206656, "loss": 0.0419, "step": 4069 }, { "epoch": 0.83, "learning_rate": 0.00028205243630185166, "loss": 0.0108, "step": 4070 }, { "epoch": 0.83, "learning_rate": 0.00028204324022611184, "loss": 0.028, "step": 4071 }, { "epoch": 0.83, "learning_rate": 0.00028203404194500066, "loss": 0.0276, "step": 4072 }, { "epoch": 0.83, "learning_rate": 0.0002820248414586717, "loss": 0.0179, "step": 4073 }, { "epoch": 0.83, "learning_rate": 0.00028201563876727875, "loss": 0.0097, "step": 4074 }, { "epoch": 0.83, "learning_rate": 0.00028200643387097534, "loss": 0.0131, "step": 4075 }, { "epoch": 0.83, "learning_rate": 0.0002819972267699154, "loss": 0.0013, "step": 4076 }, { "epoch": 0.83, "learning_rate": 0.00028198801746425254, "loss": 0.0017, "step": 4077 }, { "epoch": 0.83, "learning_rate": 0.0002819788059541406, "loss": 0.0253, "step": 4078 }, { "epoch": 0.83, "learning_rate": 0.00028196959223973357, "loss": 0.0383, "step": 4079 }, { "epoch": 0.83, "learning_rate": 0.0002819603763211852, "loss": 0.0091, "step": 4080 }, { "epoch": 0.83, "learning_rate": 0.0002819511581986495, "loss": 0.0197, "step": 4081 }, { "epoch": 0.83, "learning_rate": 0.0002819419378722803, "loss": 0.0379, "step": 4082 }, { "epoch": 0.83, "learning_rate": 0.0002819327153422317, "loss": 0.0231, "step": 4083 }, { "epoch": 0.83, "learning_rate": 0.00028192349060865776, "loss": 0.012, "step": 4084 }, { "epoch": 0.83, "learning_rate": 0.0002819142636717125, "loss": 0.0042, "step": 4085 }, { "epoch": 0.83, "learning_rate": 0.00028190503453155, "loss": 0.0295, "step": 4086 }, { "epoch": 0.83, "learning_rate": 0.00028189580318832444, "loss": 0.0058, "step": 4087 }, { "epoch": 0.83, "learning_rate": 0.00028188656964219, "loss": 0.011, "step": 4088 }, { "epoch": 0.83, "learning_rate": 0.0002818773338933009, "loss": 0.0173, "step": 4089 }, { "epoch": 0.83, "learning_rate": 0.00028186809594181136, "loss": 0.0157, "step": 4090 }, { "epoch": 0.83, "learning_rate": 0.00028185885578787574, "loss": 0.0124, "step": 4091 }, { "epoch": 0.83, "learning_rate": 0.0002818496134316483, "loss": 0.0315, "step": 4092 }, { "epoch": 0.83, "learning_rate": 0.0002818403688732834, "loss": 0.0194, "step": 4093 }, { "epoch": 0.83, "learning_rate": 0.00028183112211293556, "loss": 0.0153, "step": 4094 }, { "epoch": 0.83, "learning_rate": 0.000281821873150759, "loss": 0.0209, "step": 4095 }, { "epoch": 0.83, "learning_rate": 0.0002818126219869085, "loss": 0.01, "step": 4096 }, { "epoch": 0.83, "learning_rate": 0.0002818033686215383, "loss": 0.0196, "step": 4097 }, { "epoch": 0.83, "learning_rate": 0.000281794113054803, "loss": 0.0138, "step": 4098 }, { "epoch": 0.83, "learning_rate": 0.0002817848552868573, "loss": 0.0178, "step": 4099 }, { "epoch": 0.83, "learning_rate": 0.0002817755953178558, "loss": 0.0165, "step": 4100 }, { "epoch": 0.84, "learning_rate": 0.00028176633314795304, "loss": 0.0182, "step": 4101 }, { "epoch": 0.84, "learning_rate": 0.0002817570687773038, "loss": 0.0247, "step": 4102 }, { "epoch": 0.84, "learning_rate": 0.0002817478022060628, "loss": 0.0212, "step": 4103 }, { "epoch": 0.84, "learning_rate": 0.00028173853343438484, "loss": 0.0373, "step": 4104 }, { "epoch": 0.84, "learning_rate": 0.00028172926246242466, "loss": 0.0205, "step": 4105 }, { "epoch": 0.84, "learning_rate": 0.00028171998929033714, "loss": 0.0444, "step": 4106 }, { "epoch": 0.84, "learning_rate": 0.0002817107139182772, "loss": 0.0444, "step": 4107 }, { "epoch": 0.84, "learning_rate": 0.0002817014363463997, "loss": 0.0249, "step": 4108 }, { "epoch": 0.84, "learning_rate": 0.00028169215657485963, "loss": 0.0049, "step": 4109 }, { "epoch": 0.84, "learning_rate": 0.0002816828746038119, "loss": 0.0219, "step": 4110 }, { "epoch": 0.84, "learning_rate": 0.00028167359043341166, "loss": 0.008, "step": 4111 }, { "epoch": 0.84, "learning_rate": 0.0002816643040638139, "loss": 0.0312, "step": 4112 }, { "epoch": 0.84, "learning_rate": 0.0002816550154951737, "loss": 0.0211, "step": 4113 }, { "epoch": 0.84, "learning_rate": 0.0002816457247276462, "loss": 0.0267, "step": 4114 }, { "epoch": 0.84, "learning_rate": 0.0002816364317613866, "loss": 0.0213, "step": 4115 }, { "epoch": 0.84, "learning_rate": 0.0002816271365965502, "loss": 0.0055, "step": 4116 }, { "epoch": 0.84, "learning_rate": 0.00028161783923329203, "loss": 0.0214, "step": 4117 }, { "epoch": 0.84, "learning_rate": 0.0002816085396717676, "loss": 0.0419, "step": 4118 }, { "epoch": 0.84, "learning_rate": 0.00028159923791213205, "loss": 0.0207, "step": 4119 }, { "epoch": 0.84, "learning_rate": 0.0002815899339545409, "loss": 0.0343, "step": 4120 }, { "epoch": 0.84, "learning_rate": 0.0002815806277991494, "loss": 0.0211, "step": 4121 }, { "epoch": 0.84, "learning_rate": 0.00028157131944611305, "loss": 0.0167, "step": 4122 }, { "epoch": 0.84, "learning_rate": 0.0002815620088955873, "loss": 0.0325, "step": 4123 }, { "epoch": 0.84, "learning_rate": 0.0002815526961477277, "loss": 0.0426, "step": 4124 }, { "epoch": 0.84, "learning_rate": 0.00028154338120268973, "loss": 0.0224, "step": 4125 }, { "epoch": 0.84, "learning_rate": 0.000281534064060629, "loss": 0.0326, "step": 4126 }, { "epoch": 0.84, "learning_rate": 0.00028152474472170104, "loss": 0.0361, "step": 4127 }, { "epoch": 0.84, "learning_rate": 0.00028151542318606164, "loss": 0.031, "step": 4128 }, { "epoch": 0.84, "learning_rate": 0.0002815060994538664, "loss": 0.0058, "step": 4129 }, { "epoch": 0.84, "learning_rate": 0.0002814967735252711, "loss": 0.032, "step": 4130 }, { "epoch": 0.84, "learning_rate": 0.0002814874454004314, "loss": 0.0211, "step": 4131 }, { "epoch": 0.84, "learning_rate": 0.0002814781150795032, "loss": 0.0348, "step": 4132 }, { "epoch": 0.84, "learning_rate": 0.0002814687825626423, "loss": 0.0245, "step": 4133 }, { "epoch": 0.84, "learning_rate": 0.00028145944785000455, "loss": 0.0394, "step": 4134 }, { "epoch": 0.84, "learning_rate": 0.0002814501109417459, "loss": 0.0169, "step": 4135 }, { "epoch": 0.84, "learning_rate": 0.0002814407718380222, "loss": 0.0191, "step": 4136 }, { "epoch": 0.84, "learning_rate": 0.00028143143053898956, "loss": 0.0145, "step": 4137 }, { "epoch": 0.84, "learning_rate": 0.00028142208704480396, "loss": 0.0202, "step": 4138 }, { "epoch": 0.84, "learning_rate": 0.00028141274135562135, "loss": 0.0491, "step": 4139 }, { "epoch": 0.84, "learning_rate": 0.00028140339347159797, "loss": 0.023, "step": 4140 }, { "epoch": 0.84, "learning_rate": 0.0002813940433928898, "loss": 0.0255, "step": 4141 }, { "epoch": 0.84, "learning_rate": 0.0002813846911196532, "loss": 0.0652, "step": 4142 }, { "epoch": 0.84, "learning_rate": 0.00028137533665204413, "loss": 0.0176, "step": 4143 }, { "epoch": 0.84, "learning_rate": 0.000281365979990219, "loss": 0.011, "step": 4144 }, { "epoch": 0.84, "learning_rate": 0.00028135662113433404, "loss": 0.0282, "step": 4145 }, { "epoch": 0.84, "learning_rate": 0.0002813472600845455, "loss": 0.0226, "step": 4146 }, { "epoch": 0.84, "learning_rate": 0.00028133789684100987, "loss": 0.1191, "step": 4147 }, { "epoch": 0.84, "learning_rate": 0.0002813285314038834, "loss": 0.0241, "step": 4148 }, { "epoch": 0.84, "learning_rate": 0.0002813191637733226, "loss": 0.0443, "step": 4149 }, { "epoch": 0.85, "learning_rate": 0.0002813097939494838, "loss": 0.0242, "step": 4150 }, { "epoch": 0.85, "learning_rate": 0.00028130042193252365, "loss": 0.012, "step": 4151 }, { "epoch": 0.85, "learning_rate": 0.0002812910477225986, "loss": 0.0224, "step": 4152 }, { "epoch": 0.85, "learning_rate": 0.00028128167131986513, "loss": 0.0124, "step": 4153 }, { "epoch": 0.85, "learning_rate": 0.00028127229272448, "loss": 0.0239, "step": 4154 }, { "epoch": 0.85, "learning_rate": 0.0002812629119365998, "loss": 0.0267, "step": 4155 }, { "epoch": 0.85, "learning_rate": 0.0002812535289563812, "loss": 0.0115, "step": 4156 }, { "epoch": 0.85, "learning_rate": 0.0002812441437839809, "loss": 0.0168, "step": 4157 }, { "epoch": 0.85, "learning_rate": 0.0002812347564195557, "loss": 0.0273, "step": 4158 }, { "epoch": 0.85, "learning_rate": 0.0002812253668632622, "loss": 0.0286, "step": 4159 }, { "epoch": 0.85, "learning_rate": 0.0002812159751152575, "loss": 0.0176, "step": 4160 }, { "epoch": 0.85, "learning_rate": 0.0002812065811756983, "loss": 0.0216, "step": 4161 }, { "epoch": 0.85, "learning_rate": 0.00028119718504474153, "loss": 0.0372, "step": 4162 }, { "epoch": 0.85, "learning_rate": 0.0002811877867225441, "loss": 0.0206, "step": 4163 }, { "epoch": 0.85, "learning_rate": 0.000281178386209263, "loss": 0.0267, "step": 4164 }, { "epoch": 0.85, "learning_rate": 0.00028116898350505527, "loss": 0.0209, "step": 4165 }, { "epoch": 0.85, "learning_rate": 0.0002811595786100779, "loss": 0.017, "step": 4166 }, { "epoch": 0.85, "learning_rate": 0.00028115017152448795, "loss": 0.0129, "step": 4167 }, { "epoch": 0.85, "learning_rate": 0.00028114076224844257, "loss": 0.0303, "step": 4168 }, { "epoch": 0.85, "learning_rate": 0.00028113135078209895, "loss": 0.0267, "step": 4169 }, { "epoch": 0.85, "learning_rate": 0.00028112193712561426, "loss": 0.0457, "step": 4170 }, { "epoch": 0.85, "learning_rate": 0.00028111252127914564, "loss": 0.0199, "step": 4171 }, { "epoch": 0.85, "learning_rate": 0.00028110310324285046, "loss": 0.006, "step": 4172 }, { "epoch": 0.85, "learning_rate": 0.000281093683016886, "loss": 0.027, "step": 4173 }, { "epoch": 0.85, "learning_rate": 0.00028108426060140956, "loss": 0.0149, "step": 4174 }, { "epoch": 0.85, "learning_rate": 0.0002810748359965785, "loss": 0.0076, "step": 4175 }, { "epoch": 0.85, "learning_rate": 0.00028106540920255036, "loss": 0.009, "step": 4176 }, { "epoch": 0.85, "learning_rate": 0.0002810559802194824, "loss": 0.0138, "step": 4177 }, { "epoch": 0.85, "learning_rate": 0.0002810465490475321, "loss": 0.0192, "step": 4178 }, { "epoch": 0.85, "learning_rate": 0.0002810371156868572, "loss": 0.0302, "step": 4179 }, { "epoch": 0.85, "learning_rate": 0.0002810276801376151, "loss": 0.0129, "step": 4180 }, { "epoch": 0.85, "learning_rate": 0.00028101824239996334, "loss": 0.0178, "step": 4181 }, { "epoch": 0.85, "learning_rate": 0.0002810088024740597, "loss": 0.0333, "step": 4182 }, { "epoch": 0.85, "learning_rate": 0.0002809993603600617, "loss": 0.0293, "step": 4183 }, { "epoch": 0.85, "learning_rate": 0.00028098991605812713, "loss": 0.014, "step": 4184 }, { "epoch": 0.85, "learning_rate": 0.00028098046956841373, "loss": 0.0117, "step": 4185 }, { "epoch": 0.85, "learning_rate": 0.0002809710208910792, "loss": 0.013, "step": 4186 }, { "epoch": 0.85, "learning_rate": 0.0002809615700262814, "loss": 0.0203, "step": 4187 }, { "epoch": 0.85, "learning_rate": 0.0002809521169741782, "loss": 0.0781, "step": 4188 }, { "epoch": 0.85, "learning_rate": 0.00028094266173492744, "loss": 0.0175, "step": 4189 }, { "epoch": 0.85, "learning_rate": 0.0002809332043086871, "loss": 0.0124, "step": 4190 }, { "epoch": 0.85, "learning_rate": 0.000280923744695615, "loss": 0.0224, "step": 4191 }, { "epoch": 0.85, "learning_rate": 0.00028091428289586933, "loss": 0.0277, "step": 4192 }, { "epoch": 0.85, "learning_rate": 0.0002809048189096079, "loss": 0.0393, "step": 4193 }, { "epoch": 0.85, "learning_rate": 0.000280895352736989, "loss": 0.0142, "step": 4194 }, { "epoch": 0.85, "learning_rate": 0.00028088588437817055, "loss": 0.0035, "step": 4195 }, { "epoch": 0.85, "learning_rate": 0.0002808764138333108, "loss": 0.0271, "step": 4196 }, { "epoch": 0.85, "learning_rate": 0.00028086694110256795, "loss": 0.051, "step": 4197 }, { "epoch": 0.85, "learning_rate": 0.00028085746618610006, "loss": 0.0264, "step": 4198 }, { "epoch": 0.85, "learning_rate": 0.0002808479890840655, "loss": 0.081, "step": 4199 }, { "epoch": 0.86, "learning_rate": 0.00028083850979662256, "loss": 0.0251, "step": 4200 }, { "epoch": 0.86, "learning_rate": 0.00028082902832392954, "loss": 0.017, "step": 4201 }, { "epoch": 0.86, "learning_rate": 0.00028081954466614473, "loss": 0.0162, "step": 4202 }, { "epoch": 0.86, "learning_rate": 0.00028081005882342664, "loss": 0.0195, "step": 4203 }, { "epoch": 0.86, "learning_rate": 0.0002808005707959336, "loss": 0.0197, "step": 4204 }, { "epoch": 0.86, "learning_rate": 0.0002807910805838242, "loss": 0.0288, "step": 4205 }, { "epoch": 0.86, "learning_rate": 0.0002807815881872568, "loss": 0.0332, "step": 4206 }, { "epoch": 0.86, "learning_rate": 0.00028077209360639, "loss": 0.0135, "step": 4207 }, { "epoch": 0.86, "learning_rate": 0.0002807625968413824, "loss": 0.0212, "step": 4208 }, { "epoch": 0.86, "learning_rate": 0.00028075309789239267, "loss": 0.0149, "step": 4209 }, { "epoch": 0.86, "learning_rate": 0.0002807435967595793, "loss": 0.0107, "step": 4210 }, { "epoch": 0.86, "learning_rate": 0.0002807340934431011, "loss": 0.0278, "step": 4211 }, { "epoch": 0.86, "learning_rate": 0.00028072458794311676, "loss": 0.0136, "step": 4212 }, { "epoch": 0.86, "learning_rate": 0.00028071508025978505, "loss": 0.015, "step": 4213 }, { "epoch": 0.86, "learning_rate": 0.00028070557039326476, "loss": 0.0112, "step": 4214 }, { "epoch": 0.86, "learning_rate": 0.0002806960583437147, "loss": 0.0313, "step": 4215 }, { "epoch": 0.86, "learning_rate": 0.00028068654411129377, "loss": 0.0169, "step": 4216 }, { "epoch": 0.86, "learning_rate": 0.00028067702769616086, "loss": 0.0234, "step": 4217 }, { "epoch": 0.86, "learning_rate": 0.0002806675090984749, "loss": 0.0179, "step": 4218 }, { "epoch": 0.86, "learning_rate": 0.00028065798831839497, "loss": 0.0096, "step": 4219 }, { "epoch": 0.86, "learning_rate": 0.0002806484653560799, "loss": 0.0089, "step": 4220 }, { "epoch": 0.86, "learning_rate": 0.00028063894021168893, "loss": 0.0366, "step": 4221 }, { "epoch": 0.86, "learning_rate": 0.000280629412885381, "loss": 0.0379, "step": 4222 }, { "epoch": 0.86, "learning_rate": 0.00028061988337731527, "loss": 0.0228, "step": 4223 }, { "epoch": 0.86, "learning_rate": 0.000280610351687651, "loss": 0.0071, "step": 4224 }, { "epoch": 0.86, "learning_rate": 0.0002806008178165473, "loss": 0.0221, "step": 4225 }, { "epoch": 0.86, "learning_rate": 0.00028059128176416334, "loss": 0.0501, "step": 4226 }, { "epoch": 0.86, "learning_rate": 0.00028058174353065855, "loss": 0.0268, "step": 4227 }, { "epoch": 0.86, "learning_rate": 0.00028057220311619214, "loss": 0.02, "step": 4228 }, { "epoch": 0.86, "learning_rate": 0.0002805626605209234, "loss": 0.0252, "step": 4229 }, { "epoch": 0.86, "learning_rate": 0.00028055311574501184, "loss": 0.0271, "step": 4230 }, { "epoch": 0.86, "learning_rate": 0.0002805435687886168, "loss": 0.0074, "step": 4231 }, { "epoch": 0.86, "learning_rate": 0.0002805340196518977, "loss": 0.0249, "step": 4232 }, { "epoch": 0.86, "learning_rate": 0.0002805244683350141, "loss": 0.0099, "step": 4233 }, { "epoch": 0.86, "learning_rate": 0.00028051491483812555, "loss": 0.0091, "step": 4234 }, { "epoch": 0.86, "learning_rate": 0.0002805053591613915, "loss": 0.0271, "step": 4235 }, { "epoch": 0.86, "learning_rate": 0.0002804958013049716, "loss": 0.0076, "step": 4236 }, { "epoch": 0.86, "learning_rate": 0.0002804862412690255, "loss": 0.0207, "step": 4237 }, { "epoch": 0.86, "learning_rate": 0.0002804766790537129, "loss": 0.049, "step": 4238 }, { "epoch": 0.86, "learning_rate": 0.0002804671146591934, "loss": 0.0363, "step": 4239 }, { "epoch": 0.86, "learning_rate": 0.00028045754808562687, "loss": 0.0218, "step": 4240 }, { "epoch": 0.86, "learning_rate": 0.000280447979333173, "loss": 0.0089, "step": 4241 }, { "epoch": 0.86, "learning_rate": 0.00028043840840199163, "loss": 0.0372, "step": 4242 }, { "epoch": 0.86, "learning_rate": 0.00028042883529224265, "loss": 0.0115, "step": 4243 }, { "epoch": 0.86, "learning_rate": 0.0002804192600040859, "loss": 0.0194, "step": 4244 }, { "epoch": 0.86, "learning_rate": 0.0002804096825376813, "loss": 0.0163, "step": 4245 }, { "epoch": 0.86, "learning_rate": 0.00028040010289318885, "loss": 0.0211, "step": 4246 }, { "epoch": 0.86, "learning_rate": 0.00028039052107076855, "loss": 0.0236, "step": 4247 }, { "epoch": 0.86, "learning_rate": 0.0002803809370705804, "loss": 0.0244, "step": 4248 }, { "epoch": 0.87, "learning_rate": 0.0002803713508927845, "loss": 0.0309, "step": 4249 }, { "epoch": 0.87, "learning_rate": 0.000280361762537541, "loss": 0.0413, "step": 4250 }, { "epoch": 0.87, "learning_rate": 0.00028035217200500994, "loss": 0.0411, "step": 4251 }, { "epoch": 0.87, "learning_rate": 0.00028034257929535154, "loss": 0.0181, "step": 4252 }, { "epoch": 0.87, "learning_rate": 0.00028033298440872603, "loss": 0.0099, "step": 4253 }, { "epoch": 0.87, "learning_rate": 0.00028032338734529366, "loss": 0.0179, "step": 4254 }, { "epoch": 0.87, "learning_rate": 0.00028031378810521474, "loss": 0.0274, "step": 4255 }, { "epoch": 0.87, "learning_rate": 0.00028030418668864956, "loss": 0.0242, "step": 4256 }, { "epoch": 0.87, "learning_rate": 0.00028029458309575847, "loss": 0.0143, "step": 4257 }, { "epoch": 0.87, "learning_rate": 0.00028028497732670194, "loss": 0.046, "step": 4258 }, { "epoch": 0.87, "learning_rate": 0.0002802753693816403, "loss": 0.0166, "step": 4259 }, { "epoch": 0.87, "learning_rate": 0.0002802657592607341, "loss": 0.0369, "step": 4260 }, { "epoch": 0.87, "learning_rate": 0.00028025614696414387, "loss": 0.0302, "step": 4261 }, { "epoch": 0.87, "learning_rate": 0.00028024653249203007, "loss": 0.0247, "step": 4262 }, { "epoch": 0.87, "learning_rate": 0.00028023691584455336, "loss": 0.014, "step": 4263 }, { "epoch": 0.87, "learning_rate": 0.0002802272970218743, "loss": 0.0321, "step": 4264 }, { "epoch": 0.87, "learning_rate": 0.0002802176760241535, "loss": 0.0628, "step": 4265 }, { "epoch": 0.87, "learning_rate": 0.0002802080528515518, "loss": 0.0024, "step": 4266 }, { "epoch": 0.87, "learning_rate": 0.0002801984275042298, "loss": 0.0259, "step": 4267 }, { "epoch": 0.87, "learning_rate": 0.0002801887999823482, "loss": 0.0036, "step": 4268 }, { "epoch": 0.87, "learning_rate": 0.000280179170286068, "loss": 0.0059, "step": 4269 }, { "epoch": 0.87, "learning_rate": 0.0002801695384155499, "loss": 0.0054, "step": 4270 }, { "epoch": 0.87, "learning_rate": 0.0002801599043709548, "loss": 0.023, "step": 4271 }, { "epoch": 0.87, "learning_rate": 0.0002801502681524436, "loss": 0.0287, "step": 4272 }, { "epoch": 0.87, "learning_rate": 0.00028014062976017723, "loss": 0.0082, "step": 4273 }, { "epoch": 0.87, "learning_rate": 0.0002801309891943167, "loss": 0.0307, "step": 4274 }, { "epoch": 0.87, "learning_rate": 0.000280121346455023, "loss": 0.0417, "step": 4275 }, { "epoch": 0.87, "learning_rate": 0.0002801117015424572, "loss": 0.0122, "step": 4276 }, { "epoch": 0.87, "learning_rate": 0.0002801020544567804, "loss": 0.0077, "step": 4277 }, { "epoch": 0.87, "learning_rate": 0.0002800924051981537, "loss": 0.0418, "step": 4278 }, { "epoch": 0.87, "learning_rate": 0.00028008275376673823, "loss": 0.0423, "step": 4279 }, { "epoch": 0.87, "learning_rate": 0.0002800731001626953, "loss": 0.0217, "step": 4280 }, { "epoch": 0.87, "learning_rate": 0.000280063444386186, "loss": 0.0542, "step": 4281 }, { "epoch": 0.87, "learning_rate": 0.0002800537864373716, "loss": 0.0103, "step": 4282 }, { "epoch": 0.87, "learning_rate": 0.0002800441263164136, "loss": 0.0717, "step": 4283 }, { "epoch": 0.87, "learning_rate": 0.0002800344640234732, "loss": 0.0219, "step": 4284 }, { "epoch": 0.87, "learning_rate": 0.0002800247995587117, "loss": 0.0061, "step": 4285 }, { "epoch": 0.87, "learning_rate": 0.0002800151329222907, "loss": 0.0123, "step": 4286 }, { "epoch": 0.87, "learning_rate": 0.0002800054641143715, "loss": 0.0372, "step": 4287 }, { "epoch": 0.87, "learning_rate": 0.00027999579313511564, "loss": 0.02, "step": 4288 }, { "epoch": 0.87, "learning_rate": 0.00027998611998468476, "loss": 0.0194, "step": 4289 }, { "epoch": 0.87, "learning_rate": 0.0002799764446632402, "loss": 0.0457, "step": 4290 }, { "epoch": 0.87, "learning_rate": 0.00027996676717094367, "loss": 0.03, "step": 4291 }, { "epoch": 0.87, "learning_rate": 0.00027995708750795683, "loss": 0.0322, "step": 4292 }, { "epoch": 0.87, "learning_rate": 0.0002799474056744413, "loss": 0.0174, "step": 4293 }, { "epoch": 0.87, "learning_rate": 0.0002799377216705589, "loss": 0.0253, "step": 4294 }, { "epoch": 0.87, "learning_rate": 0.00027992803549647114, "loss": 0.0389, "step": 4295 }, { "epoch": 0.87, "learning_rate": 0.00027991834715234, "loss": 0.0044, "step": 4296 }, { "epoch": 0.87, "learning_rate": 0.0002799086566383272, "loss": 0.0212, "step": 4297 }, { "epoch": 0.88, "learning_rate": 0.00027989896395459464, "loss": 0.0133, "step": 4298 }, { "epoch": 0.88, "learning_rate": 0.00027988926910130414, "loss": 0.0304, "step": 4299 }, { "epoch": 0.88, "learning_rate": 0.0002798795720786177, "loss": 0.011, "step": 4300 }, { "epoch": 0.88, "learning_rate": 0.0002798698728866972, "loss": 0.0131, "step": 4301 }, { "epoch": 0.88, "learning_rate": 0.0002798601715257047, "loss": 0.0443, "step": 4302 }, { "epoch": 0.88, "learning_rate": 0.00027985046799580227, "loss": 0.0157, "step": 4303 }, { "epoch": 0.88, "learning_rate": 0.0002798407622971518, "loss": 0.0377, "step": 4304 }, { "epoch": 0.88, "learning_rate": 0.00027983105442991557, "loss": 0.0067, "step": 4305 }, { "epoch": 0.88, "learning_rate": 0.00027982134439425566, "loss": 0.0148, "step": 4306 }, { "epoch": 0.88, "learning_rate": 0.00027981163219033424, "loss": 0.0119, "step": 4307 }, { "epoch": 0.88, "learning_rate": 0.00027980191781831347, "loss": 0.0279, "step": 4308 }, { "epoch": 0.88, "learning_rate": 0.00027979220127835575, "loss": 0.0261, "step": 4309 }, { "epoch": 0.88, "learning_rate": 0.00027978248257062323, "loss": 0.0209, "step": 4310 }, { "epoch": 0.88, "learning_rate": 0.0002797727616952782, "loss": 0.034, "step": 4311 }, { "epoch": 0.88, "learning_rate": 0.00027976303865248316, "loss": 0.033, "step": 4312 }, { "epoch": 0.88, "learning_rate": 0.00027975331344240044, "loss": 0.0266, "step": 4313 }, { "epoch": 0.88, "learning_rate": 0.0002797435860651924, "loss": 0.0198, "step": 4314 }, { "epoch": 0.88, "learning_rate": 0.0002797338565210216, "loss": 0.01, "step": 4315 }, { "epoch": 0.88, "learning_rate": 0.00027972412481005055, "loss": 0.0147, "step": 4316 }, { "epoch": 0.88, "learning_rate": 0.00027971439093244166, "loss": 0.0249, "step": 4317 }, { "epoch": 0.88, "learning_rate": 0.00027970465488835766, "loss": 0.0226, "step": 4318 }, { "epoch": 0.88, "learning_rate": 0.00027969491667796106, "loss": 0.0392, "step": 4319 }, { "epoch": 0.88, "learning_rate": 0.0002796851763014145, "loss": 0.0215, "step": 4320 }, { "epoch": 0.88, "learning_rate": 0.0002796754337588807, "loss": 0.027, "step": 4321 }, { "epoch": 0.88, "learning_rate": 0.00027966568905052244, "loss": 0.0152, "step": 4322 }, { "epoch": 0.88, "learning_rate": 0.00027965594217650236, "loss": 0.021, "step": 4323 }, { "epoch": 0.88, "learning_rate": 0.00027964619313698333, "loss": 0.0106, "step": 4324 }, { "epoch": 0.88, "learning_rate": 0.00027963644193212814, "loss": 0.0159, "step": 4325 }, { "epoch": 0.88, "learning_rate": 0.00027962668856209964, "loss": 0.0098, "step": 4326 }, { "epoch": 0.88, "learning_rate": 0.0002796169330270608, "loss": 0.015, "step": 4327 }, { "epoch": 0.88, "learning_rate": 0.00027960717532717446, "loss": 0.0293, "step": 4328 }, { "epoch": 0.88, "learning_rate": 0.00027959741546260364, "loss": 0.0616, "step": 4329 }, { "epoch": 0.88, "learning_rate": 0.0002795876534335114, "loss": 0.0168, "step": 4330 }, { "epoch": 0.88, "learning_rate": 0.00027957788924006075, "loss": 0.0165, "step": 4331 }, { "epoch": 0.88, "learning_rate": 0.00027956812288241464, "loss": 0.0233, "step": 4332 }, { "epoch": 0.88, "learning_rate": 0.0002795583543607364, "loss": 0.0109, "step": 4333 }, { "epoch": 0.88, "learning_rate": 0.0002795485836751891, "loss": 0.0184, "step": 4334 }, { "epoch": 0.88, "learning_rate": 0.0002795388108259358, "loss": 0.0398, "step": 4335 }, { "epoch": 0.88, "learning_rate": 0.00027952903581313993, "loss": 0.0244, "step": 4336 }, { "epoch": 0.88, "learning_rate": 0.00027951925863696465, "loss": 0.012, "step": 4337 }, { "epoch": 0.88, "learning_rate": 0.00027950947929757325, "loss": 0.0229, "step": 4338 }, { "epoch": 0.88, "learning_rate": 0.0002794996977951291, "loss": 0.0255, "step": 4339 }, { "epoch": 0.88, "learning_rate": 0.00027948991412979547, "loss": 0.0178, "step": 4340 }, { "epoch": 0.88, "learning_rate": 0.00027948012830173596, "loss": 0.0193, "step": 4341 }, { "epoch": 0.88, "learning_rate": 0.0002794703403111138, "loss": 0.0205, "step": 4342 }, { "epoch": 0.88, "learning_rate": 0.0002794605501580926, "loss": 0.0141, "step": 4343 }, { "epoch": 0.88, "learning_rate": 0.00027945075784283584, "loss": 0.0203, "step": 4344 }, { "epoch": 0.88, "learning_rate": 0.0002794409633655071, "loss": 0.0246, "step": 4345 }, { "epoch": 0.88, "learning_rate": 0.0002794311667262699, "loss": 0.0162, "step": 4346 }, { "epoch": 0.89, "learning_rate": 0.0002794213679252879, "loss": 0.0956, "step": 4347 }, { "epoch": 0.89, "learning_rate": 0.00027941156696272473, "loss": 0.0221, "step": 4348 }, { "epoch": 0.89, "learning_rate": 0.0002794017638387442, "loss": 0.0212, "step": 4349 }, { "epoch": 0.89, "learning_rate": 0.0002793919585535099, "loss": 0.0348, "step": 4350 }, { "epoch": 0.89, "learning_rate": 0.0002793821511071856, "loss": 0.0221, "step": 4351 }, { "epoch": 0.89, "learning_rate": 0.0002793723414999352, "loss": 0.0068, "step": 4352 }, { "epoch": 0.89, "learning_rate": 0.00027936252973192246, "loss": 0.0098, "step": 4353 }, { "epoch": 0.89, "learning_rate": 0.0002793527158033113, "loss": 0.0065, "step": 4354 }, { "epoch": 0.89, "learning_rate": 0.0002793428997142656, "loss": 0.0197, "step": 4355 }, { "epoch": 0.89, "learning_rate": 0.0002793330814649493, "loss": 0.0418, "step": 4356 }, { "epoch": 0.89, "learning_rate": 0.0002793232610555265, "loss": 0.02, "step": 4357 }, { "epoch": 0.89, "learning_rate": 0.00027931343848616106, "loss": 0.0152, "step": 4358 }, { "epoch": 0.89, "learning_rate": 0.0002793036137570171, "loss": 0.0211, "step": 4359 }, { "epoch": 0.89, "learning_rate": 0.0002792937868682587, "loss": 0.0073, "step": 4360 }, { "epoch": 0.89, "learning_rate": 0.00027928395782005007, "loss": 0.0122, "step": 4361 }, { "epoch": 0.89, "learning_rate": 0.0002792741266125553, "loss": 0.0126, "step": 4362 }, { "epoch": 0.89, "learning_rate": 0.0002792642932459385, "loss": 0.0273, "step": 4363 }, { "epoch": 0.89, "learning_rate": 0.00027925445772036405, "loss": 0.0097, "step": 4364 }, { "epoch": 0.89, "learning_rate": 0.0002792446200359962, "loss": 0.0211, "step": 4365 }, { "epoch": 0.89, "learning_rate": 0.0002792347801929992, "loss": 0.055, "step": 4366 }, { "epoch": 0.89, "learning_rate": 0.0002792249381915374, "loss": 0.0314, "step": 4367 }, { "epoch": 0.89, "learning_rate": 0.0002792150940317752, "loss": 0.01, "step": 4368 }, { "epoch": 0.89, "learning_rate": 0.00027920524771387706, "loss": 0.0241, "step": 4369 }, { "epoch": 0.89, "learning_rate": 0.00027919539923800733, "loss": 0.0129, "step": 4370 }, { "epoch": 0.89, "learning_rate": 0.00027918554860433063, "loss": 0.035, "step": 4371 }, { "epoch": 0.89, "learning_rate": 0.00027917569581301137, "loss": 0.035, "step": 4372 }, { "epoch": 0.89, "learning_rate": 0.0002791658408642142, "loss": 0.0572, "step": 4373 }, { "epoch": 0.89, "learning_rate": 0.00027915598375810363, "loss": 0.0179, "step": 4374 }, { "epoch": 0.89, "learning_rate": 0.00027914612449484437, "loss": 0.0293, "step": 4375 }, { "epoch": 0.89, "learning_rate": 0.00027913626307460104, "loss": 0.0139, "step": 4376 }, { "epoch": 0.89, "learning_rate": 0.0002791263994975383, "loss": 0.011, "step": 4377 }, { "epoch": 0.89, "learning_rate": 0.000279116533763821, "loss": 0.0374, "step": 4378 }, { "epoch": 0.89, "learning_rate": 0.00027910666587361384, "loss": 0.0228, "step": 4379 }, { "epoch": 0.89, "learning_rate": 0.00027909679582708164, "loss": 0.0273, "step": 4380 }, { "epoch": 0.89, "learning_rate": 0.00027908692362438927, "loss": 0.0135, "step": 4381 }, { "epoch": 0.89, "learning_rate": 0.0002790770492657016, "loss": 0.0116, "step": 4382 }, { "epoch": 0.89, "learning_rate": 0.0002790671727511836, "loss": 0.0388, "step": 4383 }, { "epoch": 0.89, "learning_rate": 0.00027905729408100015, "loss": 0.0385, "step": 4384 }, { "epoch": 0.89, "learning_rate": 0.0002790474132553163, "loss": 0.0267, "step": 4385 }, { "epoch": 0.89, "learning_rate": 0.000279037530274297, "loss": 0.0051, "step": 4386 }, { "epoch": 0.89, "learning_rate": 0.00027902764513810743, "loss": 0.0281, "step": 4387 }, { "epoch": 0.89, "learning_rate": 0.0002790177578469126, "loss": 0.0311, "step": 4388 }, { "epoch": 0.89, "learning_rate": 0.0002790078684008777, "loss": 0.0287, "step": 4389 }, { "epoch": 0.89, "learning_rate": 0.00027899797680016784, "loss": 0.021, "step": 4390 }, { "epoch": 0.89, "learning_rate": 0.0002789880830449483, "loss": 0.0853, "step": 4391 }, { "epoch": 0.89, "learning_rate": 0.00027897818713538427, "loss": 0.021, "step": 4392 }, { "epoch": 0.89, "learning_rate": 0.000278968289071641, "loss": 0.0052, "step": 4393 }, { "epoch": 0.89, "learning_rate": 0.000278958388853884, "loss": 0.0196, "step": 4394 }, { "epoch": 0.89, "learning_rate": 0.00027894848648227834, "loss": 0.0101, "step": 4395 }, { "epoch": 0.9, "learning_rate": 0.0002789385819569896, "loss": 0.0099, "step": 4396 }, { "epoch": 0.9, "learning_rate": 0.0002789286752781832, "loss": 0.0166, "step": 4397 }, { "epoch": 0.9, "learning_rate": 0.0002789187664460245, "loss": 0.0429, "step": 4398 }, { "epoch": 0.9, "learning_rate": 0.00027890885546067904, "loss": 0.0144, "step": 4399 }, { "epoch": 0.9, "learning_rate": 0.0002788989423223124, "loss": 0.0109, "step": 4400 }, { "epoch": 0.9, "learning_rate": 0.0002788890270310901, "loss": 0.043, "step": 4401 }, { "epoch": 0.9, "learning_rate": 0.0002788791095871777, "loss": 0.0557, "step": 4402 }, { "epoch": 0.9, "learning_rate": 0.00027886918999074097, "loss": 0.0194, "step": 4403 }, { "epoch": 0.9, "learning_rate": 0.00027885926824194543, "loss": 0.0256, "step": 4404 }, { "epoch": 0.9, "learning_rate": 0.0002788493443409569, "loss": 0.0251, "step": 4405 }, { "epoch": 0.9, "learning_rate": 0.0002788394182879412, "loss": 0.0021, "step": 4406 }, { "epoch": 0.9, "learning_rate": 0.0002788294900830639, "loss": 0.0323, "step": 4407 }, { "epoch": 0.9, "learning_rate": 0.00027881955972649093, "loss": 0.0068, "step": 4408 }, { "epoch": 0.9, "learning_rate": 0.0002788096272183882, "loss": 0.0097, "step": 4409 }, { "epoch": 0.9, "learning_rate": 0.0002787996925589215, "loss": 0.0115, "step": 4410 }, { "epoch": 0.9, "learning_rate": 0.0002787897557482569, "loss": 0.0194, "step": 4411 }, { "epoch": 0.9, "learning_rate": 0.00027877981678656015, "loss": 0.0058, "step": 4412 }, { "epoch": 0.9, "learning_rate": 0.00027876987567399745, "loss": 0.0216, "step": 4413 }, { "epoch": 0.9, "learning_rate": 0.00027875993241073473, "loss": 0.0081, "step": 4414 }, { "epoch": 0.9, "learning_rate": 0.0002787499869969381, "loss": 0.0062, "step": 4415 }, { "epoch": 0.9, "learning_rate": 0.00027874003943277365, "loss": 0.0177, "step": 4416 }, { "epoch": 0.9, "learning_rate": 0.0002787300897184075, "loss": 0.0222, "step": 4417 }, { "epoch": 0.9, "learning_rate": 0.00027872013785400587, "loss": 0.0937, "step": 4418 }, { "epoch": 0.9, "learning_rate": 0.000278710183839735, "loss": 0.0638, "step": 4419 }, { "epoch": 0.9, "learning_rate": 0.00027870022767576105, "loss": 0.0145, "step": 4420 }, { "epoch": 0.9, "learning_rate": 0.0002786902693622504, "loss": 0.0113, "step": 4421 }, { "epoch": 0.9, "learning_rate": 0.00027868030889936925, "loss": 0.0103, "step": 4422 }, { "epoch": 0.9, "learning_rate": 0.0002786703462872842, "loss": 0.0084, "step": 4423 }, { "epoch": 0.9, "learning_rate": 0.0002786603815261613, "loss": 0.0265, "step": 4424 }, { "epoch": 0.9, "learning_rate": 0.00027865041461616727, "loss": 0.0221, "step": 4425 }, { "epoch": 0.9, "learning_rate": 0.0002786404455574685, "loss": 0.0076, "step": 4426 }, { "epoch": 0.9, "learning_rate": 0.0002786304743502314, "loss": 0.0603, "step": 4427 }, { "epoch": 0.9, "learning_rate": 0.00027862050099462256, "loss": 0.0286, "step": 4428 }, { "epoch": 0.9, "learning_rate": 0.0002786105254908086, "loss": 0.0102, "step": 4429 }, { "epoch": 0.9, "learning_rate": 0.0002786005478389561, "loss": 0.0166, "step": 4430 }, { "epoch": 0.9, "learning_rate": 0.0002785905680392317, "loss": 0.0087, "step": 4431 }, { "epoch": 0.9, "learning_rate": 0.00027858058609180205, "loss": 0.0108, "step": 4432 }, { "epoch": 0.9, "learning_rate": 0.0002785706019968339, "loss": 0.0646, "step": 4433 }, { "epoch": 0.9, "learning_rate": 0.00027856061575449407, "loss": 0.0145, "step": 4434 }, { "epoch": 0.9, "learning_rate": 0.0002785506273649492, "loss": 0.0373, "step": 4435 }, { "epoch": 0.9, "learning_rate": 0.00027854063682836627, "loss": 0.012, "step": 4436 }, { "epoch": 0.9, "learning_rate": 0.00027853064414491203, "loss": 0.0449, "step": 4437 }, { "epoch": 0.9, "learning_rate": 0.00027852064931475337, "loss": 0.0249, "step": 4438 }, { "epoch": 0.9, "learning_rate": 0.0002785106523380573, "loss": 0.0052, "step": 4439 }, { "epoch": 0.9, "learning_rate": 0.00027850065321499077, "loss": 0.0433, "step": 4440 }, { "epoch": 0.9, "learning_rate": 0.00027849065194572077, "loss": 0.0385, "step": 4441 }, { "epoch": 0.9, "learning_rate": 0.0002784806485304143, "loss": 0.0164, "step": 4442 }, { "epoch": 0.9, "learning_rate": 0.0002784706429692385, "loss": 0.0101, "step": 4443 }, { "epoch": 0.9, "learning_rate": 0.0002784606352623605, "loss": 0.0162, "step": 4444 }, { "epoch": 0.91, "learning_rate": 0.0002784506254099474, "loss": 0.04, "step": 4445 }, { "epoch": 0.91, "learning_rate": 0.00027844061341216635, "loss": 0.0279, "step": 4446 }, { "epoch": 0.91, "learning_rate": 0.00027843059926918454, "loss": 0.0365, "step": 4447 }, { "epoch": 0.91, "learning_rate": 0.00027842058298116945, "loss": 0.0285, "step": 4448 }, { "epoch": 0.91, "learning_rate": 0.0002784105645482881, "loss": 0.0172, "step": 4449 }, { "epoch": 0.91, "learning_rate": 0.000278400543970708, "loss": 0.0193, "step": 4450 }, { "epoch": 0.91, "learning_rate": 0.00027839052124859637, "loss": 0.0165, "step": 4451 }, { "epoch": 0.91, "learning_rate": 0.0002783804963821207, "loss": 0.0337, "step": 4452 }, { "epoch": 0.91, "learning_rate": 0.0002783704693714484, "loss": 0.0424, "step": 4453 }, { "epoch": 0.91, "learning_rate": 0.00027836044021674696, "loss": 0.0306, "step": 4454 }, { "epoch": 0.91, "learning_rate": 0.0002783504089181839, "loss": 0.0152, "step": 4455 }, { "epoch": 0.91, "learning_rate": 0.0002783403754759267, "loss": 0.0556, "step": 4456 }, { "epoch": 0.91, "learning_rate": 0.00027833033989014297, "loss": 0.0271, "step": 4457 }, { "epoch": 0.91, "learning_rate": 0.0002783203021610003, "loss": 0.0207, "step": 4458 }, { "epoch": 0.91, "learning_rate": 0.0002783102622886664, "loss": 0.0124, "step": 4459 }, { "epoch": 0.91, "learning_rate": 0.0002783002202733089, "loss": 0.0283, "step": 4460 }, { "epoch": 0.91, "learning_rate": 0.00027829017611509554, "loss": 0.0179, "step": 4461 }, { "epoch": 0.91, "learning_rate": 0.0002782801298141941, "loss": 0.0057, "step": 4462 }, { "epoch": 0.91, "learning_rate": 0.0002782700813707723, "loss": 0.0131, "step": 4463 }, { "epoch": 0.91, "learning_rate": 0.00027826003078499804, "loss": 0.0493, "step": 4464 }, { "epoch": 0.91, "learning_rate": 0.00027824997805703917, "loss": 0.0481, "step": 4465 }, { "epoch": 0.91, "learning_rate": 0.0002782399231870636, "loss": 0.021, "step": 4466 }, { "epoch": 0.91, "learning_rate": 0.0002782298661752392, "loss": 0.0188, "step": 4467 }, { "epoch": 0.91, "learning_rate": 0.00027821980702173396, "loss": 0.0262, "step": 4468 }, { "epoch": 0.91, "learning_rate": 0.00027820974572671597, "loss": 0.0149, "step": 4469 }, { "epoch": 0.91, "learning_rate": 0.0002781996822903532, "loss": 0.0121, "step": 4470 }, { "epoch": 0.91, "learning_rate": 0.0002781896167128137, "loss": 0.0348, "step": 4471 }, { "epoch": 0.91, "learning_rate": 0.0002781795489942656, "loss": 0.035, "step": 4472 }, { "epoch": 0.91, "learning_rate": 0.00027816947913487716, "loss": 0.0303, "step": 4473 }, { "epoch": 0.91, "learning_rate": 0.0002781594071348164, "loss": 0.0171, "step": 4474 }, { "epoch": 0.91, "learning_rate": 0.00027814933299425174, "loss": 0.0268, "step": 4475 }, { "epoch": 0.91, "learning_rate": 0.00027813925671335126, "loss": 0.0114, "step": 4476 }, { "epoch": 0.91, "learning_rate": 0.00027812917829228334, "loss": 0.025, "step": 4477 }, { "epoch": 0.91, "learning_rate": 0.0002781190977312162, "loss": 0.0241, "step": 4478 }, { "epoch": 0.91, "learning_rate": 0.0002781090150303183, "loss": 0.0336, "step": 4479 }, { "epoch": 0.91, "learning_rate": 0.00027809893018975807, "loss": 0.0142, "step": 4480 }, { "epoch": 0.91, "learning_rate": 0.0002780888432097039, "loss": 0.005, "step": 4481 }, { "epoch": 0.91, "learning_rate": 0.00027807875409032427, "loss": 0.0259, "step": 4482 }, { "epoch": 0.91, "learning_rate": 0.00027806866283178763, "loss": 0.0377, "step": 4483 }, { "epoch": 0.91, "learning_rate": 0.0002780585694342627, "loss": 0.0074, "step": 4484 }, { "epoch": 0.91, "learning_rate": 0.0002780484738979178, "loss": 0.0172, "step": 4485 }, { "epoch": 0.91, "learning_rate": 0.0002780383762229217, "loss": 0.011, "step": 4486 }, { "epoch": 0.91, "learning_rate": 0.00027802827640944307, "loss": 0.0127, "step": 4487 }, { "epoch": 0.91, "learning_rate": 0.0002780181744576505, "loss": 0.025, "step": 4488 }, { "epoch": 0.91, "learning_rate": 0.0002780080703677128, "loss": 0.016, "step": 4489 }, { "epoch": 0.91, "learning_rate": 0.0002779979641397987, "loss": 0.0146, "step": 4490 }, { "epoch": 0.91, "learning_rate": 0.000277987855774077, "loss": 0.0158, "step": 4491 }, { "epoch": 0.91, "learning_rate": 0.00027797774527071645, "loss": 0.0198, "step": 4492 }, { "epoch": 0.91, "learning_rate": 0.000277967632629886, "loss": 0.0166, "step": 4493 }, { "epoch": 0.92, "learning_rate": 0.00027795751785175454, "loss": 0.0104, "step": 4494 }, { "epoch": 0.92, "learning_rate": 0.00027794740093649105, "loss": 0.0244, "step": 4495 }, { "epoch": 0.92, "learning_rate": 0.0002779372818842644, "loss": 0.0302, "step": 4496 }, { "epoch": 0.92, "learning_rate": 0.00027792716069524365, "loss": 0.0323, "step": 4497 }, { "epoch": 0.92, "learning_rate": 0.0002779170373695978, "loss": 0.015, "step": 4498 }, { "epoch": 0.92, "learning_rate": 0.000277906911907496, "loss": 0.0178, "step": 4499 }, { "epoch": 0.92, "learning_rate": 0.0002778967843091073, "loss": 0.0138, "step": 4500 }, { "epoch": 0.92, "learning_rate": 0.00027788665457460093, "loss": 0.0153, "step": 4501 }, { "epoch": 0.92, "learning_rate": 0.000277876522704146, "loss": 0.0122, "step": 4502 }, { "epoch": 0.92, "learning_rate": 0.00027786638869791173, "loss": 0.0114, "step": 4503 }, { "epoch": 0.92, "learning_rate": 0.00027785625255606747, "loss": 0.0491, "step": 4504 }, { "epoch": 0.92, "learning_rate": 0.00027784611427878234, "loss": 0.0269, "step": 4505 }, { "epoch": 0.92, "learning_rate": 0.0002778359738662259, "loss": 0.0197, "step": 4506 }, { "epoch": 0.92, "learning_rate": 0.0002778258313185673, "loss": 0.0157, "step": 4507 }, { "epoch": 0.92, "learning_rate": 0.00027781568663597605, "loss": 0.0361, "step": 4508 }, { "epoch": 0.92, "learning_rate": 0.0002778055398186216, "loss": 0.0097, "step": 4509 }, { "epoch": 0.92, "learning_rate": 0.00027779539086667334, "loss": 0.003, "step": 4510 }, { "epoch": 0.92, "learning_rate": 0.0002777852397803008, "loss": 0.014, "step": 4511 }, { "epoch": 0.92, "learning_rate": 0.0002777750865596736, "loss": 0.0348, "step": 4512 }, { "epoch": 0.92, "learning_rate": 0.00027776493120496124, "loss": 0.0081, "step": 4513 }, { "epoch": 0.92, "learning_rate": 0.00027775477371633336, "loss": 0.0743, "step": 4514 }, { "epoch": 0.92, "learning_rate": 0.0002777446140939596, "loss": 0.0329, "step": 4515 }, { "epoch": 0.92, "learning_rate": 0.0002777344523380097, "loss": 0.014, "step": 4516 }, { "epoch": 0.92, "learning_rate": 0.0002777242884486533, "loss": 0.0141, "step": 4517 }, { "epoch": 0.92, "learning_rate": 0.00027771412242606015, "loss": 0.0084, "step": 4518 }, { "epoch": 0.92, "learning_rate": 0.0002777039542704001, "loss": 0.0094, "step": 4519 }, { "epoch": 0.92, "learning_rate": 0.00027769378398184296, "loss": 0.0187, "step": 4520 }, { "epoch": 0.92, "learning_rate": 0.0002776836115605586, "loss": 0.0284, "step": 4521 }, { "epoch": 0.92, "learning_rate": 0.0002776734370067169, "loss": 0.0395, "step": 4522 }, { "epoch": 0.92, "learning_rate": 0.00027766326032048776, "loss": 0.0372, "step": 4523 }, { "epoch": 0.92, "learning_rate": 0.0002776530815020412, "loss": 0.0852, "step": 4524 }, { "epoch": 0.92, "learning_rate": 0.00027764290055154727, "loss": 0.0159, "step": 4525 }, { "epoch": 0.92, "learning_rate": 0.0002776327174691759, "loss": 0.0075, "step": 4526 }, { "epoch": 0.92, "learning_rate": 0.00027762253225509725, "loss": 0.0199, "step": 4527 }, { "epoch": 0.92, "learning_rate": 0.0002776123449094814, "loss": 0.0251, "step": 4528 }, { "epoch": 0.92, "learning_rate": 0.0002776021554324985, "loss": 0.0191, "step": 4529 }, { "epoch": 0.92, "learning_rate": 0.00027759196382431874, "loss": 0.0201, "step": 4530 }, { "epoch": 0.92, "learning_rate": 0.0002775817700851124, "loss": 0.0254, "step": 4531 }, { "epoch": 0.92, "learning_rate": 0.0002775715742150496, "loss": 0.0223, "step": 4532 }, { "epoch": 0.92, "learning_rate": 0.0002775613762143007, "loss": 0.0306, "step": 4533 }, { "epoch": 0.92, "learning_rate": 0.0002775511760830361, "loss": 0.0162, "step": 4534 }, { "epoch": 0.92, "learning_rate": 0.000277540973821426, "loss": 0.0066, "step": 4535 }, { "epoch": 0.92, "learning_rate": 0.00027753076942964094, "loss": 0.0172, "step": 4536 }, { "epoch": 0.92, "learning_rate": 0.00027752056290785126, "loss": 0.0381, "step": 4537 }, { "epoch": 0.92, "learning_rate": 0.0002775103542562275, "loss": 0.0139, "step": 4538 }, { "epoch": 0.92, "learning_rate": 0.0002775001434749401, "loss": 0.0127, "step": 4539 }, { "epoch": 0.92, "learning_rate": 0.0002774899305641597, "loss": 0.0112, "step": 4540 }, { "epoch": 0.92, "learning_rate": 0.00027747971552405674, "loss": 0.0262, "step": 4541 }, { "epoch": 0.92, "learning_rate": 0.0002774694983548019, "loss": 0.0304, "step": 4542 }, { "epoch": 0.93, "learning_rate": 0.00027745927905656586, "loss": 0.0311, "step": 4543 }, { "epoch": 0.93, "learning_rate": 0.0002774490576295192, "loss": 0.031, "step": 4544 }, { "epoch": 0.93, "learning_rate": 0.0002774388340738328, "loss": 0.0237, "step": 4545 }, { "epoch": 0.93, "learning_rate": 0.0002774286083896772, "loss": 0.0748, "step": 4546 }, { "epoch": 0.93, "learning_rate": 0.00027741838057722336, "loss": 0.0187, "step": 4547 }, { "epoch": 0.93, "learning_rate": 0.0002774081506366421, "loss": 0.0261, "step": 4548 }, { "epoch": 0.93, "learning_rate": 0.00027739791856810415, "loss": 0.0382, "step": 4549 }, { "epoch": 0.93, "learning_rate": 0.00027738768437178047, "loss": 0.0264, "step": 4550 }, { "epoch": 0.93, "learning_rate": 0.00027737744804784203, "loss": 0.0353, "step": 4551 }, { "epoch": 0.93, "learning_rate": 0.00027736720959645975, "loss": 0.0237, "step": 4552 }, { "epoch": 0.93, "learning_rate": 0.00027735696901780467, "loss": 0.0065, "step": 4553 }, { "epoch": 0.93, "learning_rate": 0.00027734672631204776, "loss": 0.0282, "step": 4554 }, { "epoch": 0.93, "learning_rate": 0.00027733648147936017, "loss": 0.0083, "step": 4555 }, { "epoch": 0.93, "learning_rate": 0.000277326234519913, "loss": 0.0347, "step": 4556 }, { "epoch": 0.93, "learning_rate": 0.00027731598543387733, "loss": 0.0259, "step": 4557 }, { "epoch": 0.93, "learning_rate": 0.00027730573422142437, "loss": 0.0566, "step": 4558 }, { "epoch": 0.93, "learning_rate": 0.00027729548088272534, "loss": 0.0155, "step": 4559 }, { "epoch": 0.93, "learning_rate": 0.00027728522541795156, "loss": 0.0013, "step": 4560 }, { "epoch": 0.93, "learning_rate": 0.00027727496782727415, "loss": 0.0634, "step": 4561 }, { "epoch": 0.93, "learning_rate": 0.0002772647081108646, "loss": 0.0162, "step": 4562 }, { "epoch": 0.93, "learning_rate": 0.0002772544462688941, "loss": 0.0696, "step": 4563 }, { "epoch": 0.93, "learning_rate": 0.00027724418230153433, "loss": 0.0283, "step": 4564 }, { "epoch": 0.93, "learning_rate": 0.00027723391620895635, "loss": 0.0165, "step": 4565 }, { "epoch": 0.93, "learning_rate": 0.00027722364799133187, "loss": 0.02, "step": 4566 }, { "epoch": 0.93, "learning_rate": 0.0002772133776488323, "loss": 0.0117, "step": 4567 }, { "epoch": 0.93, "learning_rate": 0.0002772031051816292, "loss": 0.0362, "step": 4568 }, { "epoch": 0.93, "learning_rate": 0.0002771928305898941, "loss": 0.0157, "step": 4569 }, { "epoch": 0.93, "learning_rate": 0.00027718255387379866, "loss": 0.0072, "step": 4570 }, { "epoch": 0.93, "learning_rate": 0.0002771722750335145, "loss": 0.0304, "step": 4571 }, { "epoch": 0.93, "learning_rate": 0.0002771619940692133, "loss": 0.0132, "step": 4572 }, { "epoch": 0.93, "learning_rate": 0.0002771517109810667, "loss": 0.0068, "step": 4573 }, { "epoch": 0.93, "learning_rate": 0.0002771414257692466, "loss": 0.0171, "step": 4574 }, { "epoch": 0.93, "learning_rate": 0.00027713113843392466, "loss": 0.019, "step": 4575 }, { "epoch": 0.93, "learning_rate": 0.00027712084897527274, "loss": 0.0215, "step": 4576 }, { "epoch": 0.93, "learning_rate": 0.00027711055739346267, "loss": 0.0486, "step": 4577 }, { "epoch": 0.93, "learning_rate": 0.00027710026368866635, "loss": 0.0101, "step": 4578 }, { "epoch": 0.93, "learning_rate": 0.0002770899678610557, "loss": 0.0041, "step": 4579 }, { "epoch": 0.93, "learning_rate": 0.0002770796699108027, "loss": 0.045, "step": 4580 }, { "epoch": 0.93, "learning_rate": 0.00027706936983807934, "loss": 0.037, "step": 4581 }, { "epoch": 0.93, "learning_rate": 0.00027705906764305757, "loss": 0.0368, "step": 4582 }, { "epoch": 0.93, "learning_rate": 0.00027704876332590965, "loss": 0.0083, "step": 4583 }, { "epoch": 0.93, "learning_rate": 0.0002770384568868075, "loss": 0.0114, "step": 4584 }, { "epoch": 0.93, "learning_rate": 0.0002770281483259233, "loss": 0.0087, "step": 4585 }, { "epoch": 0.93, "learning_rate": 0.0002770178376434293, "loss": 0.0187, "step": 4586 }, { "epoch": 0.93, "learning_rate": 0.00027700752483949756, "loss": 0.0239, "step": 4587 }, { "epoch": 0.93, "learning_rate": 0.0002769972099143005, "loss": 0.0423, "step": 4588 }, { "epoch": 0.93, "learning_rate": 0.0002769868928680103, "loss": 0.018, "step": 4589 }, { "epoch": 0.93, "learning_rate": 0.00027697657370079923, "loss": 0.0045, "step": 4590 }, { "epoch": 0.93, "learning_rate": 0.0002769662524128397, "loss": 0.0174, "step": 4591 }, { "epoch": 0.94, "learning_rate": 0.0002769559290043041, "loss": 0.011, "step": 4592 }, { "epoch": 0.94, "learning_rate": 0.00027694560347536485, "loss": 0.01, "step": 4593 }, { "epoch": 0.94, "learning_rate": 0.0002769352758261944, "loss": 0.0255, "step": 4594 }, { "epoch": 0.94, "learning_rate": 0.00027692494605696525, "loss": 0.0343, "step": 4595 }, { "epoch": 0.94, "learning_rate": 0.00027691461416784984, "loss": 0.0099, "step": 4596 }, { "epoch": 0.94, "learning_rate": 0.0002769042801590209, "loss": 0.0252, "step": 4597 }, { "epoch": 0.94, "learning_rate": 0.0002768939440306509, "loss": 0.0294, "step": 4598 }, { "epoch": 0.94, "learning_rate": 0.00027688360578291245, "loss": 0.0571, "step": 4599 }, { "epoch": 0.94, "learning_rate": 0.00027687326541597833, "loss": 0.0535, "step": 4600 }, { "epoch": 0.94, "learning_rate": 0.0002768629229300212, "loss": 0.0127, "step": 4601 }, { "epoch": 0.94, "learning_rate": 0.00027685257832521374, "loss": 0.0166, "step": 4602 }, { "epoch": 0.94, "learning_rate": 0.0002768422316017288, "loss": 0.0197, "step": 4603 }, { "epoch": 0.94, "learning_rate": 0.0002768318827597392, "loss": 0.0163, "step": 4604 }, { "epoch": 0.94, "learning_rate": 0.00027682153179941766, "loss": 0.0212, "step": 4605 }, { "epoch": 0.94, "learning_rate": 0.0002768111787209372, "loss": 0.0149, "step": 4606 }, { "epoch": 0.94, "learning_rate": 0.0002768008235244707, "loss": 0.0089, "step": 4607 }, { "epoch": 0.94, "learning_rate": 0.00027679046621019107, "loss": 0.0064, "step": 4608 }, { "epoch": 0.94, "learning_rate": 0.0002767801067782713, "loss": 0.0288, "step": 4609 }, { "epoch": 0.94, "learning_rate": 0.0002767697452288844, "loss": 0.0269, "step": 4610 }, { "epoch": 0.94, "learning_rate": 0.00027675938156220356, "loss": 0.0178, "step": 4611 }, { "epoch": 0.94, "learning_rate": 0.00027674901577840166, "loss": 0.0053, "step": 4612 }, { "epoch": 0.94, "learning_rate": 0.00027673864787765203, "loss": 0.0201, "step": 4613 }, { "epoch": 0.94, "learning_rate": 0.0002767282778601277, "loss": 0.0665, "step": 4614 }, { "epoch": 0.94, "learning_rate": 0.0002767179057260019, "loss": 0.0529, "step": 4615 }, { "epoch": 0.94, "learning_rate": 0.00027670753147544797, "loss": 0.0321, "step": 4616 }, { "epoch": 0.94, "learning_rate": 0.000276697155108639, "loss": 0.0123, "step": 4617 }, { "epoch": 0.94, "learning_rate": 0.00027668677662574836, "loss": 0.0241, "step": 4618 }, { "epoch": 0.94, "learning_rate": 0.00027667639602694947, "loss": 0.0042, "step": 4619 }, { "epoch": 0.94, "learning_rate": 0.00027666601331241563, "loss": 0.0173, "step": 4620 }, { "epoch": 0.94, "learning_rate": 0.0002766556284823203, "loss": 0.0566, "step": 4621 }, { "epoch": 0.94, "learning_rate": 0.00027664524153683687, "loss": 0.007, "step": 4622 }, { "epoch": 0.94, "learning_rate": 0.00027663485247613883, "loss": 0.0321, "step": 4623 }, { "epoch": 0.94, "learning_rate": 0.00027662446130039973, "loss": 0.0121, "step": 4624 }, { "epoch": 0.94, "learning_rate": 0.0002766140680097931, "loss": 0.0157, "step": 4625 }, { "epoch": 0.94, "learning_rate": 0.00027660367260449255, "loss": 0.0135, "step": 4626 }, { "epoch": 0.94, "learning_rate": 0.0002765932750846717, "loss": 0.0137, "step": 4627 }, { "epoch": 0.94, "learning_rate": 0.0002765828754505041, "loss": 0.0369, "step": 4628 }, { "epoch": 0.94, "learning_rate": 0.0002765724737021636, "loss": 0.0234, "step": 4629 }, { "epoch": 0.94, "learning_rate": 0.0002765620698398239, "loss": 0.0221, "step": 4630 }, { "epoch": 0.94, "learning_rate": 0.0002765516638636587, "loss": 0.0143, "step": 4631 }, { "epoch": 0.94, "learning_rate": 0.0002765412557738418, "loss": 0.0416, "step": 4632 }, { "epoch": 0.94, "learning_rate": 0.0002765308455705471, "loss": 0.0217, "step": 4633 }, { "epoch": 0.94, "learning_rate": 0.00027652043325394844, "loss": 0.0165, "step": 4634 }, { "epoch": 0.94, "learning_rate": 0.00027651001882421974, "loss": 0.0052, "step": 4635 }, { "epoch": 0.94, "learning_rate": 0.00027649960228153485, "loss": 0.0144, "step": 4636 }, { "epoch": 0.94, "learning_rate": 0.0002764891836260679, "loss": 0.0258, "step": 4637 }, { "epoch": 0.94, "learning_rate": 0.0002764787628579928, "loss": 0.0326, "step": 4638 }, { "epoch": 0.94, "learning_rate": 0.00027646833997748354, "loss": 0.0306, "step": 4639 }, { "epoch": 0.94, "learning_rate": 0.0002764579149847143, "loss": 0.0183, "step": 4640 }, { "epoch": 0.94, "learning_rate": 0.00027644748787985927, "loss": 0.0557, "step": 4641 }, { "epoch": 0.95, "learning_rate": 0.0002764370586630924, "loss": 0.034, "step": 4642 }, { "epoch": 0.95, "learning_rate": 0.000276426627334588, "loss": 0.007, "step": 4643 }, { "epoch": 0.95, "learning_rate": 0.0002764161938945203, "loss": 0.0327, "step": 4644 }, { "epoch": 0.95, "learning_rate": 0.00027640575834306355, "loss": 0.0091, "step": 4645 }, { "epoch": 0.95, "learning_rate": 0.00027639532068039204, "loss": 0.027, "step": 4646 }, { "epoch": 0.95, "learning_rate": 0.00027638488090668003, "loss": 0.0179, "step": 4647 }, { "epoch": 0.95, "learning_rate": 0.000276374439022102, "loss": 0.0372, "step": 4648 }, { "epoch": 0.95, "learning_rate": 0.0002763639950268322, "loss": 0.0259, "step": 4649 }, { "epoch": 0.95, "learning_rate": 0.00027635354892104524, "loss": 0.0253, "step": 4650 }, { "epoch": 0.95, "learning_rate": 0.00027634310070491546, "loss": 0.0182, "step": 4651 }, { "epoch": 0.95, "learning_rate": 0.0002763326503786174, "loss": 0.0064, "step": 4652 }, { "epoch": 0.95, "learning_rate": 0.0002763221979423257, "loss": 0.0147, "step": 4653 }, { "epoch": 0.95, "learning_rate": 0.00027631174339621476, "loss": 0.0318, "step": 4654 }, { "epoch": 0.95, "learning_rate": 0.0002763012867404593, "loss": 0.0345, "step": 4655 }, { "epoch": 0.95, "learning_rate": 0.00027629082797523395, "loss": 0.0067, "step": 4656 }, { "epoch": 0.95, "learning_rate": 0.00027628036710071333, "loss": 0.0333, "step": 4657 }, { "epoch": 0.95, "learning_rate": 0.00027626990411707227, "loss": 0.028, "step": 4658 }, { "epoch": 0.95, "learning_rate": 0.00027625943902448544, "loss": 0.0032, "step": 4659 }, { "epoch": 0.95, "learning_rate": 0.0002762489718231276, "loss": 0.0377, "step": 4660 }, { "epoch": 0.95, "learning_rate": 0.00027623850251317364, "loss": 0.0599, "step": 4661 }, { "epoch": 0.95, "learning_rate": 0.00027622803109479845, "loss": 0.0259, "step": 4662 }, { "epoch": 0.95, "learning_rate": 0.00027621755756817684, "loss": 0.0213, "step": 4663 }, { "epoch": 0.95, "learning_rate": 0.00027620708193348375, "loss": 0.0264, "step": 4664 }, { "epoch": 0.95, "learning_rate": 0.00027619660419089413, "loss": 0.0192, "step": 4665 }, { "epoch": 0.95, "learning_rate": 0.00027618612434058307, "loss": 0.0376, "step": 4666 }, { "epoch": 0.95, "learning_rate": 0.0002761756423827255, "loss": 0.05, "step": 4667 }, { "epoch": 0.95, "learning_rate": 0.0002761651583174966, "loss": 0.0142, "step": 4668 }, { "epoch": 0.95, "learning_rate": 0.0002761546721450713, "loss": 0.0233, "step": 4669 }, { "epoch": 0.95, "learning_rate": 0.0002761441838656249, "loss": 0.0056, "step": 4670 }, { "epoch": 0.95, "learning_rate": 0.0002761336934793325, "loss": 0.0105, "step": 4671 }, { "epoch": 0.95, "learning_rate": 0.00027612320098636934, "loss": 0.0223, "step": 4672 }, { "epoch": 0.95, "learning_rate": 0.0002761127063869107, "loss": 0.0185, "step": 4673 }, { "epoch": 0.95, "learning_rate": 0.0002761022096811317, "loss": 0.0043, "step": 4674 }, { "epoch": 0.95, "learning_rate": 0.0002760917108692078, "loss": 0.0265, "step": 4675 }, { "epoch": 0.95, "learning_rate": 0.00027608120995131427, "loss": 0.0185, "step": 4676 }, { "epoch": 0.95, "learning_rate": 0.00027607070692762663, "loss": 0.0257, "step": 4677 }, { "epoch": 0.95, "learning_rate": 0.00027606020179832014, "loss": 0.0157, "step": 4678 }, { "epoch": 0.95, "learning_rate": 0.0002760496945635704, "loss": 0.0069, "step": 4679 }, { "epoch": 0.95, "learning_rate": 0.00027603918522355275, "loss": 0.0104, "step": 4680 }, { "epoch": 0.95, "learning_rate": 0.00027602867377844286, "loss": 0.0238, "step": 4681 }, { "epoch": 0.95, "learning_rate": 0.0002760181602284162, "loss": 0.0395, "step": 4682 }, { "epoch": 0.95, "learning_rate": 0.0002760076445736483, "loss": 0.0066, "step": 4683 }, { "epoch": 0.95, "learning_rate": 0.000275997126814315, "loss": 0.024, "step": 4684 }, { "epoch": 0.95, "learning_rate": 0.00027598660695059177, "loss": 0.0146, "step": 4685 }, { "epoch": 0.95, "learning_rate": 0.0002759760849826544, "loss": 0.0175, "step": 4686 }, { "epoch": 0.95, "learning_rate": 0.00027596556091067867, "loss": 0.0234, "step": 4687 }, { "epoch": 0.95, "learning_rate": 0.0002759550347348402, "loss": 0.023, "step": 4688 }, { "epoch": 0.95, "learning_rate": 0.000275944506455315, "loss": 0.0512, "step": 4689 }, { "epoch": 0.95, "learning_rate": 0.00027593397607227874, "loss": 0.0128, "step": 4690 }, { "epoch": 0.96, "learning_rate": 0.0002759234435859074, "loss": 0.0111, "step": 4691 }, { "epoch": 0.96, "learning_rate": 0.0002759129089963768, "loss": 0.0153, "step": 4692 }, { "epoch": 0.96, "learning_rate": 0.000275902372303863, "loss": 0.0457, "step": 4693 }, { "epoch": 0.96, "learning_rate": 0.00027589183350854187, "loss": 0.0303, "step": 4694 }, { "epoch": 0.96, "learning_rate": 0.0002758812926105895, "loss": 0.0175, "step": 4695 }, { "epoch": 0.96, "learning_rate": 0.000275870749610182, "loss": 0.0372, "step": 4696 }, { "epoch": 0.96, "learning_rate": 0.00027586020450749525, "loss": 0.0177, "step": 4697 }, { "epoch": 0.96, "learning_rate": 0.0002758496573027056, "loss": 0.0094, "step": 4698 }, { "epoch": 0.96, "learning_rate": 0.0002758391079959891, "loss": 0.0062, "step": 4699 }, { "epoch": 0.96, "learning_rate": 0.00027582855658752194, "loss": 0.0289, "step": 4700 }, { "epoch": 0.96, "learning_rate": 0.0002758180030774804, "loss": 0.0117, "step": 4701 }, { "epoch": 0.96, "learning_rate": 0.00027580744746604066, "loss": 0.0522, "step": 4702 }, { "epoch": 0.96, "learning_rate": 0.0002757968897533791, "loss": 0.0219, "step": 4703 }, { "epoch": 0.96, "learning_rate": 0.000275786329939672, "loss": 0.0287, "step": 4704 }, { "epoch": 0.96, "learning_rate": 0.00027577576802509575, "loss": 0.0108, "step": 4705 }, { "epoch": 0.96, "learning_rate": 0.0002757652040098268, "loss": 0.0285, "step": 4706 }, { "epoch": 0.96, "learning_rate": 0.00027575463789404153, "loss": 0.0244, "step": 4707 }, { "epoch": 0.96, "learning_rate": 0.0002757440696779164, "loss": 0.0136, "step": 4708 }, { "epoch": 0.96, "learning_rate": 0.00027573349936162796, "loss": 0.0097, "step": 4709 }, { "epoch": 0.96, "learning_rate": 0.0002757229269453527, "loss": 0.0178, "step": 4710 }, { "epoch": 0.96, "learning_rate": 0.00027571235242926736, "loss": 0.0259, "step": 4711 }, { "epoch": 0.96, "learning_rate": 0.00027570177581354833, "loss": 0.0286, "step": 4712 }, { "epoch": 0.96, "learning_rate": 0.0002756911970983724, "loss": 0.0132, "step": 4713 }, { "epoch": 0.96, "learning_rate": 0.0002756806162839162, "loss": 0.0401, "step": 4714 }, { "epoch": 0.96, "learning_rate": 0.0002756700333703565, "loss": 0.016, "step": 4715 }, { "epoch": 0.96, "learning_rate": 0.00027565944835787, "loss": 0.0147, "step": 4716 }, { "epoch": 0.96, "learning_rate": 0.0002756488612466335, "loss": 0.0249, "step": 4717 }, { "epoch": 0.96, "learning_rate": 0.00027563827203682393, "loss": 0.0237, "step": 4718 }, { "epoch": 0.96, "learning_rate": 0.000275627680728618, "loss": 0.033, "step": 4719 }, { "epoch": 0.96, "learning_rate": 0.00027561708732219264, "loss": 0.0246, "step": 4720 }, { "epoch": 0.96, "learning_rate": 0.0002756064918177248, "loss": 0.0234, "step": 4721 }, { "epoch": 0.96, "learning_rate": 0.0002755958942153914, "loss": 0.0192, "step": 4722 }, { "epoch": 0.96, "learning_rate": 0.00027558529451536957, "loss": 0.0111, "step": 4723 }, { "epoch": 0.96, "learning_rate": 0.0002755746927178363, "loss": 0.013, "step": 4724 }, { "epoch": 0.96, "learning_rate": 0.0002755640888229685, "loss": 0.0278, "step": 4725 }, { "epoch": 0.96, "learning_rate": 0.0002755534828309435, "loss": 0.0327, "step": 4726 }, { "epoch": 0.96, "learning_rate": 0.0002755428747419383, "loss": 0.0154, "step": 4727 }, { "epoch": 0.96, "learning_rate": 0.00027553226455613014, "loss": 0.0383, "step": 4728 }, { "epoch": 0.96, "learning_rate": 0.00027552165227369614, "loss": 0.0361, "step": 4729 }, { "epoch": 0.96, "learning_rate": 0.0002755110378948137, "loss": 0.0089, "step": 4730 }, { "epoch": 0.96, "learning_rate": 0.0002755004214196599, "loss": 0.0195, "step": 4731 }, { "epoch": 0.96, "learning_rate": 0.0002754898028484122, "loss": 0.0066, "step": 4732 }, { "epoch": 0.96, "learning_rate": 0.000275479182181248, "loss": 0.0252, "step": 4733 }, { "epoch": 0.96, "learning_rate": 0.0002754685594183445, "loss": 0.0457, "step": 4734 }, { "epoch": 0.96, "learning_rate": 0.00027545793455987925, "loss": 0.0202, "step": 4735 }, { "epoch": 0.96, "learning_rate": 0.00027544730760602963, "loss": 0.013, "step": 4736 }, { "epoch": 0.96, "learning_rate": 0.00027543667855697325, "loss": 0.0191, "step": 4737 }, { "epoch": 0.96, "learning_rate": 0.00027542604741288753, "loss": 0.0261, "step": 4738 }, { "epoch": 0.96, "learning_rate": 0.00027541541417395006, "loss": 0.0139, "step": 4739 }, { "epoch": 0.97, "learning_rate": 0.0002754047788403384, "loss": 0.0066, "step": 4740 }, { "epoch": 0.97, "learning_rate": 0.0002753941414122303, "loss": 0.0248, "step": 4741 }, { "epoch": 0.97, "learning_rate": 0.00027538350188980324, "loss": 0.0204, "step": 4742 }, { "epoch": 0.97, "learning_rate": 0.0002753728602732351, "loss": 0.0208, "step": 4743 }, { "epoch": 0.97, "learning_rate": 0.00027536221656270345, "loss": 0.0083, "step": 4744 }, { "epoch": 0.97, "learning_rate": 0.00027535157075838626, "loss": 0.0095, "step": 4745 }, { "epoch": 0.97, "learning_rate": 0.0002753409228604611, "loss": 0.0523, "step": 4746 }, { "epoch": 0.97, "learning_rate": 0.000275330272869106, "loss": 0.0456, "step": 4747 }, { "epoch": 0.97, "learning_rate": 0.0002753196207844988, "loss": 0.0279, "step": 4748 }, { "epoch": 0.97, "learning_rate": 0.0002753089666068173, "loss": 0.0242, "step": 4749 }, { "epoch": 0.97, "learning_rate": 0.0002752983103362395, "loss": 0.0248, "step": 4750 }, { "epoch": 0.97, "learning_rate": 0.0002752876519729435, "loss": 0.0167, "step": 4751 }, { "epoch": 0.97, "learning_rate": 0.00027527699151710716, "loss": 0.0092, "step": 4752 }, { "epoch": 0.97, "learning_rate": 0.00027526632896890857, "loss": 0.0178, "step": 4753 }, { "epoch": 0.97, "learning_rate": 0.00027525566432852586, "loss": 0.0169, "step": 4754 }, { "epoch": 0.97, "learning_rate": 0.0002752449975961371, "loss": 0.0454, "step": 4755 }, { "epoch": 0.97, "learning_rate": 0.0002752343287719205, "loss": 0.0309, "step": 4756 }, { "epoch": 0.97, "learning_rate": 0.00027522365785605414, "loss": 0.0189, "step": 4757 }, { "epoch": 0.97, "learning_rate": 0.00027521298484871635, "loss": 0.0156, "step": 4758 }, { "epoch": 0.97, "learning_rate": 0.0002752023097500854, "loss": 0.066, "step": 4759 }, { "epoch": 0.97, "learning_rate": 0.00027519163256033955, "loss": 0.0475, "step": 4760 }, { "epoch": 0.97, "learning_rate": 0.00027518095327965707, "loss": 0.0258, "step": 4761 }, { "epoch": 0.97, "learning_rate": 0.00027517027190821636, "loss": 0.005, "step": 4762 }, { "epoch": 0.97, "learning_rate": 0.0002751595884461959, "loss": 0.0071, "step": 4763 }, { "epoch": 0.97, "learning_rate": 0.000275148902893774, "loss": 0.0222, "step": 4764 }, { "epoch": 0.97, "learning_rate": 0.00027513821525112917, "loss": 0.0217, "step": 4765 }, { "epoch": 0.97, "learning_rate": 0.00027512752551843997, "loss": 0.0427, "step": 4766 }, { "epoch": 0.97, "learning_rate": 0.0002751168336958849, "loss": 0.0104, "step": 4767 }, { "epoch": 0.97, "learning_rate": 0.0002751061397836425, "loss": 0.0317, "step": 4768 }, { "epoch": 0.97, "learning_rate": 0.00027509544378189144, "loss": 0.0425, "step": 4769 }, { "epoch": 0.97, "learning_rate": 0.0002750847456908103, "loss": 0.0157, "step": 4770 }, { "epoch": 0.97, "learning_rate": 0.0002750740455105779, "loss": 0.0223, "step": 4771 }, { "epoch": 0.97, "learning_rate": 0.00027506334324137275, "loss": 0.0399, "step": 4772 }, { "epoch": 0.97, "learning_rate": 0.0002750526388833737, "loss": 0.0134, "step": 4773 }, { "epoch": 0.97, "learning_rate": 0.00027504193243675954, "loss": 0.0355, "step": 4774 }, { "epoch": 0.97, "learning_rate": 0.00027503122390170904, "loss": 0.0072, "step": 4775 }, { "epoch": 0.97, "learning_rate": 0.0002750205132784011, "loss": 0.015, "step": 4776 }, { "epoch": 0.97, "learning_rate": 0.00027500980056701464, "loss": 0.0252, "step": 4777 }, { "epoch": 0.97, "learning_rate": 0.00027499908576772853, "loss": 0.0254, "step": 4778 }, { "epoch": 0.97, "learning_rate": 0.0002749883688807217, "loss": 0.0177, "step": 4779 }, { "epoch": 0.97, "learning_rate": 0.0002749776499061732, "loss": 0.029, "step": 4780 }, { "epoch": 0.97, "learning_rate": 0.000274966928844262, "loss": 0.016, "step": 4781 }, { "epoch": 0.97, "learning_rate": 0.00027495620569516725, "loss": 0.0198, "step": 4782 }, { "epoch": 0.97, "learning_rate": 0.00027494548045906795, "loss": 0.0281, "step": 4783 }, { "epoch": 0.97, "learning_rate": 0.0002749347531361433, "loss": 0.0171, "step": 4784 }, { "epoch": 0.97, "learning_rate": 0.0002749240237265725, "loss": 0.0492, "step": 4785 }, { "epoch": 0.97, "learning_rate": 0.0002749132922305346, "loss": 0.0252, "step": 4786 }, { "epoch": 0.97, "learning_rate": 0.00027490255864820896, "loss": 0.0177, "step": 4787 }, { "epoch": 0.97, "learning_rate": 0.0002748918229797748, "loss": 0.0116, "step": 4788 }, { "epoch": 0.98, "learning_rate": 0.00027488108522541146, "loss": 0.043, "step": 4789 }, { "epoch": 0.98, "learning_rate": 0.0002748703453852983, "loss": 0.0315, "step": 4790 }, { "epoch": 0.98, "learning_rate": 0.0002748596034596146, "loss": 0.0191, "step": 4791 }, { "epoch": 0.98, "learning_rate": 0.00027484885944853985, "loss": 0.0346, "step": 4792 }, { "epoch": 0.98, "learning_rate": 0.00027483811335225354, "loss": 0.0156, "step": 4793 }, { "epoch": 0.98, "learning_rate": 0.00027482736517093505, "loss": 0.0252, "step": 4794 }, { "epoch": 0.98, "learning_rate": 0.0002748166149047639, "loss": 0.0379, "step": 4795 }, { "epoch": 0.98, "learning_rate": 0.00027480586255391976, "loss": 0.0156, "step": 4796 }, { "epoch": 0.98, "learning_rate": 0.00027479510811858205, "loss": 0.0069, "step": 4797 }, { "epoch": 0.98, "learning_rate": 0.0002747843515989305, "loss": 0.0175, "step": 4798 }, { "epoch": 0.98, "learning_rate": 0.0002747735929951447, "loss": 0.007, "step": 4799 }, { "epoch": 0.98, "learning_rate": 0.0002747628323074044, "loss": 0.0361, "step": 4800 }, { "epoch": 0.98, "learning_rate": 0.00027475206953588927, "loss": 0.0165, "step": 4801 }, { "epoch": 0.98, "learning_rate": 0.0002747413046807791, "loss": 0.0351, "step": 4802 }, { "epoch": 0.98, "learning_rate": 0.00027473053774225366, "loss": 0.0044, "step": 4803 }, { "epoch": 0.98, "learning_rate": 0.00027471976872049284, "loss": 0.033, "step": 4804 }, { "epoch": 0.98, "learning_rate": 0.0002747089976156764, "loss": 0.0109, "step": 4805 }, { "epoch": 0.98, "learning_rate": 0.00027469822442798437, "loss": 0.0431, "step": 4806 }, { "epoch": 0.98, "learning_rate": 0.00027468744915759655, "loss": 0.0088, "step": 4807 }, { "epoch": 0.98, "learning_rate": 0.00027467667180469294, "loss": 0.0034, "step": 4808 }, { "epoch": 0.98, "learning_rate": 0.0002746658923694536, "loss": 0.0229, "step": 4809 }, { "epoch": 0.98, "learning_rate": 0.00027465511085205855, "loss": 0.011, "step": 4810 }, { "epoch": 0.98, "learning_rate": 0.00027464432725268783, "loss": 0.045, "step": 4811 }, { "epoch": 0.98, "learning_rate": 0.0002746335415715216, "loss": 0.0135, "step": 4812 }, { "epoch": 0.98, "learning_rate": 0.00027462275380873996, "loss": 0.0116, "step": 4813 }, { "epoch": 0.98, "learning_rate": 0.000274611963964523, "loss": 0.0108, "step": 4814 }, { "epoch": 0.98, "learning_rate": 0.0002746011720390511, "loss": 0.0177, "step": 4815 }, { "epoch": 0.98, "learning_rate": 0.0002745903780325044, "loss": 0.0167, "step": 4816 }, { "epoch": 0.98, "learning_rate": 0.0002745795819450632, "loss": 0.0305, "step": 4817 }, { "epoch": 0.98, "learning_rate": 0.00027456878377690784, "loss": 0.0224, "step": 4818 }, { "epoch": 0.98, "learning_rate": 0.00027455798352821865, "loss": 0.0139, "step": 4819 }, { "epoch": 0.98, "learning_rate": 0.00027454718119917604, "loss": 0.002, "step": 4820 }, { "epoch": 0.98, "learning_rate": 0.0002745363767899603, "loss": 0.0163, "step": 4821 }, { "epoch": 0.98, "learning_rate": 0.0002745255703007521, "loss": 0.026, "step": 4822 }, { "epoch": 0.98, "learning_rate": 0.0002745147617317318, "loss": 0.014, "step": 4823 }, { "epoch": 0.98, "learning_rate": 0.0002745039510830799, "loss": 0.0083, "step": 4824 }, { "epoch": 0.98, "learning_rate": 0.000274493138354977, "loss": 0.0137, "step": 4825 }, { "epoch": 0.98, "learning_rate": 0.0002744823235476037, "loss": 0.0131, "step": 4826 }, { "epoch": 0.98, "learning_rate": 0.00027447150666114065, "loss": 0.0245, "step": 4827 }, { "epoch": 0.98, "learning_rate": 0.00027446068769576847, "loss": 0.0426, "step": 4828 }, { "epoch": 0.98, "learning_rate": 0.00027444986665166787, "loss": 0.0533, "step": 4829 }, { "epoch": 0.98, "learning_rate": 0.0002744390435290196, "loss": 0.0103, "step": 4830 }, { "epoch": 0.98, "learning_rate": 0.00027442821832800434, "loss": 0.0081, "step": 4831 }, { "epoch": 0.98, "learning_rate": 0.000274417391048803, "loss": 0.0127, "step": 4832 }, { "epoch": 0.98, "learning_rate": 0.0002744065616915964, "loss": 0.0286, "step": 4833 }, { "epoch": 0.98, "learning_rate": 0.0002743957302565653, "loss": 0.0073, "step": 4834 }, { "epoch": 0.98, "learning_rate": 0.00027438489674389075, "loss": 0.0175, "step": 4835 }, { "epoch": 0.98, "learning_rate": 0.00027437406115375364, "loss": 0.0138, "step": 4836 }, { "epoch": 0.98, "learning_rate": 0.0002743632234863349, "loss": 0.0405, "step": 4837 }, { "epoch": 0.99, "learning_rate": 0.00027435238374181567, "loss": 0.0183, "step": 4838 }, { "epoch": 0.99, "learning_rate": 0.00027434154192037684, "loss": 0.0307, "step": 4839 }, { "epoch": 0.99, "learning_rate": 0.0002743306980221995, "loss": 0.0166, "step": 4840 }, { "epoch": 0.99, "learning_rate": 0.00027431985204746484, "loss": 0.0174, "step": 4841 }, { "epoch": 0.99, "learning_rate": 0.000274309003996354, "loss": 0.0219, "step": 4842 }, { "epoch": 0.99, "learning_rate": 0.00027429815386904817, "loss": 0.0225, "step": 4843 }, { "epoch": 0.99, "learning_rate": 0.00027428730166572854, "loss": 0.0306, "step": 4844 }, { "epoch": 0.99, "learning_rate": 0.0002742764473865763, "loss": 0.0186, "step": 4845 }, { "epoch": 0.99, "learning_rate": 0.00027426559103177283, "loss": 0.0811, "step": 4846 }, { "epoch": 0.99, "learning_rate": 0.00027425473260149946, "loss": 0.0292, "step": 4847 }, { "epoch": 0.99, "learning_rate": 0.0002742438720959374, "loss": 0.0364, "step": 4848 }, { "epoch": 0.99, "learning_rate": 0.00027423300951526827, "loss": 0.0687, "step": 4849 }, { "epoch": 0.99, "learning_rate": 0.0002742221448596733, "loss": 0.0387, "step": 4850 }, { "epoch": 0.99, "learning_rate": 0.0002742112781293341, "loss": 0.0108, "step": 4851 }, { "epoch": 0.99, "learning_rate": 0.000274200409324432, "loss": 0.0163, "step": 4852 }, { "epoch": 0.99, "learning_rate": 0.0002741895384451487, "loss": 0.0189, "step": 4853 }, { "epoch": 0.99, "learning_rate": 0.0002741786654916656, "loss": 0.0121, "step": 4854 }, { "epoch": 0.99, "learning_rate": 0.00027416779046416447, "loss": 0.0259, "step": 4855 }, { "epoch": 0.99, "learning_rate": 0.0002741569133628268, "loss": 0.0142, "step": 4856 }, { "epoch": 0.99, "learning_rate": 0.00027414603418783427, "loss": 0.0222, "step": 4857 }, { "epoch": 0.99, "learning_rate": 0.0002741351529393687, "loss": 0.0146, "step": 4858 }, { "epoch": 0.99, "learning_rate": 0.00027412426961761176, "loss": 0.0283, "step": 4859 }, { "epoch": 0.99, "learning_rate": 0.0002741133842227452, "loss": 0.0353, "step": 4860 }, { "epoch": 0.99, "learning_rate": 0.00027410249675495084, "loss": 0.0182, "step": 4861 }, { "epoch": 0.99, "learning_rate": 0.00027409160721441055, "loss": 0.0212, "step": 4862 }, { "epoch": 0.99, "learning_rate": 0.00027408071560130614, "loss": 0.013, "step": 4863 }, { "epoch": 0.99, "learning_rate": 0.0002740698219158196, "loss": 0.0611, "step": 4864 }, { "epoch": 0.99, "learning_rate": 0.00027405892615813275, "loss": 0.0162, "step": 4865 }, { "epoch": 0.99, "learning_rate": 0.0002740480283284277, "loss": 0.0059, "step": 4866 }, { "epoch": 0.99, "learning_rate": 0.00027403712842688645, "loss": 0.0155, "step": 4867 }, { "epoch": 0.99, "learning_rate": 0.000274026226453691, "loss": 0.071, "step": 4868 }, { "epoch": 0.99, "learning_rate": 0.0002740153224090234, "loss": 0.0263, "step": 4869 }, { "epoch": 0.99, "learning_rate": 0.00027400441629306594, "loss": 0.0043, "step": 4870 }, { "epoch": 0.99, "learning_rate": 0.00027399350810600057, "loss": 0.0208, "step": 4871 }, { "epoch": 0.99, "learning_rate": 0.0002739825978480096, "loss": 0.0133, "step": 4872 }, { "epoch": 0.99, "learning_rate": 0.0002739716855192751, "loss": 0.017, "step": 4873 }, { "epoch": 0.99, "learning_rate": 0.00027396077111997957, "loss": 0.0446, "step": 4874 }, { "epoch": 0.99, "learning_rate": 0.0002739498546503051, "loss": 0.0166, "step": 4875 }, { "epoch": 0.99, "learning_rate": 0.0002739389361104341, "loss": 0.0137, "step": 4876 }, { "epoch": 0.99, "learning_rate": 0.000273928015500549, "loss": 0.0234, "step": 4877 }, { "epoch": 0.99, "learning_rate": 0.000273917092820832, "loss": 0.0125, "step": 4878 }, { "epoch": 0.99, "learning_rate": 0.0002739061680714657, "loss": 0.0233, "step": 4879 }, { "epoch": 0.99, "learning_rate": 0.0002738952412526325, "loss": 0.0032, "step": 4880 }, { "epoch": 0.99, "learning_rate": 0.00027388431236451485, "loss": 0.0195, "step": 4881 }, { "epoch": 0.99, "learning_rate": 0.0002738733814072954, "loss": 0.0153, "step": 4882 }, { "epoch": 0.99, "learning_rate": 0.00027386244838115663, "loss": 0.0609, "step": 4883 }, { "epoch": 0.99, "learning_rate": 0.00027385151328628113, "loss": 0.0041, "step": 4884 }, { "epoch": 0.99, "learning_rate": 0.0002738405761228516, "loss": 0.044, "step": 4885 }, { "epoch": 0.99, "learning_rate": 0.0002738296368910507, "loss": 0.0258, "step": 4886 }, { "epoch": 1.0, "learning_rate": 0.0002738186955910611, "loss": 0.0395, "step": 4887 }, { "epoch": 1.0, "learning_rate": 0.00027380775222306556, "loss": 0.0248, "step": 4888 }, { "epoch": 1.0, "learning_rate": 0.00027379680678724685, "loss": 0.0501, "step": 4889 }, { "epoch": 1.0, "learning_rate": 0.00027378585928378776, "loss": 0.0148, "step": 4890 }, { "epoch": 1.0, "learning_rate": 0.0002737749097128712, "loss": 0.0058, "step": 4891 }, { "epoch": 1.0, "learning_rate": 0.00027376395807468003, "loss": 0.0175, "step": 4892 }, { "epoch": 1.0, "learning_rate": 0.00027375300436939705, "loss": 0.0735, "step": 4893 }, { "epoch": 1.0, "learning_rate": 0.00027374204859720536, "loss": 0.0253, "step": 4894 }, { "epoch": 1.0, "learning_rate": 0.0002737310907582879, "loss": 0.0172, "step": 4895 }, { "epoch": 1.0, "learning_rate": 0.00027372013085282757, "loss": 0.0254, "step": 4896 }, { "epoch": 1.0, "learning_rate": 0.0002737091688810076, "loss": 0.0126, "step": 4897 }, { "epoch": 1.0, "learning_rate": 0.000273698204843011, "loss": 0.0161, "step": 4898 }, { "epoch": 1.0, "learning_rate": 0.00027368723873902085, "loss": 0.0149, "step": 4899 }, { "epoch": 1.0, "learning_rate": 0.00027367627056922034, "loss": 0.0184, "step": 4900 }, { "epoch": 1.0, "learning_rate": 0.00027366530033379264, "loss": 0.0145, "step": 4901 }, { "epoch": 1.0, "learning_rate": 0.000273654328032921, "loss": 0.0158, "step": 4902 }, { "epoch": 1.0, "learning_rate": 0.0002736433536667887, "loss": 0.0131, "step": 4903 }, { "epoch": 1.0, "learning_rate": 0.00027363237723557893, "loss": 0.0277, "step": 4904 }, { "epoch": 1.0, "learning_rate": 0.00027362139873947513, "loss": 0.0404, "step": 4905 }, { "epoch": 1.0, "learning_rate": 0.0002736104181786607, "loss": 0.0064, "step": 4906 }, { "epoch": 1.0, "learning_rate": 0.0002735994355533188, "loss": 0.01, "step": 4907 }, { "epoch": 1.0, "learning_rate": 0.0002735884508636331, "loss": 0.0311, "step": 4908 }, { "epoch": 1.0, "learning_rate": 0.000273577464109787, "loss": 0.0178, "step": 4909 }, { "epoch": 1.0, "learning_rate": 0.0002735664752919639, "loss": 0.0294, "step": 4910 }, { "epoch": 1.0, "learning_rate": 0.0002735554844103475, "loss": 0.0235, "step": 4911 }, { "epoch": 1.0, "learning_rate": 0.0002735444914651212, "loss": 0.0744, "step": 4912 }, { "epoch": 1.0, "learning_rate": 0.0002735334964564688, "loss": 0.0094, "step": 4913 }, { "epoch": 1.0, "learning_rate": 0.00027352249938457373, "loss": 0.0288, "step": 4914 }, { "epoch": 1.0, "learning_rate": 0.0002735115002496198, "loss": 0.0135, "step": 4915 }, { "epoch": 1.0, "learning_rate": 0.00027350049905179065, "loss": 0.0195, "step": 4916 }, { "epoch": 1.0, "learning_rate": 0.00027348949579127004, "loss": 0.0156, "step": 4917 }, { "epoch": 1.0, "learning_rate": 0.00027347849046824177, "loss": 0.0034, "step": 4918 }, { "epoch": 1.0, "learning_rate": 0.0002734674830828896, "loss": 0.007, "step": 4919 }, { "epoch": 1.0, "learning_rate": 0.0002734564736353974, "loss": 0.0282, "step": 4920 }, { "epoch": 1.0, "learning_rate": 0.0002734454621259491, "loss": 0.0118, "step": 4921 }, { "epoch": 1.0, "learning_rate": 0.0002734344485547285, "loss": 0.0074, "step": 4922 }, { "epoch": 1.0, "learning_rate": 0.00027342343292191963, "loss": 0.0154, "step": 4923 }, { "epoch": 1.0, "learning_rate": 0.0002734124152277065, "loss": 0.004, "step": 4924 }, { "epoch": 1.0, "learning_rate": 0.000273401395472273, "loss": 0.0045, "step": 4925 }, { "epoch": 1.0, "learning_rate": 0.0002733903736558033, "loss": 0.0316, "step": 4926 }, { "epoch": 1.0, "learning_rate": 0.00027337934977848143, "loss": 0.017, "step": 4927 }, { "epoch": 1.0, "learning_rate": 0.0002733683238404915, "loss": 0.0163, "step": 4928 }, { "epoch": 1.0, "learning_rate": 0.00027335729584201777, "loss": 0.0203, "step": 4929 }, { "epoch": 1.0, "learning_rate": 0.0002733462657832443, "loss": 0.0132, "step": 4930 }, { "epoch": 1.0, "learning_rate": 0.00027333523366435537, "loss": 0.0218, "step": 4931 }, { "epoch": 1.0, "learning_rate": 0.00027332419948553516, "loss": 0.0072, "step": 4932 }, { "epoch": 1.0, "learning_rate": 0.0002733131632469681, "loss": 0.0136, "step": 4933 }, { "epoch": 1.0, "learning_rate": 0.0002733021249488384, "loss": 0.0069, "step": 4934 }, { "epoch": 1.0, "learning_rate": 0.0002732910845913305, "loss": 0.0321, "step": 4935 }, { "epoch": 1.01, "learning_rate": 0.00027328004217462874, "loss": 0.0134, "step": 4936 }, { "epoch": 1.01, "learning_rate": 0.0002732689976989176, "loss": 0.0253, "step": 4937 }, { "epoch": 1.01, "learning_rate": 0.00027325795116438147, "loss": 0.0124, "step": 4938 }, { "epoch": 1.01, "learning_rate": 0.0002732469025712049, "loss": 0.0075, "step": 4939 }, { "epoch": 1.01, "learning_rate": 0.0002732358519195724, "loss": 0.0134, "step": 4940 }, { "epoch": 1.01, "learning_rate": 0.0002732247992096686, "loss": 0.0149, "step": 4941 }, { "epoch": 1.01, "learning_rate": 0.00027321374444167797, "loss": 0.002, "step": 4942 }, { "epoch": 1.01, "learning_rate": 0.00027320268761578533, "loss": 0.0109, "step": 4943 }, { "epoch": 1.01, "learning_rate": 0.00027319162873217515, "loss": 0.0116, "step": 4944 }, { "epoch": 1.01, "learning_rate": 0.0002731805677910323, "loss": 0.0128, "step": 4945 }, { "epoch": 1.01, "learning_rate": 0.00027316950479254134, "loss": 0.0133, "step": 4946 }, { "epoch": 1.01, "learning_rate": 0.0002731584397368873, "loss": 0.0084, "step": 4947 }, { "epoch": 1.01, "learning_rate": 0.00027314737262425475, "loss": 0.0323, "step": 4948 }, { "epoch": 1.01, "learning_rate": 0.0002731363034548286, "loss": 0.0155, "step": 4949 }, { "epoch": 1.01, "learning_rate": 0.00027312523222879374, "loss": 0.0167, "step": 4950 }, { "epoch": 1.01, "learning_rate": 0.0002731141589463352, "loss": 0.0101, "step": 4951 }, { "epoch": 1.01, "learning_rate": 0.0002731030836076377, "loss": 0.0072, "step": 4952 }, { "epoch": 1.01, "learning_rate": 0.0002730920062128864, "loss": 0.0202, "step": 4953 }, { "epoch": 1.01, "learning_rate": 0.0002730809267622662, "loss": 0.0232, "step": 4954 }, { "epoch": 1.01, "learning_rate": 0.0002730698452559622, "loss": 0.012, "step": 4955 }, { "epoch": 1.01, "learning_rate": 0.0002730587616941595, "loss": 0.0048, "step": 4956 }, { "epoch": 1.01, "learning_rate": 0.00027304767607704315, "loss": 0.0121, "step": 4957 }, { "epoch": 1.01, "learning_rate": 0.00027303658840479835, "loss": 0.0207, "step": 4958 }, { "epoch": 1.01, "learning_rate": 0.00027302549867761026, "loss": 0.0048, "step": 4959 }, { "epoch": 1.01, "learning_rate": 0.00027301440689566416, "loss": 0.0032, "step": 4960 }, { "epoch": 1.01, "learning_rate": 0.00027300331305914525, "loss": 0.0071, "step": 4961 }, { "epoch": 1.01, "learning_rate": 0.00027299221716823875, "loss": 0.0178, "step": 4962 }, { "epoch": 1.01, "learning_rate": 0.0002729811192231301, "loss": 0.0082, "step": 4963 }, { "epoch": 1.01, "learning_rate": 0.0002729700192240047, "loss": 0.0021, "step": 4964 }, { "epoch": 1.01, "learning_rate": 0.0002729589171710478, "loss": 0.0225, "step": 4965 }, { "epoch": 1.01, "learning_rate": 0.0002729478130644448, "loss": 0.0101, "step": 4966 }, { "epoch": 1.01, "learning_rate": 0.0002729367069043814, "loss": 0.0282, "step": 4967 }, { "epoch": 1.01, "learning_rate": 0.00027292559869104285, "loss": 0.0135, "step": 4968 }, { "epoch": 1.01, "learning_rate": 0.00027291448842461474, "loss": 0.0074, "step": 4969 }, { "epoch": 1.01, "learning_rate": 0.0002729033761052827, "loss": 0.0232, "step": 4970 }, { "epoch": 1.01, "learning_rate": 0.00027289226173323226, "loss": 0.0145, "step": 4971 }, { "epoch": 1.01, "learning_rate": 0.00027288114530864906, "loss": 0.0062, "step": 4972 }, { "epoch": 1.01, "learning_rate": 0.0002728700268317188, "loss": 0.005, "step": 4973 }, { "epoch": 1.01, "learning_rate": 0.0002728589063026272, "loss": 0.0065, "step": 4974 }, { "epoch": 1.01, "learning_rate": 0.00027284778372155987, "loss": 0.0035, "step": 4975 }, { "epoch": 1.01, "learning_rate": 0.0002728366590887027, "loss": 0.0114, "step": 4976 }, { "epoch": 1.01, "learning_rate": 0.00027282553240424144, "loss": 0.0062, "step": 4977 }, { "epoch": 1.01, "learning_rate": 0.00027281440366836194, "loss": 0.0288, "step": 4978 }, { "epoch": 1.01, "learning_rate": 0.00027280327288125005, "loss": 0.045, "step": 4979 }, { "epoch": 1.01, "learning_rate": 0.00027279214004309176, "loss": 0.0053, "step": 4980 }, { "epoch": 1.01, "learning_rate": 0.0002727810051540729, "loss": 0.0203, "step": 4981 }, { "epoch": 1.01, "learning_rate": 0.0002727698682143795, "loss": 0.092, "step": 4982 }, { "epoch": 1.01, "learning_rate": 0.0002727587292241975, "loss": 0.0201, "step": 4983 }, { "epoch": 1.01, "learning_rate": 0.0002727475881837131, "loss": 0.0184, "step": 4984 }, { "epoch": 1.02, "learning_rate": 0.0002727364450931122, "loss": 0.0095, "step": 4985 }, { "epoch": 1.02, "learning_rate": 0.00027272529995258103, "loss": 0.0128, "step": 4986 }, { "epoch": 1.02, "learning_rate": 0.0002727141527623057, "loss": 0.0197, "step": 4987 }, { "epoch": 1.02, "learning_rate": 0.0002727030035224723, "loss": 0.0303, "step": 4988 }, { "epoch": 1.02, "learning_rate": 0.00027269185223326723, "loss": 0.0281, "step": 4989 }, { "epoch": 1.02, "learning_rate": 0.00027268069889487657, "loss": 0.0525, "step": 4990 }, { "epoch": 1.02, "learning_rate": 0.00027266954350748664, "loss": 0.0241, "step": 4991 }, { "epoch": 1.02, "learning_rate": 0.0002726583860712838, "loss": 0.0035, "step": 4992 }, { "epoch": 1.02, "learning_rate": 0.00027264722658645435, "loss": 0.021, "step": 4993 }, { "epoch": 1.02, "learning_rate": 0.0002726360650531848, "loss": 0.0053, "step": 4994 }, { "epoch": 1.02, "learning_rate": 0.0002726249014716614, "loss": 0.0225, "step": 4995 }, { "epoch": 1.02, "learning_rate": 0.0002726137358420707, "loss": 0.0102, "step": 4996 }, { "epoch": 1.02, "learning_rate": 0.0002726025681645991, "loss": 0.0128, "step": 4997 }, { "epoch": 1.02, "learning_rate": 0.00027259139843943323, "loss": 0.0241, "step": 4998 }, { "epoch": 1.02, "learning_rate": 0.0002725802266667596, "loss": 0.0192, "step": 4999 }, { "epoch": 1.02, "learning_rate": 0.0002725690528467648, "loss": 0.0061, "step": 5000 }, { "epoch": 1.02, "learning_rate": 0.00027255787697963544, "loss": 0.0431, "step": 5001 }, { "epoch": 1.02, "learning_rate": 0.00027254669906555824, "loss": 0.0069, "step": 5002 }, { "epoch": 1.02, "learning_rate": 0.00027253551910471973, "loss": 0.0077, "step": 5003 }, { "epoch": 1.02, "learning_rate": 0.00027252433709730684, "loss": 0.0091, "step": 5004 }, { "epoch": 1.02, "learning_rate": 0.00027251315304350625, "loss": 0.0097, "step": 5005 }, { "epoch": 1.02, "learning_rate": 0.0002725019669435047, "loss": 0.0092, "step": 5006 }, { "epoch": 1.02, "learning_rate": 0.000272490778797489, "loss": 0.0143, "step": 5007 }, { "epoch": 1.02, "learning_rate": 0.0002724795886056462, "loss": 0.0142, "step": 5008 }, { "epoch": 1.02, "learning_rate": 0.000272468396368163, "loss": 0.0059, "step": 5009 }, { "epoch": 1.02, "learning_rate": 0.00027245720208522647, "loss": 0.0076, "step": 5010 }, { "epoch": 1.02, "learning_rate": 0.00027244600575702347, "loss": 0.0144, "step": 5011 }, { "epoch": 1.02, "learning_rate": 0.00027243480738374103, "loss": 0.0189, "step": 5012 }, { "epoch": 1.02, "learning_rate": 0.0002724236069655662, "loss": 0.0062, "step": 5013 }, { "epoch": 1.02, "learning_rate": 0.00027241240450268605, "loss": 0.0203, "step": 5014 }, { "epoch": 1.02, "learning_rate": 0.0002724011999952877, "loss": 0.005, "step": 5015 }, { "epoch": 1.02, "learning_rate": 0.0002723899934435582, "loss": 0.0122, "step": 5016 }, { "epoch": 1.02, "learning_rate": 0.0002723787848476848, "loss": 0.0122, "step": 5017 }, { "epoch": 1.02, "learning_rate": 0.00027236757420785474, "loss": 0.0192, "step": 5018 }, { "epoch": 1.02, "learning_rate": 0.0002723563615242551, "loss": 0.0241, "step": 5019 }, { "epoch": 1.02, "learning_rate": 0.00027234514679707337, "loss": 0.0138, "step": 5020 }, { "epoch": 1.02, "learning_rate": 0.0002723339300264967, "loss": 0.0264, "step": 5021 }, { "epoch": 1.02, "learning_rate": 0.0002723227112127125, "loss": 0.0067, "step": 5022 }, { "epoch": 1.02, "learning_rate": 0.0002723114903559081, "loss": 0.0179, "step": 5023 }, { "epoch": 1.02, "learning_rate": 0.00027230026745627095, "loss": 0.024, "step": 5024 }, { "epoch": 1.02, "learning_rate": 0.0002722890425139884, "loss": 0.0152, "step": 5025 }, { "epoch": 1.02, "learning_rate": 0.0002722778155292481, "loss": 0.0078, "step": 5026 }, { "epoch": 1.02, "learning_rate": 0.0002722665865022374, "loss": 0.0072, "step": 5027 }, { "epoch": 1.02, "learning_rate": 0.00027225535543314396, "loss": 0.0221, "step": 5028 }, { "epoch": 1.02, "learning_rate": 0.00027224412232215527, "loss": 0.0192, "step": 5029 }, { "epoch": 1.02, "learning_rate": 0.000272232887169459, "loss": 0.0197, "step": 5030 }, { "epoch": 1.02, "learning_rate": 0.0002722216499752428, "loss": 0.0198, "step": 5031 }, { "epoch": 1.02, "learning_rate": 0.0002722104107396943, "loss": 0.0014, "step": 5032 }, { "epoch": 1.02, "learning_rate": 0.00027219916946300134, "loss": 0.0142, "step": 5033 }, { "epoch": 1.03, "learning_rate": 0.0002721879261453515, "loss": 0.014, "step": 5034 }, { "epoch": 1.03, "learning_rate": 0.00027217668078693264, "loss": 0.0067, "step": 5035 }, { "epoch": 1.03, "learning_rate": 0.00027216543338793263, "loss": 0.0108, "step": 5036 }, { "epoch": 1.03, "learning_rate": 0.0002721541839485392, "loss": 0.0047, "step": 5037 }, { "epoch": 1.03, "learning_rate": 0.0002721429324689404, "loss": 0.0033, "step": 5038 }, { "epoch": 1.03, "learning_rate": 0.00027213167894932406, "loss": 0.0179, "step": 5039 }, { "epoch": 1.03, "learning_rate": 0.00027212042338987816, "loss": 0.0093, "step": 5040 }, { "epoch": 1.03, "learning_rate": 0.0002721091657907906, "loss": 0.0171, "step": 5041 }, { "epoch": 1.03, "learning_rate": 0.00027209790615224954, "loss": 0.0195, "step": 5042 }, { "epoch": 1.03, "learning_rate": 0.0002720866444744429, "loss": 0.0176, "step": 5043 }, { "epoch": 1.03, "learning_rate": 0.0002720753807575589, "loss": 0.0129, "step": 5044 }, { "epoch": 1.03, "learning_rate": 0.0002720641150017856, "loss": 0.0268, "step": 5045 }, { "epoch": 1.03, "learning_rate": 0.0002720528472073111, "loss": 0.0141, "step": 5046 }, { "epoch": 1.03, "learning_rate": 0.00027204157737432375, "loss": 0.02, "step": 5047 }, { "epoch": 1.03, "learning_rate": 0.0002720303055030117, "loss": 0.0091, "step": 5048 }, { "epoch": 1.03, "learning_rate": 0.00027201903159356313, "loss": 0.0187, "step": 5049 }, { "epoch": 1.03, "learning_rate": 0.0002720077556461664, "loss": 0.0145, "step": 5050 }, { "epoch": 1.03, "learning_rate": 0.00027199647766100986, "loss": 0.0048, "step": 5051 }, { "epoch": 1.03, "learning_rate": 0.0002719851976382819, "loss": 0.0298, "step": 5052 }, { "epoch": 1.03, "learning_rate": 0.00027197391557817085, "loss": 0.0078, "step": 5053 }, { "epoch": 1.03, "learning_rate": 0.00027196263148086515, "loss": 0.0316, "step": 5054 }, { "epoch": 1.03, "learning_rate": 0.0002719513453465533, "loss": 0.0048, "step": 5055 }, { "epoch": 1.03, "learning_rate": 0.0002719400571754238, "loss": 0.0086, "step": 5056 }, { "epoch": 1.03, "learning_rate": 0.00027192876696766516, "loss": 0.0537, "step": 5057 }, { "epoch": 1.03, "learning_rate": 0.00027191747472346593, "loss": 0.0418, "step": 5058 }, { "epoch": 1.03, "learning_rate": 0.0002719061804430148, "loss": 0.0088, "step": 5059 }, { "epoch": 1.03, "learning_rate": 0.00027189488412650026, "loss": 0.0047, "step": 5060 }, { "epoch": 1.03, "learning_rate": 0.00027188358577411113, "loss": 0.005, "step": 5061 }, { "epoch": 1.03, "learning_rate": 0.00027187228538603597, "loss": 0.0086, "step": 5062 }, { "epoch": 1.03, "learning_rate": 0.0002718609829624636, "loss": 0.0099, "step": 5063 }, { "epoch": 1.03, "learning_rate": 0.00027184967850358286, "loss": 0.0053, "step": 5064 }, { "epoch": 1.03, "learning_rate": 0.0002718383720095825, "loss": 0.0109, "step": 5065 }, { "epoch": 1.03, "learning_rate": 0.0002718270634806512, "loss": 0.0088, "step": 5066 }, { "epoch": 1.03, "learning_rate": 0.00027181575291697807, "loss": 0.0064, "step": 5067 }, { "epoch": 1.03, "learning_rate": 0.00027180444031875195, "loss": 0.0111, "step": 5068 }, { "epoch": 1.03, "learning_rate": 0.0002717931256861617, "loss": 0.0301, "step": 5069 }, { "epoch": 1.03, "learning_rate": 0.00027178180901939636, "loss": 0.0031, "step": 5070 }, { "epoch": 1.03, "learning_rate": 0.00027177049031864496, "loss": 0.018, "step": 5071 }, { "epoch": 1.03, "learning_rate": 0.0002717591695840965, "loss": 0.0049, "step": 5072 }, { "epoch": 1.03, "learning_rate": 0.00027174784681594004, "loss": 0.0137, "step": 5073 }, { "epoch": 1.03, "learning_rate": 0.00027173652201436475, "loss": 0.0051, "step": 5074 }, { "epoch": 1.03, "learning_rate": 0.00027172519517955975, "loss": 0.0531, "step": 5075 }, { "epoch": 1.03, "learning_rate": 0.00027171386631171424, "loss": 0.0117, "step": 5076 }, { "epoch": 1.03, "learning_rate": 0.00027170253541101736, "loss": 0.01, "step": 5077 }, { "epoch": 1.03, "learning_rate": 0.0002716912024776584, "loss": 0.0077, "step": 5078 }, { "epoch": 1.03, "learning_rate": 0.0002716798675118267, "loss": 0.0387, "step": 5079 }, { "epoch": 1.03, "learning_rate": 0.0002716685305137115, "loss": 0.0141, "step": 5080 }, { "epoch": 1.03, "learning_rate": 0.0002716571914835022, "loss": 0.0431, "step": 5081 }, { "epoch": 1.03, "learning_rate": 0.0002716458504213881, "loss": 0.0436, "step": 5082 }, { "epoch": 1.03, "learning_rate": 0.00027163450732755874, "loss": 0.02, "step": 5083 }, { "epoch": 1.04, "learning_rate": 0.0002716231622022035, "loss": 0.0449, "step": 5084 }, { "epoch": 1.04, "learning_rate": 0.0002716118150455119, "loss": 0.0128, "step": 5085 }, { "epoch": 1.04, "learning_rate": 0.00027160046585767333, "loss": 0.0112, "step": 5086 }, { "epoch": 1.04, "learning_rate": 0.00027158911463887747, "loss": 0.0321, "step": 5087 }, { "epoch": 1.04, "learning_rate": 0.0002715777613893139, "loss": 0.0152, "step": 5088 }, { "epoch": 1.04, "learning_rate": 0.0002715664061091722, "loss": 0.0046, "step": 5089 }, { "epoch": 1.04, "learning_rate": 0.00027155504879864214, "loss": 0.0154, "step": 5090 }, { "epoch": 1.04, "learning_rate": 0.00027154368945791325, "loss": 0.0137, "step": 5091 }, { "epoch": 1.04, "learning_rate": 0.00027153232808717527, "loss": 0.0131, "step": 5092 }, { "epoch": 1.04, "learning_rate": 0.00027152096468661805, "loss": 0.0149, "step": 5093 }, { "epoch": 1.04, "learning_rate": 0.00027150959925643133, "loss": 0.0047, "step": 5094 }, { "epoch": 1.04, "learning_rate": 0.0002714982317968049, "loss": 0.0095, "step": 5095 }, { "epoch": 1.04, "learning_rate": 0.0002714868623079287, "loss": 0.0021, "step": 5096 }, { "epoch": 1.04, "learning_rate": 0.0002714754907899926, "loss": 0.0069, "step": 5097 }, { "epoch": 1.04, "learning_rate": 0.0002714641172431864, "loss": 0.0093, "step": 5098 }, { "epoch": 1.04, "learning_rate": 0.0002714527416677003, "loss": 0.0309, "step": 5099 }, { "epoch": 1.04, "learning_rate": 0.0002714413640637241, "loss": 0.0099, "step": 5100 }, { "epoch": 1.04, "learning_rate": 0.0002714299844314478, "loss": 0.0281, "step": 5101 }, { "epoch": 1.04, "learning_rate": 0.00027141860277106163, "loss": 0.0026, "step": 5102 }, { "epoch": 1.04, "learning_rate": 0.00027140721908275556, "loss": 0.0085, "step": 5103 }, { "epoch": 1.04, "learning_rate": 0.00027139583336671983, "loss": 0.0123, "step": 5104 }, { "epoch": 1.04, "learning_rate": 0.00027138444562314445, "loss": 0.0122, "step": 5105 }, { "epoch": 1.04, "learning_rate": 0.00027137305585221976, "loss": 0.0123, "step": 5106 }, { "epoch": 1.04, "learning_rate": 0.00027136166405413586, "loss": 0.0251, "step": 5107 }, { "epoch": 1.04, "learning_rate": 0.00027135027022908315, "loss": 0.01, "step": 5108 }, { "epoch": 1.04, "learning_rate": 0.00027133887437725185, "loss": 0.0254, "step": 5109 }, { "epoch": 1.04, "learning_rate": 0.00027132747649883233, "loss": 0.029, "step": 5110 }, { "epoch": 1.04, "learning_rate": 0.00027131607659401484, "loss": 0.0177, "step": 5111 }, { "epoch": 1.04, "learning_rate": 0.00027130467466298996, "loss": 0.0304, "step": 5112 }, { "epoch": 1.04, "learning_rate": 0.000271293270705948, "loss": 0.0052, "step": 5113 }, { "epoch": 1.04, "learning_rate": 0.00027128186472307944, "loss": 0.0131, "step": 5114 }, { "epoch": 1.04, "learning_rate": 0.00027127045671457485, "loss": 0.0071, "step": 5115 }, { "epoch": 1.04, "learning_rate": 0.0002712590466806247, "loss": 0.0133, "step": 5116 }, { "epoch": 1.04, "learning_rate": 0.00027124763462141956, "loss": 0.0104, "step": 5117 }, { "epoch": 1.04, "learning_rate": 0.00027123622053715, "loss": 0.0132, "step": 5118 }, { "epoch": 1.04, "learning_rate": 0.0002712248044280068, "loss": 0.0115, "step": 5119 }, { "epoch": 1.04, "learning_rate": 0.00027121338629418053, "loss": 0.0077, "step": 5120 }, { "epoch": 1.04, "learning_rate": 0.00027120196613586185, "loss": 0.0178, "step": 5121 }, { "epoch": 1.04, "learning_rate": 0.0002711905439532416, "loss": 0.0126, "step": 5122 }, { "epoch": 1.04, "learning_rate": 0.0002711791197465105, "loss": 0.0153, "step": 5123 }, { "epoch": 1.04, "learning_rate": 0.0002711676935158593, "loss": 0.0214, "step": 5124 }, { "epoch": 1.04, "learning_rate": 0.00027115626526147895, "loss": 0.0214, "step": 5125 }, { "epoch": 1.04, "learning_rate": 0.0002711448349835603, "loss": 0.0199, "step": 5126 }, { "epoch": 1.04, "learning_rate": 0.00027113340268229415, "loss": 0.0236, "step": 5127 }, { "epoch": 1.04, "learning_rate": 0.00027112196835787157, "loss": 0.0353, "step": 5128 }, { "epoch": 1.04, "learning_rate": 0.00027111053201048344, "loss": 0.0095, "step": 5129 }, { "epoch": 1.04, "learning_rate": 0.0002710990936403208, "loss": 0.0053, "step": 5130 }, { "epoch": 1.04, "learning_rate": 0.00027108765324757484, "loss": 0.0119, "step": 5131 }, { "epoch": 1.04, "learning_rate": 0.0002710762108324364, "loss": 0.0143, "step": 5132 }, { "epoch": 1.05, "learning_rate": 0.0002710647663950967, "loss": 0.018, "step": 5133 }, { "epoch": 1.05, "learning_rate": 0.0002710533199357469, "loss": 0.0203, "step": 5134 }, { "epoch": 1.05, "learning_rate": 0.0002710418714545781, "loss": 0.0119, "step": 5135 }, { "epoch": 1.05, "learning_rate": 0.0002710304209517816, "loss": 0.0062, "step": 5136 }, { "epoch": 1.05, "learning_rate": 0.00027101896842754864, "loss": 0.0257, "step": 5137 }, { "epoch": 1.05, "learning_rate": 0.0002710075138820704, "loss": 0.0056, "step": 5138 }, { "epoch": 1.05, "learning_rate": 0.0002709960573155383, "loss": 0.026, "step": 5139 }, { "epoch": 1.05, "learning_rate": 0.00027098459872814366, "loss": 0.0095, "step": 5140 }, { "epoch": 1.05, "learning_rate": 0.0002709731381200778, "loss": 0.0068, "step": 5141 }, { "epoch": 1.05, "learning_rate": 0.00027096167549153224, "loss": 0.0299, "step": 5142 }, { "epoch": 1.05, "learning_rate": 0.0002709502108426983, "loss": 0.0082, "step": 5143 }, { "epoch": 1.05, "learning_rate": 0.00027093874417376756, "loss": 0.0508, "step": 5144 }, { "epoch": 1.05, "learning_rate": 0.00027092727548493154, "loss": 0.0086, "step": 5145 }, { "epoch": 1.05, "learning_rate": 0.0002709158047763817, "loss": 0.0118, "step": 5146 }, { "epoch": 1.05, "learning_rate": 0.0002709043320483097, "loss": 0.0351, "step": 5147 }, { "epoch": 1.05, "learning_rate": 0.00027089285730090714, "loss": 0.0186, "step": 5148 }, { "epoch": 1.05, "learning_rate": 0.0002708813805343656, "loss": 0.04, "step": 5149 }, { "epoch": 1.05, "learning_rate": 0.00027086990174887693, "loss": 0.0245, "step": 5150 }, { "epoch": 1.05, "learning_rate": 0.0002708584209446327, "loss": 0.0194, "step": 5151 }, { "epoch": 1.05, "learning_rate": 0.0002708469381218247, "loss": 0.0071, "step": 5152 }, { "epoch": 1.05, "learning_rate": 0.00027083545328064466, "loss": 0.0108, "step": 5153 }, { "epoch": 1.05, "learning_rate": 0.00027082396642128453, "loss": 0.0079, "step": 5154 }, { "epoch": 1.05, "learning_rate": 0.0002708124775439361, "loss": 0.0122, "step": 5155 }, { "epoch": 1.05, "learning_rate": 0.0002708009866487912, "loss": 0.008, "step": 5156 }, { "epoch": 1.05, "learning_rate": 0.00027078949373604176, "loss": 0.0119, "step": 5157 }, { "epoch": 1.05, "learning_rate": 0.00027077799880587984, "loss": 0.0159, "step": 5158 }, { "epoch": 1.05, "learning_rate": 0.00027076650185849733, "loss": 0.0138, "step": 5159 }, { "epoch": 1.05, "learning_rate": 0.00027075500289408625, "loss": 0.0068, "step": 5160 }, { "epoch": 1.05, "learning_rate": 0.0002707435019128387, "loss": 0.0112, "step": 5161 }, { "epoch": 1.05, "learning_rate": 0.00027073199891494677, "loss": 0.0039, "step": 5162 }, { "epoch": 1.05, "learning_rate": 0.00027072049390060256, "loss": 0.0311, "step": 5163 }, { "epoch": 1.05, "learning_rate": 0.0002707089868699982, "loss": 0.007, "step": 5164 }, { "epoch": 1.05, "learning_rate": 0.00027069747782332596, "loss": 0.0113, "step": 5165 }, { "epoch": 1.05, "learning_rate": 0.00027068596676077793, "loss": 0.0114, "step": 5166 }, { "epoch": 1.05, "learning_rate": 0.0002706744536825465, "loss": 0.0058, "step": 5167 }, { "epoch": 1.05, "learning_rate": 0.00027066293858882387, "loss": 0.0104, "step": 5168 }, { "epoch": 1.05, "learning_rate": 0.0002706514214798024, "loss": 0.0101, "step": 5169 }, { "epoch": 1.05, "learning_rate": 0.00027063990235567443, "loss": 0.0144, "step": 5170 }, { "epoch": 1.05, "learning_rate": 0.00027062838121663245, "loss": 0.0088, "step": 5171 }, { "epoch": 1.05, "learning_rate": 0.00027061685806286875, "loss": 0.0104, "step": 5172 }, { "epoch": 1.05, "learning_rate": 0.0002706053328945758, "loss": 0.0102, "step": 5173 }, { "epoch": 1.05, "learning_rate": 0.0002705938057119462, "loss": 0.0069, "step": 5174 }, { "epoch": 1.05, "learning_rate": 0.00027058227651517236, "loss": 0.0183, "step": 5175 }, { "epoch": 1.05, "learning_rate": 0.00027057074530444694, "loss": 0.0113, "step": 5176 }, { "epoch": 1.05, "learning_rate": 0.0002705592120799624, "loss": 0.0157, "step": 5177 }, { "epoch": 1.05, "learning_rate": 0.0002705476768419115, "loss": 0.0273, "step": 5178 }, { "epoch": 1.05, "learning_rate": 0.00027053613959048683, "loss": 0.0322, "step": 5179 }, { "epoch": 1.05, "learning_rate": 0.00027052460032588114, "loss": 0.008, "step": 5180 }, { "epoch": 1.05, "learning_rate": 0.00027051305904828704, "loss": 0.0114, "step": 5181 }, { "epoch": 1.06, "learning_rate": 0.0002705015157578974, "loss": 0.0086, "step": 5182 }, { "epoch": 1.06, "learning_rate": 0.000270489970454905, "loss": 0.011, "step": 5183 }, { "epoch": 1.06, "learning_rate": 0.00027047842313950265, "loss": 0.0012, "step": 5184 }, { "epoch": 1.06, "learning_rate": 0.0002704668738118832, "loss": 0.005, "step": 5185 }, { "epoch": 1.06, "learning_rate": 0.0002704553224722396, "loss": 0.0084, "step": 5186 }, { "epoch": 1.06, "learning_rate": 0.00027044376912076473, "loss": 0.0175, "step": 5187 }, { "epoch": 1.06, "learning_rate": 0.0002704322137576516, "loss": 0.0273, "step": 5188 }, { "epoch": 1.06, "learning_rate": 0.00027042065638309306, "loss": 0.0056, "step": 5189 }, { "epoch": 1.06, "learning_rate": 0.0002704090969972823, "loss": 0.002, "step": 5190 }, { "epoch": 1.06, "learning_rate": 0.0002703975356004123, "loss": 0.0109, "step": 5191 }, { "epoch": 1.06, "learning_rate": 0.00027038597219267624, "loss": 0.0037, "step": 5192 }, { "epoch": 1.06, "learning_rate": 0.0002703744067742672, "loss": 0.0174, "step": 5193 }, { "epoch": 1.06, "learning_rate": 0.0002703628393453783, "loss": 0.0143, "step": 5194 }, { "epoch": 1.06, "learning_rate": 0.00027035126990620286, "loss": 0.0141, "step": 5195 }, { "epoch": 1.06, "learning_rate": 0.000270339698456934, "loss": 0.0356, "step": 5196 }, { "epoch": 1.06, "learning_rate": 0.000270328124997765, "loss": 0.026, "step": 5197 }, { "epoch": 1.06, "learning_rate": 0.00027031654952888913, "loss": 0.013, "step": 5198 }, { "epoch": 1.06, "learning_rate": 0.00027030497205049984, "loss": 0.0076, "step": 5199 }, { "epoch": 1.06, "learning_rate": 0.0002702933925627904, "loss": 0.0084, "step": 5200 }, { "epoch": 1.06, "learning_rate": 0.00027028181106595424, "loss": 0.0124, "step": 5201 }, { "epoch": 1.06, "learning_rate": 0.00027027022756018475, "loss": 0.0077, "step": 5202 }, { "epoch": 1.06, "learning_rate": 0.00027025864204567547, "loss": 0.0208, "step": 5203 }, { "epoch": 1.06, "learning_rate": 0.00027024705452261986, "loss": 0.0077, "step": 5204 }, { "epoch": 1.06, "learning_rate": 0.0002702354649912115, "loss": 0.0315, "step": 5205 }, { "epoch": 1.06, "learning_rate": 0.00027022387345164385, "loss": 0.0134, "step": 5206 }, { "epoch": 1.06, "learning_rate": 0.0002702122799041106, "loss": 0.0253, "step": 5207 }, { "epoch": 1.06, "learning_rate": 0.00027020068434880533, "loss": 0.0168, "step": 5208 }, { "epoch": 1.06, "learning_rate": 0.00027018908678592176, "loss": 0.0209, "step": 5209 }, { "epoch": 1.06, "learning_rate": 0.0002701774872156536, "loss": 0.0058, "step": 5210 }, { "epoch": 1.06, "learning_rate": 0.00027016588563819456, "loss": 0.0132, "step": 5211 }, { "epoch": 1.06, "learning_rate": 0.0002701542820537383, "loss": 0.0228, "step": 5212 }, { "epoch": 1.06, "learning_rate": 0.0002701426764624788, "loss": 0.0094, "step": 5213 }, { "epoch": 1.06, "learning_rate": 0.0002701310688646098, "loss": 0.0185, "step": 5214 }, { "epoch": 1.06, "learning_rate": 0.0002701194592603252, "loss": 0.0148, "step": 5215 }, { "epoch": 1.06, "learning_rate": 0.0002701078476498189, "loss": 0.0029, "step": 5216 }, { "epoch": 1.06, "learning_rate": 0.0002700962340332848, "loss": 0.0178, "step": 5217 }, { "epoch": 1.06, "learning_rate": 0.0002700846184109169, "loss": 0.0257, "step": 5218 }, { "epoch": 1.06, "learning_rate": 0.0002700730007829092, "loss": 0.0115, "step": 5219 }, { "epoch": 1.06, "learning_rate": 0.00027006138114945574, "loss": 0.0101, "step": 5220 }, { "epoch": 1.06, "learning_rate": 0.00027004975951075053, "loss": 0.0231, "step": 5221 }, { "epoch": 1.06, "learning_rate": 0.00027003813586698775, "loss": 0.0315, "step": 5222 }, { "epoch": 1.06, "learning_rate": 0.00027002651021836157, "loss": 0.0137, "step": 5223 }, { "epoch": 1.06, "learning_rate": 0.000270014882565066, "loss": 0.0323, "step": 5224 }, { "epoch": 1.06, "learning_rate": 0.00027000325290729547, "loss": 0.0701, "step": 5225 }, { "epoch": 1.06, "learning_rate": 0.000269991621245244, "loss": 0.0199, "step": 5226 }, { "epoch": 1.06, "learning_rate": 0.000269979987579106, "loss": 0.029, "step": 5227 }, { "epoch": 1.06, "learning_rate": 0.0002699683519090757, "loss": 0.0279, "step": 5228 }, { "epoch": 1.06, "learning_rate": 0.00026995671423534753, "loss": 0.02, "step": 5229 }, { "epoch": 1.06, "learning_rate": 0.00026994507455811576, "loss": 0.0084, "step": 5230 }, { "epoch": 1.07, "learning_rate": 0.0002699334328775748, "loss": 0.0169, "step": 5231 }, { "epoch": 1.07, "learning_rate": 0.00026992178919391915, "loss": 0.0177, "step": 5232 }, { "epoch": 1.07, "learning_rate": 0.0002699101435073432, "loss": 0.0086, "step": 5233 }, { "epoch": 1.07, "learning_rate": 0.0002698984958180416, "loss": 0.0227, "step": 5234 }, { "epoch": 1.07, "learning_rate": 0.00026988684612620875, "loss": 0.0162, "step": 5235 }, { "epoch": 1.07, "learning_rate": 0.00026987519443203925, "loss": 0.0102, "step": 5236 }, { "epoch": 1.07, "learning_rate": 0.00026986354073572775, "loss": 0.0144, "step": 5237 }, { "epoch": 1.07, "learning_rate": 0.00026985188503746886, "loss": 0.0052, "step": 5238 }, { "epoch": 1.07, "learning_rate": 0.0002698402273374572, "loss": 0.0197, "step": 5239 }, { "epoch": 1.07, "learning_rate": 0.0002698285676358876, "loss": 0.0274, "step": 5240 }, { "epoch": 1.07, "learning_rate": 0.0002698169059329547, "loss": 0.0303, "step": 5241 }, { "epoch": 1.07, "learning_rate": 0.0002698052422288533, "loss": 0.0145, "step": 5242 }, { "epoch": 1.07, "learning_rate": 0.00026979357652377826, "loss": 0.0063, "step": 5243 }, { "epoch": 1.07, "learning_rate": 0.0002697819088179243, "loss": 0.0122, "step": 5244 }, { "epoch": 1.07, "learning_rate": 0.0002697702391114864, "loss": 0.0131, "step": 5245 }, { "epoch": 1.07, "learning_rate": 0.0002697585674046594, "loss": 0.0116, "step": 5246 }, { "epoch": 1.07, "learning_rate": 0.0002697468936976382, "loss": 0.0342, "step": 5247 }, { "epoch": 1.07, "learning_rate": 0.0002697352179906179, "loss": 0.0167, "step": 5248 }, { "epoch": 1.07, "learning_rate": 0.00026972354028379343, "loss": 0.0047, "step": 5249 }, { "epoch": 1.07, "learning_rate": 0.00026971186057735987, "loss": 0.0391, "step": 5250 }, { "epoch": 1.07, "learning_rate": 0.00026970017887151227, "loss": 0.0226, "step": 5251 }, { "epoch": 1.07, "learning_rate": 0.0002696884951664457, "loss": 0.0082, "step": 5252 }, { "epoch": 1.07, "learning_rate": 0.0002696768094623554, "loss": 0.007, "step": 5253 }, { "epoch": 1.07, "learning_rate": 0.00026966512175943634, "loss": 0.0035, "step": 5254 }, { "epoch": 1.07, "learning_rate": 0.00026965343205788395, "loss": 0.0101, "step": 5255 }, { "epoch": 1.07, "learning_rate": 0.00026964174035789336, "loss": 0.0398, "step": 5256 }, { "epoch": 1.07, "learning_rate": 0.00026963004665965995, "loss": 0.0352, "step": 5257 }, { "epoch": 1.07, "learning_rate": 0.00026961835096337886, "loss": 0.0114, "step": 5258 }, { "epoch": 1.07, "learning_rate": 0.00026960665326924554, "loss": 0.012, "step": 5259 }, { "epoch": 1.07, "learning_rate": 0.00026959495357745534, "loss": 0.0155, "step": 5260 }, { "epoch": 1.07, "learning_rate": 0.00026958325188820365, "loss": 0.007, "step": 5261 }, { "epoch": 1.07, "learning_rate": 0.0002695715482016859, "loss": 0.0187, "step": 5262 }, { "epoch": 1.07, "learning_rate": 0.0002695598425180976, "loss": 0.0015, "step": 5263 }, { "epoch": 1.07, "learning_rate": 0.00026954813483763426, "loss": 0.0169, "step": 5264 }, { "epoch": 1.07, "learning_rate": 0.0002695364251604914, "loss": 0.0175, "step": 5265 }, { "epoch": 1.07, "learning_rate": 0.00026952471348686463, "loss": 0.0314, "step": 5266 }, { "epoch": 1.07, "learning_rate": 0.00026951299981694946, "loss": 0.007, "step": 5267 }, { "epoch": 1.07, "learning_rate": 0.00026950128415094166, "loss": 0.0156, "step": 5268 }, { "epoch": 1.07, "learning_rate": 0.0002694895664890368, "loss": 0.0158, "step": 5269 }, { "epoch": 1.07, "learning_rate": 0.0002694778468314306, "loss": 0.0133, "step": 5270 }, { "epoch": 1.07, "learning_rate": 0.00026946612517831893, "loss": 0.0099, "step": 5271 }, { "epoch": 1.07, "learning_rate": 0.00026945440152989736, "loss": 0.0253, "step": 5272 }, { "epoch": 1.07, "learning_rate": 0.00026944267588636185, "loss": 0.0085, "step": 5273 }, { "epoch": 1.07, "learning_rate": 0.00026943094824790823, "loss": 0.0126, "step": 5274 }, { "epoch": 1.07, "learning_rate": 0.00026941921861473224, "loss": 0.0097, "step": 5275 }, { "epoch": 1.07, "learning_rate": 0.0002694074869870299, "loss": 0.02, "step": 5276 }, { "epoch": 1.07, "learning_rate": 0.0002693957533649972, "loss": 0.008, "step": 5277 }, { "epoch": 1.07, "learning_rate": 0.00026938401774883, "loss": 0.0217, "step": 5278 }, { "epoch": 1.07, "learning_rate": 0.00026937228013872427, "loss": 0.0079, "step": 5279 }, { "epoch": 1.08, "learning_rate": 0.0002693605405348762, "loss": 0.0161, "step": 5280 }, { "epoch": 1.08, "learning_rate": 0.00026934879893748186, "loss": 0.0298, "step": 5281 }, { "epoch": 1.08, "learning_rate": 0.0002693370553467372, "loss": 0.0219, "step": 5282 }, { "epoch": 1.08, "learning_rate": 0.0002693253097628385, "loss": 0.0082, "step": 5283 }, { "epoch": 1.08, "learning_rate": 0.0002693135621859818, "loss": 0.0074, "step": 5284 }, { "epoch": 1.08, "learning_rate": 0.0002693018126163635, "loss": 0.0362, "step": 5285 }, { "epoch": 1.08, "learning_rate": 0.00026929006105417966, "loss": 0.0302, "step": 5286 }, { "epoch": 1.08, "learning_rate": 0.00026927830749962664, "loss": 0.0091, "step": 5287 }, { "epoch": 1.08, "learning_rate": 0.0002692665519529008, "loss": 0.0186, "step": 5288 }, { "epoch": 1.08, "learning_rate": 0.0002692547944141983, "loss": 0.0067, "step": 5289 }, { "epoch": 1.08, "learning_rate": 0.0002692430348837157, "loss": 0.0047, "step": 5290 }, { "epoch": 1.08, "learning_rate": 0.0002692312733616493, "loss": 0.0034, "step": 5291 }, { "epoch": 1.08, "learning_rate": 0.0002692195098481956, "loss": 0.0077, "step": 5292 }, { "epoch": 1.08, "learning_rate": 0.000269207744343551, "loss": 0.0125, "step": 5293 }, { "epoch": 1.08, "learning_rate": 0.00026919597684791204, "loss": 0.0091, "step": 5294 }, { "epoch": 1.08, "learning_rate": 0.0002691842073614753, "loss": 0.0443, "step": 5295 }, { "epoch": 1.08, "learning_rate": 0.00026917243588443735, "loss": 0.022, "step": 5296 }, { "epoch": 1.08, "learning_rate": 0.0002691606624169947, "loss": 0.0094, "step": 5297 }, { "epoch": 1.08, "learning_rate": 0.0002691488869593441, "loss": 0.0215, "step": 5298 }, { "epoch": 1.08, "learning_rate": 0.00026913710951168213, "loss": 0.0116, "step": 5299 }, { "epoch": 1.08, "learning_rate": 0.0002691253300742056, "loss": 0.0176, "step": 5300 }, { "epoch": 1.08, "learning_rate": 0.0002691135486471112, "loss": 0.0164, "step": 5301 }, { "epoch": 1.08, "learning_rate": 0.0002691017652305957, "loss": 0.0175, "step": 5302 }, { "epoch": 1.08, "learning_rate": 0.0002690899798248558, "loss": 0.0017, "step": 5303 }, { "epoch": 1.08, "learning_rate": 0.00026907819243008853, "loss": 0.0127, "step": 5304 }, { "epoch": 1.08, "learning_rate": 0.00026906640304649065, "loss": 0.0153, "step": 5305 }, { "epoch": 1.08, "learning_rate": 0.0002690546116742591, "loss": 0.009, "step": 5306 }, { "epoch": 1.08, "learning_rate": 0.00026904281831359076, "loss": 0.0064, "step": 5307 }, { "epoch": 1.08, "learning_rate": 0.0002690310229646827, "loss": 0.0126, "step": 5308 }, { "epoch": 1.08, "learning_rate": 0.00026901922562773184, "loss": 0.0085, "step": 5309 }, { "epoch": 1.08, "learning_rate": 0.0002690074263029352, "loss": 0.0389, "step": 5310 }, { "epoch": 1.08, "learning_rate": 0.00026899562499049, "loss": 0.0327, "step": 5311 }, { "epoch": 1.08, "learning_rate": 0.0002689838216905932, "loss": 0.0081, "step": 5312 }, { "epoch": 1.08, "learning_rate": 0.00026897201640344194, "loss": 0.0184, "step": 5313 }, { "epoch": 1.08, "learning_rate": 0.00026896020912923346, "loss": 0.0247, "step": 5314 }, { "epoch": 1.08, "learning_rate": 0.0002689483998681649, "loss": 0.0065, "step": 5315 }, { "epoch": 1.08, "learning_rate": 0.0002689365886204336, "loss": 0.0251, "step": 5316 }, { "epoch": 1.08, "learning_rate": 0.0002689247753862367, "loss": 0.0314, "step": 5317 }, { "epoch": 1.08, "learning_rate": 0.00026891296016577166, "loss": 0.0123, "step": 5318 }, { "epoch": 1.08, "learning_rate": 0.0002689011429592356, "loss": 0.0111, "step": 5319 }, { "epoch": 1.08, "learning_rate": 0.0002688893237668261, "loss": 0.0047, "step": 5320 }, { "epoch": 1.08, "learning_rate": 0.0002688775025887404, "loss": 0.0079, "step": 5321 }, { "epoch": 1.08, "learning_rate": 0.0002688656794251761, "loss": 0.0127, "step": 5322 }, { "epoch": 1.08, "learning_rate": 0.0002688538542763305, "loss": 0.0151, "step": 5323 }, { "epoch": 1.08, "learning_rate": 0.00026884202714240116, "loss": 0.0272, "step": 5324 }, { "epoch": 1.08, "learning_rate": 0.0002688301980235857, "loss": 0.0217, "step": 5325 }, { "epoch": 1.08, "learning_rate": 0.0002688183669200816, "loss": 0.0321, "step": 5326 }, { "epoch": 1.08, "learning_rate": 0.0002688065338320865, "loss": 0.021, "step": 5327 }, { "epoch": 1.08, "learning_rate": 0.000268794698759798, "loss": 0.0216, "step": 5328 }, { "epoch": 1.09, "learning_rate": 0.0002687828617034139, "loss": 0.0285, "step": 5329 }, { "epoch": 1.09, "learning_rate": 0.00026877102266313163, "loss": 0.0139, "step": 5330 }, { "epoch": 1.09, "learning_rate": 0.0002687591816391491, "loss": 0.0136, "step": 5331 }, { "epoch": 1.09, "learning_rate": 0.00026874733863166417, "loss": 0.0271, "step": 5332 }, { "epoch": 1.09, "learning_rate": 0.00026873549364087447, "loss": 0.0046, "step": 5333 }, { "epoch": 1.09, "learning_rate": 0.0002687236466669779, "loss": 0.0123, "step": 5334 }, { "epoch": 1.09, "learning_rate": 0.00026871179771017237, "loss": 0.0112, "step": 5335 }, { "epoch": 1.09, "learning_rate": 0.00026869994677065565, "loss": 0.0141, "step": 5336 }, { "epoch": 1.09, "learning_rate": 0.0002686880938486258, "loss": 0.0075, "step": 5337 }, { "epoch": 1.09, "learning_rate": 0.0002686762389442808, "loss": 0.0167, "step": 5338 }, { "epoch": 1.09, "learning_rate": 0.0002686643820578185, "loss": 0.011, "step": 5339 }, { "epoch": 1.09, "learning_rate": 0.00026865252318943706, "loss": 0.0087, "step": 5340 }, { "epoch": 1.09, "learning_rate": 0.0002686406623393345, "loss": 0.025, "step": 5341 }, { "epoch": 1.09, "learning_rate": 0.00026862879950770893, "loss": 0.0077, "step": 5342 }, { "epoch": 1.09, "learning_rate": 0.0002686169346947585, "loss": 0.0216, "step": 5343 }, { "epoch": 1.09, "learning_rate": 0.00026860506790068133, "loss": 0.0157, "step": 5344 }, { "epoch": 1.09, "learning_rate": 0.00026859319912567566, "loss": 0.0061, "step": 5345 }, { "epoch": 1.09, "learning_rate": 0.00026858132836993974, "loss": 0.0212, "step": 5346 }, { "epoch": 1.09, "learning_rate": 0.0002685694556336717, "loss": 0.0219, "step": 5347 }, { "epoch": 1.09, "learning_rate": 0.00026855758091707003, "loss": 0.0128, "step": 5348 }, { "epoch": 1.09, "learning_rate": 0.00026854570422033295, "loss": 0.0189, "step": 5349 }, { "epoch": 1.09, "learning_rate": 0.0002685338255436588, "loss": 0.0092, "step": 5350 }, { "epoch": 1.09, "learning_rate": 0.00026852194488724606, "loss": 0.0207, "step": 5351 }, { "epoch": 1.09, "learning_rate": 0.00026851006225129306, "loss": 0.0037, "step": 5352 }, { "epoch": 1.09, "learning_rate": 0.00026849817763599835, "loss": 0.0054, "step": 5353 }, { "epoch": 1.09, "learning_rate": 0.0002684862910415604, "loss": 0.0091, "step": 5354 }, { "epoch": 1.09, "learning_rate": 0.00026847440246817775, "loss": 0.0154, "step": 5355 }, { "epoch": 1.09, "learning_rate": 0.0002684625119160489, "loss": 0.0195, "step": 5356 }, { "epoch": 1.09, "learning_rate": 0.00026845061938537247, "loss": 0.0128, "step": 5357 }, { "epoch": 1.09, "learning_rate": 0.0002684387248763471, "loss": 0.0042, "step": 5358 }, { "epoch": 1.09, "learning_rate": 0.00026842682838917154, "loss": 0.0087, "step": 5359 }, { "epoch": 1.09, "learning_rate": 0.0002684149299240443, "loss": 0.0231, "step": 5360 }, { "epoch": 1.09, "learning_rate": 0.00026840302948116427, "loss": 0.0169, "step": 5361 }, { "epoch": 1.09, "learning_rate": 0.00026839112706073014, "loss": 0.0339, "step": 5362 }, { "epoch": 1.09, "learning_rate": 0.0002683792226629407, "loss": 0.0112, "step": 5363 }, { "epoch": 1.09, "learning_rate": 0.0002683673162879948, "loss": 0.007, "step": 5364 }, { "epoch": 1.09, "learning_rate": 0.0002683554079360913, "loss": 0.0178, "step": 5365 }, { "epoch": 1.09, "learning_rate": 0.000268343497607429, "loss": 0.0064, "step": 5366 }, { "epoch": 1.09, "learning_rate": 0.000268331585302207, "loss": 0.0139, "step": 5367 }, { "epoch": 1.09, "learning_rate": 0.00026831967102062404, "loss": 0.0597, "step": 5368 }, { "epoch": 1.09, "learning_rate": 0.00026830775476287933, "loss": 0.0236, "step": 5369 }, { "epoch": 1.09, "learning_rate": 0.0002682958365291717, "loss": 0.011, "step": 5370 }, { "epoch": 1.09, "learning_rate": 0.0002682839163197004, "loss": 0.0376, "step": 5371 }, { "epoch": 1.09, "learning_rate": 0.0002682719941346644, "loss": 0.0184, "step": 5372 }, { "epoch": 1.09, "learning_rate": 0.0002682600699742628, "loss": 0.0173, "step": 5373 }, { "epoch": 1.09, "learning_rate": 0.0002682481438386948, "loss": 0.0092, "step": 5374 }, { "epoch": 1.09, "learning_rate": 0.00026823621572815966, "loss": 0.0146, "step": 5375 }, { "epoch": 1.09, "learning_rate": 0.0002682242856428565, "loss": 0.007, "step": 5376 }, { "epoch": 1.09, "learning_rate": 0.00026821235358298455, "loss": 0.0149, "step": 5377 }, { "epoch": 1.1, "learning_rate": 0.0002682004195487432, "loss": 0.0106, "step": 5378 }, { "epoch": 1.1, "learning_rate": 0.00026818848354033173, "loss": 0.0284, "step": 5379 }, { "epoch": 1.1, "learning_rate": 0.00026817654555794947, "loss": 0.0066, "step": 5380 }, { "epoch": 1.1, "learning_rate": 0.0002681646056017958, "loss": 0.0072, "step": 5381 }, { "epoch": 1.1, "learning_rate": 0.0002681526636720702, "loss": 0.0138, "step": 5382 }, { "epoch": 1.1, "learning_rate": 0.00026814071976897206, "loss": 0.0083, "step": 5383 }, { "epoch": 1.1, "learning_rate": 0.0002681287738927009, "loss": 0.0122, "step": 5384 }, { "epoch": 1.1, "learning_rate": 0.0002681168260434563, "loss": 0.0158, "step": 5385 }, { "epoch": 1.1, "learning_rate": 0.00026810487622143766, "loss": 0.013, "step": 5386 }, { "epoch": 1.1, "learning_rate": 0.0002680929244268447, "loss": 0.0275, "step": 5387 }, { "epoch": 1.1, "learning_rate": 0.000268080970659877, "loss": 0.0326, "step": 5388 }, { "epoch": 1.1, "learning_rate": 0.00026806901492073415, "loss": 0.0155, "step": 5389 }, { "epoch": 1.1, "learning_rate": 0.0002680570572096159, "loss": 0.0086, "step": 5390 }, { "epoch": 1.1, "learning_rate": 0.0002680450975267219, "loss": 0.0159, "step": 5391 }, { "epoch": 1.1, "learning_rate": 0.000268033135872252, "loss": 0.0258, "step": 5392 }, { "epoch": 1.1, "learning_rate": 0.0002680211722464059, "loss": 0.0238, "step": 5393 }, { "epoch": 1.1, "learning_rate": 0.0002680092066493834, "loss": 0.0417, "step": 5394 }, { "epoch": 1.1, "learning_rate": 0.0002679972390813845, "loss": 0.0495, "step": 5395 }, { "epoch": 1.1, "learning_rate": 0.0002679852695426089, "loss": 0.0054, "step": 5396 }, { "epoch": 1.1, "learning_rate": 0.0002679732980332566, "loss": 0.0077, "step": 5397 }, { "epoch": 1.1, "learning_rate": 0.00026796132455352754, "loss": 0.0057, "step": 5398 }, { "epoch": 1.1, "learning_rate": 0.00026794934910362174, "loss": 0.011, "step": 5399 }, { "epoch": 1.1, "learning_rate": 0.00026793737168373906, "loss": 0.0147, "step": 5400 }, { "epoch": 1.1, "learning_rate": 0.0002679253922940797, "loss": 0.0111, "step": 5401 }, { "epoch": 1.1, "learning_rate": 0.0002679134109348437, "loss": 0.0059, "step": 5402 }, { "epoch": 1.1, "learning_rate": 0.00026790142760623115, "loss": 0.0102, "step": 5403 }, { "epoch": 1.1, "learning_rate": 0.0002678894423084422, "loss": 0.019, "step": 5404 }, { "epoch": 1.1, "learning_rate": 0.00026787745504167705, "loss": 0.0262, "step": 5405 }, { "epoch": 1.1, "learning_rate": 0.0002678654658061359, "loss": 0.0095, "step": 5406 }, { "epoch": 1.1, "learning_rate": 0.00026785347460201895, "loss": 0.0147, "step": 5407 }, { "epoch": 1.1, "learning_rate": 0.0002678414814295265, "loss": 0.0148, "step": 5408 }, { "epoch": 1.1, "learning_rate": 0.00026782948628885887, "loss": 0.0261, "step": 5409 }, { "epoch": 1.1, "learning_rate": 0.00026781748918021646, "loss": 0.0109, "step": 5410 }, { "epoch": 1.1, "learning_rate": 0.0002678054901037995, "loss": 0.0045, "step": 5411 }, { "epoch": 1.1, "learning_rate": 0.00026779348905980855, "loss": 0.0261, "step": 5412 }, { "epoch": 1.1, "learning_rate": 0.000267781486048444, "loss": 0.0287, "step": 5413 }, { "epoch": 1.1, "learning_rate": 0.00026776948106990625, "loss": 0.0033, "step": 5414 }, { "epoch": 1.1, "learning_rate": 0.00026775747412439586, "loss": 0.0142, "step": 5415 }, { "epoch": 1.1, "learning_rate": 0.00026774546521211336, "loss": 0.0113, "step": 5416 }, { "epoch": 1.1, "learning_rate": 0.00026773345433325936, "loss": 0.0218, "step": 5417 }, { "epoch": 1.1, "learning_rate": 0.00026772144148803445, "loss": 0.0198, "step": 5418 }, { "epoch": 1.1, "learning_rate": 0.0002677094266766392, "loss": 0.0064, "step": 5419 }, { "epoch": 1.1, "learning_rate": 0.00026769740989927436, "loss": 0.0034, "step": 5420 }, { "epoch": 1.1, "learning_rate": 0.0002676853911561406, "loss": 0.0182, "step": 5421 }, { "epoch": 1.1, "learning_rate": 0.0002676733704474387, "loss": 0.0141, "step": 5422 }, { "epoch": 1.1, "learning_rate": 0.00026766134777336933, "loss": 0.0041, "step": 5423 }, { "epoch": 1.1, "learning_rate": 0.0002676493231341334, "loss": 0.0216, "step": 5424 }, { "epoch": 1.1, "learning_rate": 0.00026763729652993167, "loss": 0.0166, "step": 5425 }, { "epoch": 1.1, "learning_rate": 0.000267625267960965, "loss": 0.0033, "step": 5426 }, { "epoch": 1.11, "learning_rate": 0.00026761323742743436, "loss": 0.0197, "step": 5427 }, { "epoch": 1.11, "learning_rate": 0.00026760120492954064, "loss": 0.0324, "step": 5428 }, { "epoch": 1.11, "learning_rate": 0.00026758917046748484, "loss": 0.0225, "step": 5429 }, { "epoch": 1.11, "learning_rate": 0.0002675771340414679, "loss": 0.0032, "step": 5430 }, { "epoch": 1.11, "learning_rate": 0.0002675650956516909, "loss": 0.007, "step": 5431 }, { "epoch": 1.11, "learning_rate": 0.00026755305529835483, "loss": 0.0232, "step": 5432 }, { "epoch": 1.11, "learning_rate": 0.0002675410129816609, "loss": 0.0054, "step": 5433 }, { "epoch": 1.11, "learning_rate": 0.0002675289687018101, "loss": 0.0129, "step": 5434 }, { "epoch": 1.11, "learning_rate": 0.0002675169224590037, "loss": 0.0189, "step": 5435 }, { "epoch": 1.11, "learning_rate": 0.0002675048742534429, "loss": 0.0298, "step": 5436 }, { "epoch": 1.11, "learning_rate": 0.0002674928240853289, "loss": 0.023, "step": 5437 }, { "epoch": 1.11, "learning_rate": 0.00026748077195486294, "loss": 0.0122, "step": 5438 }, { "epoch": 1.11, "learning_rate": 0.00026746871786224635, "loss": 0.0082, "step": 5439 }, { "epoch": 1.11, "learning_rate": 0.00026745666180768034, "loss": 0.046, "step": 5440 }, { "epoch": 1.11, "learning_rate": 0.00026744460379136644, "loss": 0.0062, "step": 5441 }, { "epoch": 1.11, "learning_rate": 0.00026743254381350596, "loss": 0.0137, "step": 5442 }, { "epoch": 1.11, "learning_rate": 0.0002674204818743003, "loss": 0.0088, "step": 5443 }, { "epoch": 1.11, "learning_rate": 0.000267408417973951, "loss": 0.0284, "step": 5444 }, { "epoch": 1.11, "learning_rate": 0.00026739635211265944, "loss": 0.0098, "step": 5445 }, { "epoch": 1.11, "learning_rate": 0.00026738428429062724, "loss": 0.0054, "step": 5446 }, { "epoch": 1.11, "learning_rate": 0.0002673722145080559, "loss": 0.0489, "step": 5447 }, { "epoch": 1.11, "learning_rate": 0.000267360142765147, "loss": 0.0155, "step": 5448 }, { "epoch": 1.11, "learning_rate": 0.0002673480690621022, "loss": 0.0091, "step": 5449 }, { "epoch": 1.11, "learning_rate": 0.00026733599339912316, "loss": 0.0178, "step": 5450 }, { "epoch": 1.11, "learning_rate": 0.0002673239157764115, "loss": 0.0216, "step": 5451 }, { "epoch": 1.11, "learning_rate": 0.000267311836194169, "loss": 0.0281, "step": 5452 }, { "epoch": 1.11, "learning_rate": 0.0002672997546525974, "loss": 0.0048, "step": 5453 }, { "epoch": 1.11, "learning_rate": 0.0002672876711518985, "loss": 0.0043, "step": 5454 }, { "epoch": 1.11, "learning_rate": 0.000267275585692274, "loss": 0.0126, "step": 5455 }, { "epoch": 1.11, "learning_rate": 0.0002672634982739259, "loss": 0.001, "step": 5456 }, { "epoch": 1.11, "learning_rate": 0.00026725140889705606, "loss": 0.0082, "step": 5457 }, { "epoch": 1.11, "learning_rate": 0.0002672393175618664, "loss": 0.0053, "step": 5458 }, { "epoch": 1.11, "learning_rate": 0.0002672272242685588, "loss": 0.0015, "step": 5459 }, { "epoch": 1.11, "learning_rate": 0.0002672151290173352, "loss": 0.0159, "step": 5460 }, { "epoch": 1.11, "learning_rate": 0.00026720303180839775, "loss": 0.0109, "step": 5461 }, { "epoch": 1.11, "learning_rate": 0.0002671909326419484, "loss": 0.0225, "step": 5462 }, { "epoch": 1.11, "learning_rate": 0.0002671788315181893, "loss": 0.017, "step": 5463 }, { "epoch": 1.11, "learning_rate": 0.0002671667284373225, "loss": 0.0025, "step": 5464 }, { "epoch": 1.11, "learning_rate": 0.00026715462339955016, "loss": 0.0141, "step": 5465 }, { "epoch": 1.11, "learning_rate": 0.00026714251640507446, "loss": 0.0194, "step": 5466 }, { "epoch": 1.11, "learning_rate": 0.0002671304074540976, "loss": 0.0126, "step": 5467 }, { "epoch": 1.11, "learning_rate": 0.0002671182965468219, "loss": 0.0124, "step": 5468 }, { "epoch": 1.11, "learning_rate": 0.00026710618368344955, "loss": 0.0031, "step": 5469 }, { "epoch": 1.11, "learning_rate": 0.00026709406886418286, "loss": 0.0166, "step": 5470 }, { "epoch": 1.11, "learning_rate": 0.0002670819520892242, "loss": 0.0153, "step": 5471 }, { "epoch": 1.11, "learning_rate": 0.0002670698333587759, "loss": 0.0252, "step": 5472 }, { "epoch": 1.11, "learning_rate": 0.00026705771267304044, "loss": 0.0267, "step": 5473 }, { "epoch": 1.11, "learning_rate": 0.0002670455900322202, "loss": 0.0228, "step": 5474 }, { "epoch": 1.11, "learning_rate": 0.0002670334654365177, "loss": 0.018, "step": 5475 }, { "epoch": 1.12, "learning_rate": 0.00026702133888613534, "loss": 0.0268, "step": 5476 }, { "epoch": 1.12, "learning_rate": 0.0002670092103812758, "loss": 0.0248, "step": 5477 }, { "epoch": 1.12, "learning_rate": 0.0002669970799221415, "loss": 0.0072, "step": 5478 }, { "epoch": 1.12, "learning_rate": 0.00026698494750893514, "loss": 0.0093, "step": 5479 }, { "epoch": 1.12, "learning_rate": 0.00026697281314185943, "loss": 0.0157, "step": 5480 }, { "epoch": 1.12, "learning_rate": 0.00026696067682111684, "loss": 0.0154, "step": 5481 }, { "epoch": 1.12, "learning_rate": 0.0002669485385469101, "loss": 0.0102, "step": 5482 }, { "epoch": 1.12, "learning_rate": 0.00026693639831944216, "loss": 0.0066, "step": 5483 }, { "epoch": 1.12, "learning_rate": 0.0002669242561389156, "loss": 0.0187, "step": 5484 }, { "epoch": 1.12, "learning_rate": 0.0002669121120055332, "loss": 0.0032, "step": 5485 }, { "epoch": 1.12, "learning_rate": 0.0002668999659194979, "loss": 0.008, "step": 5486 }, { "epoch": 1.12, "learning_rate": 0.0002668878178810125, "loss": 0.0172, "step": 5487 }, { "epoch": 1.12, "learning_rate": 0.00026687566789027983, "loss": 0.0298, "step": 5488 }, { "epoch": 1.12, "learning_rate": 0.0002668635159475029, "loss": 0.0109, "step": 5489 }, { "epoch": 1.12, "learning_rate": 0.0002668513620528847, "loss": 0.0283, "step": 5490 }, { "epoch": 1.12, "learning_rate": 0.00026683920620662816, "loss": 0.0186, "step": 5491 }, { "epoch": 1.12, "learning_rate": 0.00026682704840893634, "loss": 0.0262, "step": 5492 }, { "epoch": 1.12, "learning_rate": 0.0002668148886600123, "loss": 0.0093, "step": 5493 }, { "epoch": 1.12, "learning_rate": 0.00026680272696005906, "loss": 0.011, "step": 5494 }, { "epoch": 1.12, "learning_rate": 0.00026679056330927985, "loss": 0.0173, "step": 5495 }, { "epoch": 1.12, "learning_rate": 0.00026677839770787777, "loss": 0.013, "step": 5496 }, { "epoch": 1.12, "learning_rate": 0.000266766230156056, "loss": 0.0073, "step": 5497 }, { "epoch": 1.12, "learning_rate": 0.0002667540606540178, "loss": 0.0249, "step": 5498 }, { "epoch": 1.12, "learning_rate": 0.00026674188920196637, "loss": 0.0255, "step": 5499 }, { "epoch": 1.12, "learning_rate": 0.000266729715800105, "loss": 0.0134, "step": 5500 }, { "epoch": 1.12, "learning_rate": 0.00026671754044863704, "loss": 0.0034, "step": 5501 }, { "epoch": 1.12, "learning_rate": 0.00026670536314776593, "loss": 0.0305, "step": 5502 }, { "epoch": 1.12, "learning_rate": 0.0002666931838976949, "loss": 0.0064, "step": 5503 }, { "epoch": 1.12, "learning_rate": 0.0002666810026986274, "loss": 0.0068, "step": 5504 }, { "epoch": 1.12, "learning_rate": 0.0002666688195507669, "loss": 0.0044, "step": 5505 }, { "epoch": 1.12, "learning_rate": 0.0002666566344543169, "loss": 0.0077, "step": 5506 }, { "epoch": 1.12, "learning_rate": 0.0002666444474094809, "loss": 0.0093, "step": 5507 }, { "epoch": 1.12, "learning_rate": 0.00026663225841646243, "loss": 0.0202, "step": 5508 }, { "epoch": 1.12, "learning_rate": 0.0002666200674754651, "loss": 0.0156, "step": 5509 }, { "epoch": 1.12, "learning_rate": 0.0002666078745866925, "loss": 0.0109, "step": 5510 }, { "epoch": 1.12, "learning_rate": 0.0002665956797503483, "loss": 0.0112, "step": 5511 }, { "epoch": 1.12, "learning_rate": 0.00026658348296663617, "loss": 0.0023, "step": 5512 }, { "epoch": 1.12, "learning_rate": 0.00026657128423575977, "loss": 0.0308, "step": 5513 }, { "epoch": 1.12, "learning_rate": 0.0002665590835579229, "loss": 0.0057, "step": 5514 }, { "epoch": 1.12, "learning_rate": 0.0002665468809333293, "loss": 0.0541, "step": 5515 }, { "epoch": 1.12, "learning_rate": 0.0002665346763621828, "loss": 0.0104, "step": 5516 }, { "epoch": 1.12, "learning_rate": 0.0002665224698446873, "loss": 0.0097, "step": 5517 }, { "epoch": 1.12, "learning_rate": 0.0002665102613810465, "loss": 0.0129, "step": 5518 }, { "epoch": 1.12, "learning_rate": 0.00026649805097146446, "loss": 0.0172, "step": 5519 }, { "epoch": 1.12, "learning_rate": 0.000266485838616145, "loss": 0.0255, "step": 5520 }, { "epoch": 1.12, "learning_rate": 0.0002664736243152922, "loss": 0.0289, "step": 5521 }, { "epoch": 1.12, "learning_rate": 0.00026646140806911003, "loss": 0.0136, "step": 5522 }, { "epoch": 1.12, "learning_rate": 0.0002664491898778025, "loss": 0.0134, "step": 5523 }, { "epoch": 1.12, "learning_rate": 0.0002664369697415736, "loss": 0.0105, "step": 5524 }, { "epoch": 1.12, "learning_rate": 0.00026642474766062766, "loss": 0.02, "step": 5525 }, { "epoch": 1.13, "learning_rate": 0.0002664125236351686, "loss": 0.0027, "step": 5526 }, { "epoch": 1.13, "learning_rate": 0.0002664002976654006, "loss": 0.0195, "step": 5527 }, { "epoch": 1.13, "learning_rate": 0.00026638806975152796, "loss": 0.0464, "step": 5528 }, { "epoch": 1.13, "learning_rate": 0.00026637583989375487, "loss": 0.0063, "step": 5529 }, { "epoch": 1.13, "learning_rate": 0.00026636360809228555, "loss": 0.0463, "step": 5530 }, { "epoch": 1.13, "learning_rate": 0.00026635137434732436, "loss": 0.0032, "step": 5531 }, { "epoch": 1.13, "learning_rate": 0.0002663391386590755, "loss": 0.0166, "step": 5532 }, { "epoch": 1.13, "learning_rate": 0.00026632690102774357, "loss": 0.0133, "step": 5533 }, { "epoch": 1.13, "learning_rate": 0.00026631466145353265, "loss": 0.0104, "step": 5534 }, { "epoch": 1.13, "learning_rate": 0.0002663024199366474, "loss": 0.0088, "step": 5535 }, { "epoch": 1.13, "learning_rate": 0.0002662901764772922, "loss": 0.0182, "step": 5536 }, { "epoch": 1.13, "learning_rate": 0.00026627793107567157, "loss": 0.0031, "step": 5537 }, { "epoch": 1.13, "learning_rate": 0.00026626568373198993, "loss": 0.0135, "step": 5538 }, { "epoch": 1.13, "learning_rate": 0.00026625343444645194, "loss": 0.0253, "step": 5539 }, { "epoch": 1.13, "learning_rate": 0.0002662411832192622, "loss": 0.0403, "step": 5540 }, { "epoch": 1.13, "learning_rate": 0.0002662289300506252, "loss": 0.0291, "step": 5541 }, { "epoch": 1.13, "learning_rate": 0.0002662166749407457, "loss": 0.0089, "step": 5542 }, { "epoch": 1.13, "learning_rate": 0.00026620441788982835, "loss": 0.0066, "step": 5543 }, { "epoch": 1.13, "learning_rate": 0.00026619215889807786, "loss": 0.0052, "step": 5544 }, { "epoch": 1.13, "learning_rate": 0.00026617989796569905, "loss": 0.0041, "step": 5545 }, { "epoch": 1.13, "learning_rate": 0.00026616763509289655, "loss": 0.0236, "step": 5546 }, { "epoch": 1.13, "learning_rate": 0.00026615537027987535, "loss": 0.0164, "step": 5547 }, { "epoch": 1.13, "learning_rate": 0.00026614310352684014, "loss": 0.0136, "step": 5548 }, { "epoch": 1.13, "learning_rate": 0.00026613083483399593, "loss": 0.0151, "step": 5549 }, { "epoch": 1.13, "learning_rate": 0.0002661185642015475, "loss": 0.0163, "step": 5550 }, { "epoch": 1.13, "learning_rate": 0.0002661062916296999, "loss": 0.0035, "step": 5551 }, { "epoch": 1.13, "learning_rate": 0.00026609401711865803, "loss": 0.0052, "step": 5552 }, { "epoch": 1.13, "learning_rate": 0.00026608174066862695, "loss": 0.0041, "step": 5553 }, { "epoch": 1.13, "learning_rate": 0.00026606946227981167, "loss": 0.0098, "step": 5554 }, { "epoch": 1.13, "learning_rate": 0.0002660571819524173, "loss": 0.0108, "step": 5555 }, { "epoch": 1.13, "learning_rate": 0.0002660448996866489, "loss": 0.0102, "step": 5556 }, { "epoch": 1.13, "learning_rate": 0.0002660326154827116, "loss": 0.0463, "step": 5557 }, { "epoch": 1.13, "learning_rate": 0.00026602032934081065, "loss": 0.0251, "step": 5558 }, { "epoch": 1.13, "learning_rate": 0.00026600804126115116, "loss": 0.0104, "step": 5559 }, { "epoch": 1.13, "learning_rate": 0.0002659957512439384, "loss": 0.0181, "step": 5560 }, { "epoch": 1.13, "learning_rate": 0.00026598345928937765, "loss": 0.0084, "step": 5561 }, { "epoch": 1.13, "learning_rate": 0.00026597116539767417, "loss": 0.0023, "step": 5562 }, { "epoch": 1.13, "learning_rate": 0.0002659588695690334, "loss": 0.0216, "step": 5563 }, { "epoch": 1.13, "learning_rate": 0.0002659465718036605, "loss": 0.0323, "step": 5564 }, { "epoch": 1.13, "learning_rate": 0.000265934272101761, "loss": 0.0384, "step": 5565 }, { "epoch": 1.13, "learning_rate": 0.0002659219704635404, "loss": 0.0045, "step": 5566 }, { "epoch": 1.13, "learning_rate": 0.000265909666889204, "loss": 0.0018, "step": 5567 }, { "epoch": 1.13, "learning_rate": 0.00026589736137895743, "loss": 0.0287, "step": 5568 }, { "epoch": 1.13, "learning_rate": 0.0002658850539330061, "loss": 0.0134, "step": 5569 }, { "epoch": 1.13, "learning_rate": 0.0002658727445515556, "loss": 0.0152, "step": 5570 }, { "epoch": 1.13, "learning_rate": 0.0002658604332348116, "loss": 0.0047, "step": 5571 }, { "epoch": 1.13, "learning_rate": 0.00026584811998297967, "loss": 0.0248, "step": 5572 }, { "epoch": 1.13, "learning_rate": 0.00026583580479626546, "loss": 0.0132, "step": 5573 }, { "epoch": 1.13, "learning_rate": 0.0002658234876748746, "loss": 0.0014, "step": 5574 }, { "epoch": 1.14, "learning_rate": 0.0002658111686190129, "loss": 0.0072, "step": 5575 }, { "epoch": 1.14, "learning_rate": 0.00026579884762888606, "loss": 0.0026, "step": 5576 }, { "epoch": 1.14, "learning_rate": 0.0002657865247046999, "loss": 0.0065, "step": 5577 }, { "epoch": 1.14, "learning_rate": 0.0002657741998466602, "loss": 0.0077, "step": 5578 }, { "epoch": 1.14, "learning_rate": 0.0002657618730549728, "loss": 0.0299, "step": 5579 }, { "epoch": 1.14, "learning_rate": 0.00026574954432984364, "loss": 0.0166, "step": 5580 }, { "epoch": 1.14, "learning_rate": 0.00026573721367147856, "loss": 0.0094, "step": 5581 }, { "epoch": 1.14, "learning_rate": 0.0002657248810800836, "loss": 0.014, "step": 5582 }, { "epoch": 1.14, "learning_rate": 0.0002657125465558647, "loss": 0.0073, "step": 5583 }, { "epoch": 1.14, "learning_rate": 0.00026570021009902776, "loss": 0.0067, "step": 5584 }, { "epoch": 1.14, "learning_rate": 0.0002656878717097789, "loss": 0.015, "step": 5585 }, { "epoch": 1.14, "learning_rate": 0.0002656755313883243, "loss": 0.0416, "step": 5586 }, { "epoch": 1.14, "learning_rate": 0.0002656631891348699, "loss": 0.0192, "step": 5587 }, { "epoch": 1.14, "learning_rate": 0.00026565084494962197, "loss": 0.0063, "step": 5588 }, { "epoch": 1.14, "learning_rate": 0.00026563849883278655, "loss": 0.0113, "step": 5589 }, { "epoch": 1.14, "learning_rate": 0.00026562615078457, "loss": 0.0198, "step": 5590 }, { "epoch": 1.14, "learning_rate": 0.0002656138008051784, "loss": 0.0147, "step": 5591 }, { "epoch": 1.14, "learning_rate": 0.00026560144889481815, "loss": 0.0116, "step": 5592 }, { "epoch": 1.14, "learning_rate": 0.00026558909505369543, "loss": 0.0155, "step": 5593 }, { "epoch": 1.14, "learning_rate": 0.0002655767392820167, "loss": 0.0306, "step": 5594 }, { "epoch": 1.14, "learning_rate": 0.0002655643815799882, "loss": 0.0152, "step": 5595 }, { "epoch": 1.14, "learning_rate": 0.0002655520219478164, "loss": 0.0128, "step": 5596 }, { "epoch": 1.14, "learning_rate": 0.0002655396603857077, "loss": 0.0158, "step": 5597 }, { "epoch": 1.14, "learning_rate": 0.0002655272968938686, "loss": 0.0125, "step": 5598 }, { "epoch": 1.14, "learning_rate": 0.0002655149314725056, "loss": 0.0188, "step": 5599 }, { "epoch": 1.14, "learning_rate": 0.00026550256412182513, "loss": 0.0237, "step": 5600 }, { "epoch": 1.14, "learning_rate": 0.00026549019484203385, "loss": 0.0476, "step": 5601 }, { "epoch": 1.14, "learning_rate": 0.0002654778236333383, "loss": 0.0071, "step": 5602 }, { "epoch": 1.14, "learning_rate": 0.0002654654504959451, "loss": 0.0132, "step": 5603 }, { "epoch": 1.14, "learning_rate": 0.00026545307543006093, "loss": 0.0278, "step": 5604 }, { "epoch": 1.14, "learning_rate": 0.0002654406984358925, "loss": 0.0123, "step": 5605 }, { "epoch": 1.14, "learning_rate": 0.00026542831951364645, "loss": 0.0077, "step": 5606 }, { "epoch": 1.14, "learning_rate": 0.0002654159386635296, "loss": 0.0181, "step": 5607 }, { "epoch": 1.14, "learning_rate": 0.0002654035558857487, "loss": 0.0083, "step": 5608 }, { "epoch": 1.14, "learning_rate": 0.00026539117118051065, "loss": 0.007, "step": 5609 }, { "epoch": 1.14, "learning_rate": 0.0002653787845480221, "loss": 0.0182, "step": 5610 }, { "epoch": 1.14, "learning_rate": 0.0002653663959884901, "loss": 0.0229, "step": 5611 }, { "epoch": 1.14, "learning_rate": 0.0002653540055021216, "loss": 0.0323, "step": 5612 }, { "epoch": 1.14, "learning_rate": 0.00026534161308912335, "loss": 0.0165, "step": 5613 }, { "epoch": 1.14, "learning_rate": 0.0002653292187497025, "loss": 0.019, "step": 5614 }, { "epoch": 1.14, "learning_rate": 0.00026531682248406597, "loss": 0.0289, "step": 5615 }, { "epoch": 1.14, "learning_rate": 0.00026530442429242087, "loss": 0.0094, "step": 5616 }, { "epoch": 1.14, "learning_rate": 0.0002652920241749742, "loss": 0.0116, "step": 5617 }, { "epoch": 1.14, "learning_rate": 0.0002652796221319331, "loss": 0.0254, "step": 5618 }, { "epoch": 1.14, "learning_rate": 0.0002652672181635047, "loss": 0.044, "step": 5619 }, { "epoch": 1.14, "learning_rate": 0.0002652548122698962, "loss": 0.0061, "step": 5620 }, { "epoch": 1.14, "learning_rate": 0.00026524240445131473, "loss": 0.0104, "step": 5621 }, { "epoch": 1.14, "learning_rate": 0.0002652299947079676, "loss": 0.0125, "step": 5622 }, { "epoch": 1.14, "learning_rate": 0.0002652175830400621, "loss": 0.0071, "step": 5623 }, { "epoch": 1.15, "learning_rate": 0.00026520516944780536, "loss": 0.0137, "step": 5624 }, { "epoch": 1.15, "learning_rate": 0.00026519275393140486, "loss": 0.0216, "step": 5625 }, { "epoch": 1.15, "learning_rate": 0.000265180336491068, "loss": 0.0229, "step": 5626 }, { "epoch": 1.15, "learning_rate": 0.000265167917127002, "loss": 0.0247, "step": 5627 }, { "epoch": 1.15, "learning_rate": 0.00026515549583941444, "loss": 0.0109, "step": 5628 }, { "epoch": 1.15, "learning_rate": 0.00026514307262851276, "loss": 0.0399, "step": 5629 }, { "epoch": 1.15, "learning_rate": 0.0002651306474945044, "loss": 0.0313, "step": 5630 }, { "epoch": 1.15, "learning_rate": 0.0002651182204375969, "loss": 0.0159, "step": 5631 }, { "epoch": 1.15, "learning_rate": 0.0002651057914579978, "loss": 0.0189, "step": 5632 }, { "epoch": 1.15, "learning_rate": 0.0002650933605559147, "loss": 0.0112, "step": 5633 }, { "epoch": 1.15, "learning_rate": 0.00026508092773155526, "loss": 0.0082, "step": 5634 }, { "epoch": 1.15, "learning_rate": 0.0002650684929851271, "loss": 0.0145, "step": 5635 }, { "epoch": 1.15, "learning_rate": 0.0002650560563168378, "loss": 0.0049, "step": 5636 }, { "epoch": 1.15, "learning_rate": 0.00026504361772689526, "loss": 0.0124, "step": 5637 }, { "epoch": 1.15, "learning_rate": 0.0002650311772155071, "loss": 0.0049, "step": 5638 }, { "epoch": 1.15, "learning_rate": 0.00026501873478288124, "loss": 0.0178, "step": 5639 }, { "epoch": 1.15, "learning_rate": 0.00026500629042922535, "loss": 0.0138, "step": 5640 }, { "epoch": 1.15, "learning_rate": 0.0002649938441547473, "loss": 0.0303, "step": 5641 }, { "epoch": 1.15, "learning_rate": 0.000264981395959655, "loss": 0.0055, "step": 5642 }, { "epoch": 1.15, "learning_rate": 0.0002649689458441563, "loss": 0.0102, "step": 5643 }, { "epoch": 1.15, "learning_rate": 0.0002649564938084592, "loss": 0.0123, "step": 5644 }, { "epoch": 1.15, "learning_rate": 0.00026494403985277167, "loss": 0.0195, "step": 5645 }, { "epoch": 1.15, "learning_rate": 0.0002649315839773018, "loss": 0.003, "step": 5646 }, { "epoch": 1.15, "learning_rate": 0.00026491912618225737, "loss": 0.0137, "step": 5647 }, { "epoch": 1.15, "learning_rate": 0.00026490666646784665, "loss": 0.0237, "step": 5648 }, { "epoch": 1.15, "learning_rate": 0.00026489420483427774, "loss": 0.0239, "step": 5649 }, { "epoch": 1.15, "learning_rate": 0.00026488174128175875, "loss": 0.0188, "step": 5650 }, { "epoch": 1.15, "learning_rate": 0.0002648692758104978, "loss": 0.0206, "step": 5651 }, { "epoch": 1.15, "learning_rate": 0.00026485680842070305, "loss": 0.0236, "step": 5652 }, { "epoch": 1.15, "learning_rate": 0.0002648443391125829, "loss": 0.0033, "step": 5653 }, { "epoch": 1.15, "learning_rate": 0.0002648318678863454, "loss": 0.0109, "step": 5654 }, { "epoch": 1.15, "learning_rate": 0.00026481939474219907, "loss": 0.0569, "step": 5655 }, { "epoch": 1.15, "learning_rate": 0.000264806919680352, "loss": 0.0191, "step": 5656 }, { "epoch": 1.15, "learning_rate": 0.0002647944427010127, "loss": 0.0128, "step": 5657 }, { "epoch": 1.15, "learning_rate": 0.0002647819638043895, "loss": 0.0238, "step": 5658 }, { "epoch": 1.15, "learning_rate": 0.00026476948299069083, "loss": 0.0409, "step": 5659 }, { "epoch": 1.15, "learning_rate": 0.00026475700026012516, "loss": 0.0135, "step": 5660 }, { "epoch": 1.15, "learning_rate": 0.000264744515612901, "loss": 0.011, "step": 5661 }, { "epoch": 1.15, "learning_rate": 0.00026473202904922684, "loss": 0.005, "step": 5662 }, { "epoch": 1.15, "learning_rate": 0.00026471954056931117, "loss": 0.0288, "step": 5663 }, { "epoch": 1.15, "learning_rate": 0.00026470705017336263, "loss": 0.0148, "step": 5664 }, { "epoch": 1.15, "learning_rate": 0.0002646945578615899, "loss": 0.0222, "step": 5665 }, { "epoch": 1.15, "learning_rate": 0.00026468206363420145, "loss": 0.0061, "step": 5666 }, { "epoch": 1.15, "learning_rate": 0.0002646695674914061, "loss": 0.0066, "step": 5667 }, { "epoch": 1.15, "learning_rate": 0.00026465706943341254, "loss": 0.0159, "step": 5668 }, { "epoch": 1.15, "learning_rate": 0.00026464456946042946, "loss": 0.0078, "step": 5669 }, { "epoch": 1.15, "learning_rate": 0.00026463206757266567, "loss": 0.0173, "step": 5670 }, { "epoch": 1.15, "learning_rate": 0.00026461956377033, "loss": 0.019, "step": 5671 }, { "epoch": 1.15, "learning_rate": 0.0002646070580536312, "loss": 0.0071, "step": 5672 }, { "epoch": 1.16, "learning_rate": 0.00026459455042277826, "loss": 0.0123, "step": 5673 }, { "epoch": 1.16, "learning_rate": 0.00026458204087797995, "loss": 0.0046, "step": 5674 }, { "epoch": 1.16, "learning_rate": 0.0002645695294194453, "loss": 0.0256, "step": 5675 }, { "epoch": 1.16, "learning_rate": 0.00026455701604738327, "loss": 0.0202, "step": 5676 }, { "epoch": 1.16, "learning_rate": 0.0002645445007620028, "loss": 0.003, "step": 5677 }, { "epoch": 1.16, "learning_rate": 0.00026453198356351295, "loss": 0.0062, "step": 5678 }, { "epoch": 1.16, "learning_rate": 0.00026451946445212276, "loss": 0.0149, "step": 5679 }, { "epoch": 1.16, "learning_rate": 0.00026450694342804133, "loss": 0.0021, "step": 5680 }, { "epoch": 1.16, "learning_rate": 0.0002644944204914779, "loss": 0.0067, "step": 5681 }, { "epoch": 1.16, "learning_rate": 0.00026448189564264144, "loss": 0.0129, "step": 5682 }, { "epoch": 1.16, "learning_rate": 0.00026446936888174127, "loss": 0.0142, "step": 5683 }, { "epoch": 1.16, "learning_rate": 0.0002644568402089865, "loss": 0.0108, "step": 5684 }, { "epoch": 1.16, "learning_rate": 0.0002644443096245865, "loss": 0.0295, "step": 5685 }, { "epoch": 1.16, "learning_rate": 0.00026443177712875043, "loss": 0.0165, "step": 5686 }, { "epoch": 1.16, "learning_rate": 0.00026441924272168775, "loss": 0.0188, "step": 5687 }, { "epoch": 1.16, "learning_rate": 0.00026440670640360777, "loss": 0.025, "step": 5688 }, { "epoch": 1.16, "learning_rate": 0.00026439416817471975, "loss": 0.0068, "step": 5689 }, { "epoch": 1.16, "learning_rate": 0.0002643816280352332, "loss": 0.0051, "step": 5690 }, { "epoch": 1.16, "learning_rate": 0.00026436908598535754, "loss": 0.0147, "step": 5691 }, { "epoch": 1.16, "learning_rate": 0.00026435654202530234, "loss": 0.0043, "step": 5692 }, { "epoch": 1.16, "learning_rate": 0.0002643439961552769, "loss": 0.0146, "step": 5693 }, { "epoch": 1.16, "learning_rate": 0.000264331448375491, "loss": 0.0333, "step": 5694 }, { "epoch": 1.16, "learning_rate": 0.000264318898686154, "loss": 0.0066, "step": 5695 }, { "epoch": 1.16, "learning_rate": 0.00026430634708747564, "loss": 0.007, "step": 5696 }, { "epoch": 1.16, "learning_rate": 0.0002642937935796656, "loss": 0.0045, "step": 5697 }, { "epoch": 1.16, "learning_rate": 0.0002642812381629334, "loss": 0.0124, "step": 5698 }, { "epoch": 1.16, "learning_rate": 0.0002642686808374887, "loss": 0.0189, "step": 5699 }, { "epoch": 1.16, "learning_rate": 0.00026425612160354146, "loss": 0.0082, "step": 5700 }, { "epoch": 1.16, "learning_rate": 0.0002642435604613012, "loss": 0.0095, "step": 5701 }, { "epoch": 1.16, "learning_rate": 0.000264230997410978, "loss": 0.0054, "step": 5702 }, { "epoch": 1.16, "learning_rate": 0.0002642184324527814, "loss": 0.0008, "step": 5703 }, { "epoch": 1.16, "learning_rate": 0.0002642058655869214, "loss": 0.0182, "step": 5704 }, { "epoch": 1.16, "learning_rate": 0.00026419329681360784, "loss": 0.012, "step": 5705 }, { "epoch": 1.16, "learning_rate": 0.0002641807261330507, "loss": 0.0058, "step": 5706 }, { "epoch": 1.16, "learning_rate": 0.0002641681535454599, "loss": 0.007, "step": 5707 }, { "epoch": 1.16, "learning_rate": 0.0002641555790510454, "loss": 0.0357, "step": 5708 }, { "epoch": 1.16, "learning_rate": 0.0002641430026500173, "loss": 0.0062, "step": 5709 }, { "epoch": 1.16, "learning_rate": 0.00026413042434258555, "loss": 0.0103, "step": 5710 }, { "epoch": 1.16, "learning_rate": 0.00026411784412896027, "loss": 0.0254, "step": 5711 }, { "epoch": 1.16, "learning_rate": 0.0002641052620093516, "loss": 0.0039, "step": 5712 }, { "epoch": 1.16, "learning_rate": 0.0002640926779839697, "loss": 0.0159, "step": 5713 }, { "epoch": 1.16, "learning_rate": 0.0002640800920530247, "loss": 0.0281, "step": 5714 }, { "epoch": 1.16, "learning_rate": 0.00026406750421672674, "loss": 0.0094, "step": 5715 }, { "epoch": 1.16, "learning_rate": 0.0002640549144752862, "loss": 0.0043, "step": 5716 }, { "epoch": 1.16, "learning_rate": 0.00026404232282891326, "loss": 0.0195, "step": 5717 }, { "epoch": 1.16, "learning_rate": 0.00026402972927781835, "loss": 0.0316, "step": 5718 }, { "epoch": 1.16, "learning_rate": 0.00026401713382221163, "loss": 0.0155, "step": 5719 }, { "epoch": 1.16, "learning_rate": 0.0002640045364623036, "loss": 0.0087, "step": 5720 }, { "epoch": 1.16, "learning_rate": 0.00026399193719830457, "loss": 0.007, "step": 5721 }, { "epoch": 1.17, "learning_rate": 0.00026397933603042507, "loss": 0.0279, "step": 5722 }, { "epoch": 1.17, "learning_rate": 0.0002639667329588755, "loss": 0.0134, "step": 5723 }, { "epoch": 1.17, "learning_rate": 0.0002639541279838663, "loss": 0.0249, "step": 5724 }, { "epoch": 1.17, "learning_rate": 0.0002639415211056081, "loss": 0.0229, "step": 5725 }, { "epoch": 1.17, "learning_rate": 0.00026392891232431145, "loss": 0.0033, "step": 5726 }, { "epoch": 1.17, "learning_rate": 0.00026391630164018684, "loss": 0.0093, "step": 5727 }, { "epoch": 1.17, "learning_rate": 0.000263903689053445, "loss": 0.0108, "step": 5728 }, { "epoch": 1.17, "learning_rate": 0.0002638910745642965, "loss": 0.0411, "step": 5729 }, { "epoch": 1.17, "learning_rate": 0.0002638784581729521, "loss": 0.01, "step": 5730 }, { "epoch": 1.17, "learning_rate": 0.0002638658398796225, "loss": 0.0051, "step": 5731 }, { "epoch": 1.17, "learning_rate": 0.0002638532196845185, "loss": 0.03, "step": 5732 }, { "epoch": 1.17, "learning_rate": 0.0002638405975878507, "loss": 0.007, "step": 5733 }, { "epoch": 1.17, "learning_rate": 0.0002638279735898301, "loss": 0.0286, "step": 5734 }, { "epoch": 1.17, "learning_rate": 0.00026381534769066747, "loss": 0.0294, "step": 5735 }, { "epoch": 1.17, "learning_rate": 0.0002638027198905737, "loss": 0.0212, "step": 5736 }, { "epoch": 1.17, "learning_rate": 0.00026379009018975965, "loss": 0.0218, "step": 5737 }, { "epoch": 1.17, "learning_rate": 0.0002637774585884363, "loss": 0.0218, "step": 5738 }, { "epoch": 1.17, "learning_rate": 0.0002637648250868146, "loss": 0.0134, "step": 5739 }, { "epoch": 1.17, "learning_rate": 0.0002637521896851057, "loss": 0.0064, "step": 5740 }, { "epoch": 1.17, "learning_rate": 0.00026373955238352036, "loss": 0.0347, "step": 5741 }, { "epoch": 1.17, "learning_rate": 0.00026372691318226986, "loss": 0.0152, "step": 5742 }, { "epoch": 1.17, "learning_rate": 0.00026371427208156525, "loss": 0.0253, "step": 5743 }, { "epoch": 1.17, "learning_rate": 0.00026370162908161766, "loss": 0.0084, "step": 5744 }, { "epoch": 1.17, "learning_rate": 0.00026368898418263815, "loss": 0.0083, "step": 5745 }, { "epoch": 1.17, "learning_rate": 0.00026367633738483807, "loss": 0.0318, "step": 5746 }, { "epoch": 1.17, "learning_rate": 0.0002636636886884286, "loss": 0.0182, "step": 5747 }, { "epoch": 1.17, "learning_rate": 0.0002636510380936209, "loss": 0.0171, "step": 5748 }, { "epoch": 1.17, "learning_rate": 0.0002636383856006264, "loss": 0.0284, "step": 5749 }, { "epoch": 1.17, "learning_rate": 0.0002636257312096563, "loss": 0.0274, "step": 5750 }, { "epoch": 1.17, "learning_rate": 0.00026361307492092206, "loss": 0.0124, "step": 5751 }, { "epoch": 1.17, "learning_rate": 0.00026360041673463493, "loss": 0.0172, "step": 5752 }, { "epoch": 1.17, "learning_rate": 0.00026358775665100647, "loss": 0.0102, "step": 5753 }, { "epoch": 1.17, "learning_rate": 0.0002635750946702481, "loss": 0.0086, "step": 5754 }, { "epoch": 1.17, "learning_rate": 0.00026356243079257117, "loss": 0.0286, "step": 5755 }, { "epoch": 1.17, "learning_rate": 0.00026354976501818733, "loss": 0.0213, "step": 5756 }, { "epoch": 1.17, "learning_rate": 0.00026353709734730805, "loss": 0.0103, "step": 5757 }, { "epoch": 1.17, "learning_rate": 0.0002635244277801449, "loss": 0.0089, "step": 5758 }, { "epoch": 1.17, "learning_rate": 0.00026351175631690956, "loss": 0.0188, "step": 5759 }, { "epoch": 1.17, "learning_rate": 0.0002634990829578136, "loss": 0.0328, "step": 5760 }, { "epoch": 1.17, "learning_rate": 0.00026348640770306874, "loss": 0.0169, "step": 5761 }, { "epoch": 1.17, "learning_rate": 0.00026347373055288665, "loss": 0.008, "step": 5762 }, { "epoch": 1.17, "learning_rate": 0.00026346105150747904, "loss": 0.0245, "step": 5763 }, { "epoch": 1.17, "learning_rate": 0.0002634483705670577, "loss": 0.0282, "step": 5764 }, { "epoch": 1.17, "learning_rate": 0.00026343568773183444, "loss": 0.0298, "step": 5765 }, { "epoch": 1.17, "learning_rate": 0.00026342300300202104, "loss": 0.0211, "step": 5766 }, { "epoch": 1.17, "learning_rate": 0.0002634103163778294, "loss": 0.0133, "step": 5767 }, { "epoch": 1.17, "learning_rate": 0.0002633976278594714, "loss": 0.0066, "step": 5768 }, { "epoch": 1.17, "learning_rate": 0.000263384937447159, "loss": 0.0388, "step": 5769 }, { "epoch": 1.17, "learning_rate": 0.00026337224514110403, "loss": 0.0065, "step": 5770 }, { "epoch": 1.18, "learning_rate": 0.00026335955094151865, "loss": 0.0178, "step": 5771 }, { "epoch": 1.18, "learning_rate": 0.00026334685484861477, "loss": 0.0252, "step": 5772 }, { "epoch": 1.18, "learning_rate": 0.0002633341568626044, "loss": 0.0215, "step": 5773 }, { "epoch": 1.18, "learning_rate": 0.0002633214569836997, "loss": 0.0247, "step": 5774 }, { "epoch": 1.18, "learning_rate": 0.0002633087552121128, "loss": 0.0515, "step": 5775 }, { "epoch": 1.18, "learning_rate": 0.00026329605154805575, "loss": 0.0032, "step": 5776 }, { "epoch": 1.18, "learning_rate": 0.00026328334599174085, "loss": 0.0063, "step": 5777 }, { "epoch": 1.18, "learning_rate": 0.00026327063854338014, "loss": 0.0192, "step": 5778 }, { "epoch": 1.18, "learning_rate": 0.000263257929203186, "loss": 0.0108, "step": 5779 }, { "epoch": 1.18, "learning_rate": 0.00026324521797137067, "loss": 0.0194, "step": 5780 }, { "epoch": 1.18, "learning_rate": 0.0002632325048481464, "loss": 0.0311, "step": 5781 }, { "epoch": 1.18, "learning_rate": 0.0002632197898337256, "loss": 0.0101, "step": 5782 }, { "epoch": 1.18, "learning_rate": 0.00026320707292832056, "loss": 0.0206, "step": 5783 }, { "epoch": 1.18, "learning_rate": 0.0002631943541321437, "loss": 0.0281, "step": 5784 }, { "epoch": 1.18, "learning_rate": 0.0002631816334454075, "loss": 0.0083, "step": 5785 }, { "epoch": 1.18, "learning_rate": 0.00026316891086832433, "loss": 0.0094, "step": 5786 }, { "epoch": 1.18, "learning_rate": 0.00026315618640110675, "loss": 0.0108, "step": 5787 }, { "epoch": 1.18, "learning_rate": 0.00026314346004396725, "loss": 0.0231, "step": 5788 }, { "epoch": 1.18, "learning_rate": 0.00026313073179711844, "loss": 0.0107, "step": 5789 }, { "epoch": 1.18, "learning_rate": 0.00026311800166077277, "loss": 0.0052, "step": 5790 }, { "epoch": 1.18, "learning_rate": 0.000263105269635143, "loss": 0.017, "step": 5791 }, { "epoch": 1.18, "learning_rate": 0.00026309253572044173, "loss": 0.017, "step": 5792 }, { "epoch": 1.18, "learning_rate": 0.00026307979991688164, "loss": 0.0259, "step": 5793 }, { "epoch": 1.18, "learning_rate": 0.0002630670622246754, "loss": 0.0112, "step": 5794 }, { "epoch": 1.18, "learning_rate": 0.0002630543226440358, "loss": 0.0089, "step": 5795 }, { "epoch": 1.18, "learning_rate": 0.00026304158117517563, "loss": 0.0195, "step": 5796 }, { "epoch": 1.18, "learning_rate": 0.0002630288378183077, "loss": 0.0098, "step": 5797 }, { "epoch": 1.18, "learning_rate": 0.0002630160925736448, "loss": 0.0206, "step": 5798 }, { "epoch": 1.18, "learning_rate": 0.00026300334544139976, "loss": 0.022, "step": 5799 }, { "epoch": 1.18, "learning_rate": 0.0002629905964217856, "loss": 0.04, "step": 5800 }, { "epoch": 1.18, "learning_rate": 0.00026297784551501517, "loss": 0.0213, "step": 5801 }, { "epoch": 1.18, "learning_rate": 0.0002629650927213015, "loss": 0.0334, "step": 5802 }, { "epoch": 1.18, "learning_rate": 0.0002629523380408575, "loss": 0.0144, "step": 5803 }, { "epoch": 1.18, "learning_rate": 0.0002629395814738963, "loss": 0.0031, "step": 5804 }, { "epoch": 1.18, "learning_rate": 0.00026292682302063084, "loss": 0.0199, "step": 5805 }, { "epoch": 1.18, "learning_rate": 0.0002629140626812743, "loss": 0.0218, "step": 5806 }, { "epoch": 1.18, "learning_rate": 0.0002629013004560398, "loss": 0.0092, "step": 5807 }, { "epoch": 1.18, "learning_rate": 0.0002628885363451404, "loss": 0.0261, "step": 5808 }, { "epoch": 1.18, "learning_rate": 0.0002628757703487894, "loss": 0.0097, "step": 5809 }, { "epoch": 1.18, "learning_rate": 0.00026286300246719995, "loss": 0.0097, "step": 5810 }, { "epoch": 1.18, "learning_rate": 0.0002628502327005853, "loss": 0.0276, "step": 5811 }, { "epoch": 1.18, "learning_rate": 0.0002628374610491588, "loss": 0.0042, "step": 5812 }, { "epoch": 1.18, "learning_rate": 0.0002628246875131336, "loss": 0.0064, "step": 5813 }, { "epoch": 1.18, "learning_rate": 0.00026281191209272324, "loss": 0.0075, "step": 5814 }, { "epoch": 1.18, "learning_rate": 0.00026279913478814096, "loss": 0.0121, "step": 5815 }, { "epoch": 1.18, "learning_rate": 0.0002627863555996002, "loss": 0.0239, "step": 5816 }, { "epoch": 1.18, "learning_rate": 0.00026277357452731445, "loss": 0.0312, "step": 5817 }, { "epoch": 1.18, "learning_rate": 0.0002627607915714971, "loss": 0.0126, "step": 5818 }, { "epoch": 1.18, "learning_rate": 0.00026274800673236167, "loss": 0.0255, "step": 5819 }, { "epoch": 1.19, "learning_rate": 0.0002627352200101217, "loss": 0.0118, "step": 5820 }, { "epoch": 1.19, "learning_rate": 0.0002627224314049908, "loss": 0.0235, "step": 5821 }, { "epoch": 1.19, "learning_rate": 0.00026270964091718247, "loss": 0.0388, "step": 5822 }, { "epoch": 1.19, "learning_rate": 0.00026269684854691034, "loss": 0.0043, "step": 5823 }, { "epoch": 1.19, "learning_rate": 0.00026268405429438817, "loss": 0.0116, "step": 5824 }, { "epoch": 1.19, "learning_rate": 0.00026267125815982963, "loss": 0.0189, "step": 5825 }, { "epoch": 1.19, "learning_rate": 0.00026265846014344833, "loss": 0.0109, "step": 5826 }, { "epoch": 1.19, "learning_rate": 0.0002626456602454581, "loss": 0.003, "step": 5827 }, { "epoch": 1.19, "learning_rate": 0.00026263285846607264, "loss": 0.0185, "step": 5828 }, { "epoch": 1.19, "learning_rate": 0.000262620054805506, "loss": 0.0095, "step": 5829 }, { "epoch": 1.19, "learning_rate": 0.00026260724926397176, "loss": 0.0025, "step": 5830 }, { "epoch": 1.19, "learning_rate": 0.00026259444184168385, "loss": 0.0211, "step": 5831 }, { "epoch": 1.19, "learning_rate": 0.0002625816325388563, "loss": 0.0126, "step": 5832 }, { "epoch": 1.19, "learning_rate": 0.00026256882135570293, "loss": 0.0187, "step": 5833 }, { "epoch": 1.19, "learning_rate": 0.0002625560082924378, "loss": 0.0048, "step": 5834 }, { "epoch": 1.19, "learning_rate": 0.0002625431933492748, "loss": 0.0022, "step": 5835 }, { "epoch": 1.19, "learning_rate": 0.00026253037652642806, "loss": 0.0023, "step": 5836 }, { "epoch": 1.19, "learning_rate": 0.00026251755782411164, "loss": 0.0044, "step": 5837 }, { "epoch": 1.19, "learning_rate": 0.00026250473724253963, "loss": 0.0158, "step": 5838 }, { "epoch": 1.19, "learning_rate": 0.0002624919147819261, "loss": 0.0096, "step": 5839 }, { "epoch": 1.19, "learning_rate": 0.0002624790904424853, "loss": 0.0204, "step": 5840 }, { "epoch": 1.19, "learning_rate": 0.0002624662642244313, "loss": 0.0111, "step": 5841 }, { "epoch": 1.19, "learning_rate": 0.0002624534361279784, "loss": 0.0054, "step": 5842 }, { "epoch": 1.19, "learning_rate": 0.0002624406061533409, "loss": 0.0033, "step": 5843 }, { "epoch": 1.19, "learning_rate": 0.000262427774300733, "loss": 0.0414, "step": 5844 }, { "epoch": 1.19, "learning_rate": 0.000262414940570369, "loss": 0.0247, "step": 5845 }, { "epoch": 1.19, "learning_rate": 0.0002624021049624634, "loss": 0.0242, "step": 5846 }, { "epoch": 1.19, "learning_rate": 0.00026238926747723044, "loss": 0.0075, "step": 5847 }, { "epoch": 1.19, "learning_rate": 0.0002623764281148845, "loss": 0.0197, "step": 5848 }, { "epoch": 1.19, "learning_rate": 0.0002623635868756401, "loss": 0.0124, "step": 5849 }, { "epoch": 1.19, "learning_rate": 0.00026235074375971176, "loss": 0.0033, "step": 5850 }, { "epoch": 1.19, "learning_rate": 0.00026233789876731385, "loss": 0.0252, "step": 5851 }, { "epoch": 1.19, "learning_rate": 0.000262325051898661, "loss": 0.0064, "step": 5852 }, { "epoch": 1.19, "learning_rate": 0.0002623122031539678, "loss": 0.0103, "step": 5853 }, { "epoch": 1.19, "learning_rate": 0.00026229935253344874, "loss": 0.0152, "step": 5854 }, { "epoch": 1.19, "learning_rate": 0.00026228650003731855, "loss": 0.0077, "step": 5855 }, { "epoch": 1.19, "learning_rate": 0.0002622736456657918, "loss": 0.03, "step": 5856 }, { "epoch": 1.19, "learning_rate": 0.0002622607894190833, "loss": 0.0127, "step": 5857 }, { "epoch": 1.19, "learning_rate": 0.0002622479312974077, "loss": 0.0318, "step": 5858 }, { "epoch": 1.19, "learning_rate": 0.00026223507130097975, "loss": 0.0111, "step": 5859 }, { "epoch": 1.19, "learning_rate": 0.00026222220943001424, "loss": 0.0057, "step": 5860 }, { "epoch": 1.19, "learning_rate": 0.000262209345684726, "loss": 0.0038, "step": 5861 }, { "epoch": 1.19, "learning_rate": 0.0002621964800653299, "loss": 0.004, "step": 5862 }, { "epoch": 1.19, "learning_rate": 0.0002621836125720408, "loss": 0.0132, "step": 5863 }, { "epoch": 1.19, "learning_rate": 0.0002621707432050736, "loss": 0.0083, "step": 5864 }, { "epoch": 1.19, "learning_rate": 0.00026215787196464323, "loss": 0.0219, "step": 5865 }, { "epoch": 1.19, "learning_rate": 0.00026214499885096474, "loss": 0.0089, "step": 5866 }, { "epoch": 1.19, "learning_rate": 0.000262132123864253, "loss": 0.0194, "step": 5867 }, { "epoch": 1.19, "learning_rate": 0.0002621192470047232, "loss": 0.0498, "step": 5868 }, { "epoch": 1.2, "learning_rate": 0.0002621063682725903, "loss": 0.0147, "step": 5869 }, { "epoch": 1.2, "learning_rate": 0.0002620934876680694, "loss": 0.0158, "step": 5870 }, { "epoch": 1.2, "learning_rate": 0.00026208060519137573, "loss": 0.0055, "step": 5871 }, { "epoch": 1.2, "learning_rate": 0.0002620677208427243, "loss": 0.0079, "step": 5872 }, { "epoch": 1.2, "learning_rate": 0.0002620548346223305, "loss": 0.0185, "step": 5873 }, { "epoch": 1.2, "learning_rate": 0.0002620419465304094, "loss": 0.0323, "step": 5874 }, { "epoch": 1.2, "learning_rate": 0.0002620290565671763, "loss": 0.0048, "step": 5875 }, { "epoch": 1.2, "learning_rate": 0.00026201616473284646, "loss": 0.0084, "step": 5876 }, { "epoch": 1.2, "learning_rate": 0.0002620032710276352, "loss": 0.0192, "step": 5877 }, { "epoch": 1.2, "learning_rate": 0.00026199037545175793, "loss": 0.0072, "step": 5878 }, { "epoch": 1.2, "learning_rate": 0.00026197747800543004, "loss": 0.0312, "step": 5879 }, { "epoch": 1.2, "learning_rate": 0.00026196457868886685, "loss": 0.0268, "step": 5880 }, { "epoch": 1.2, "learning_rate": 0.00026195167750228383, "loss": 0.0058, "step": 5881 }, { "epoch": 1.2, "learning_rate": 0.0002619387744458965, "loss": 0.0141, "step": 5882 }, { "epoch": 1.2, "learning_rate": 0.0002619258695199203, "loss": 0.0295, "step": 5883 }, { "epoch": 1.2, "learning_rate": 0.00026191296272457085, "loss": 0.034, "step": 5884 }, { "epoch": 1.2, "learning_rate": 0.00026190005406006363, "loss": 0.0162, "step": 5885 }, { "epoch": 1.2, "learning_rate": 0.0002618871435266143, "loss": 0.0077, "step": 5886 }, { "epoch": 1.2, "learning_rate": 0.0002618742311244385, "loss": 0.0068, "step": 5887 }, { "epoch": 1.2, "learning_rate": 0.00026186131685375185, "loss": 0.0431, "step": 5888 }, { "epoch": 1.2, "learning_rate": 0.00026184840071477, "loss": 0.0062, "step": 5889 }, { "epoch": 1.2, "learning_rate": 0.0002618354827077088, "loss": 0.0376, "step": 5890 }, { "epoch": 1.2, "learning_rate": 0.0002618225628327839, "loss": 0.0298, "step": 5891 }, { "epoch": 1.2, "learning_rate": 0.0002618096410902111, "loss": 0.0128, "step": 5892 }, { "epoch": 1.2, "learning_rate": 0.0002617967174802063, "loss": 0.0215, "step": 5893 }, { "epoch": 1.2, "learning_rate": 0.0002617837920029852, "loss": 0.0063, "step": 5894 }, { "epoch": 1.2, "learning_rate": 0.00026177086465876384, "loss": 0.0013, "step": 5895 }, { "epoch": 1.2, "learning_rate": 0.00026175793544775804, "loss": 0.0353, "step": 5896 }, { "epoch": 1.2, "learning_rate": 0.00026174500437018376, "loss": 0.019, "step": 5897 }, { "epoch": 1.2, "learning_rate": 0.000261732071426257, "loss": 0.0042, "step": 5898 }, { "epoch": 1.2, "learning_rate": 0.00026171913661619366, "loss": 0.0178, "step": 5899 }, { "epoch": 1.2, "learning_rate": 0.0002617061999402099, "loss": 0.0054, "step": 5900 }, { "epoch": 1.2, "learning_rate": 0.00026169326139852177, "loss": 0.0161, "step": 5901 }, { "epoch": 1.2, "learning_rate": 0.0002616803209913453, "loss": 0.026, "step": 5902 }, { "epoch": 1.2, "learning_rate": 0.00026166737871889667, "loss": 0.0102, "step": 5903 }, { "epoch": 1.2, "learning_rate": 0.000261654434581392, "loss": 0.0145, "step": 5904 }, { "epoch": 1.2, "learning_rate": 0.00026164148857904756, "loss": 0.0147, "step": 5905 }, { "epoch": 1.2, "learning_rate": 0.0002616285407120795, "loss": 0.033, "step": 5906 }, { "epoch": 1.2, "learning_rate": 0.0002616155909807041, "loss": 0.0122, "step": 5907 }, { "epoch": 1.2, "learning_rate": 0.0002616026393851376, "loss": 0.0141, "step": 5908 }, { "epoch": 1.2, "learning_rate": 0.0002615896859255964, "loss": 0.0089, "step": 5909 }, { "epoch": 1.2, "learning_rate": 0.00026157673060229683, "loss": 0.0195, "step": 5910 }, { "epoch": 1.2, "learning_rate": 0.0002615637734154552, "loss": 0.0231, "step": 5911 }, { "epoch": 1.2, "learning_rate": 0.000261550814365288, "loss": 0.0224, "step": 5912 }, { "epoch": 1.2, "learning_rate": 0.00026153785345201154, "loss": 0.0198, "step": 5913 }, { "epoch": 1.2, "learning_rate": 0.00026152489067584245, "loss": 0.0237, "step": 5914 }, { "epoch": 1.2, "learning_rate": 0.00026151192603699716, "loss": 0.0085, "step": 5915 }, { "epoch": 1.2, "learning_rate": 0.00026149895953569226, "loss": 0.0247, "step": 5916 }, { "epoch": 1.2, "learning_rate": 0.0002614859911721442, "loss": 0.0176, "step": 5917 }, { "epoch": 1.21, "learning_rate": 0.00026147302094656964, "loss": 0.0332, "step": 5918 }, { "epoch": 1.21, "learning_rate": 0.0002614600488591853, "loss": 0.0214, "step": 5919 }, { "epoch": 1.21, "learning_rate": 0.0002614470749102077, "loss": 0.0095, "step": 5920 }, { "epoch": 1.21, "learning_rate": 0.00026143409909985354, "loss": 0.0227, "step": 5921 }, { "epoch": 1.21, "learning_rate": 0.0002614211214283396, "loss": 0.0192, "step": 5922 }, { "epoch": 1.21, "learning_rate": 0.0002614081418958826, "loss": 0.036, "step": 5923 }, { "epoch": 1.21, "learning_rate": 0.0002613951605026994, "loss": 0.0277, "step": 5924 }, { "epoch": 1.21, "learning_rate": 0.00026138217724900665, "loss": 0.0283, "step": 5925 }, { "epoch": 1.21, "learning_rate": 0.00026136919213502134, "loss": 0.0236, "step": 5926 }, { "epoch": 1.21, "learning_rate": 0.0002613562051609603, "loss": 0.022, "step": 5927 }, { "epoch": 1.21, "learning_rate": 0.0002613432163270404, "loss": 0.0243, "step": 5928 }, { "epoch": 1.21, "learning_rate": 0.00026133022563347864, "loss": 0.0147, "step": 5929 }, { "epoch": 1.21, "learning_rate": 0.000261317233080492, "loss": 0.0112, "step": 5930 }, { "epoch": 1.21, "learning_rate": 0.0002613042386682974, "loss": 0.0061, "step": 5931 }, { "epoch": 1.21, "learning_rate": 0.00026129124239711185, "loss": 0.0123, "step": 5932 }, { "epoch": 1.21, "learning_rate": 0.00026127824426715255, "loss": 0.011, "step": 5933 }, { "epoch": 1.21, "learning_rate": 0.0002612652442786365, "loss": 0.021, "step": 5934 }, { "epoch": 1.21, "learning_rate": 0.0002612522424317808, "loss": 0.0078, "step": 5935 }, { "epoch": 1.21, "learning_rate": 0.0002612392387268028, "loss": 0.0269, "step": 5936 }, { "epoch": 1.21, "learning_rate": 0.0002612262331639194, "loss": 0.0064, "step": 5937 }, { "epoch": 1.21, "learning_rate": 0.00026121322574334795, "loss": 0.0063, "step": 5938 }, { "epoch": 1.21, "learning_rate": 0.00026120021646530576, "loss": 0.0086, "step": 5939 }, { "epoch": 1.21, "learning_rate": 0.00026118720533001, "loss": 0.0076, "step": 5940 }, { "epoch": 1.21, "learning_rate": 0.00026117419233767804, "loss": 0.0048, "step": 5941 }, { "epoch": 1.21, "learning_rate": 0.00026116117748852723, "loss": 0.008, "step": 5942 }, { "epoch": 1.21, "learning_rate": 0.00026114816078277495, "loss": 0.0105, "step": 5943 }, { "epoch": 1.21, "learning_rate": 0.00026113514222063854, "loss": 0.0137, "step": 5944 }, { "epoch": 1.21, "learning_rate": 0.00026112212180233544, "loss": 0.0064, "step": 5945 }, { "epoch": 1.21, "learning_rate": 0.0002611090995280832, "loss": 0.0202, "step": 5946 }, { "epoch": 1.21, "learning_rate": 0.00026109607539809927, "loss": 0.0082, "step": 5947 }, { "epoch": 1.21, "learning_rate": 0.0002610830494126012, "loss": 0.0191, "step": 5948 }, { "epoch": 1.21, "learning_rate": 0.0002610700215718064, "loss": 0.021, "step": 5949 }, { "epoch": 1.21, "learning_rate": 0.00026105699187593264, "loss": 0.0113, "step": 5950 }, { "epoch": 1.21, "learning_rate": 0.00026104396032519754, "loss": 0.0089, "step": 5951 }, { "epoch": 1.21, "learning_rate": 0.00026103092691981866, "loss": 0.0092, "step": 5952 }, { "epoch": 1.21, "learning_rate": 0.00026101789166001367, "loss": 0.0048, "step": 5953 }, { "epoch": 1.21, "learning_rate": 0.0002610048545460004, "loss": 0.0227, "step": 5954 }, { "epoch": 1.21, "learning_rate": 0.00026099181557799644, "loss": 0.003, "step": 5955 }, { "epoch": 1.21, "learning_rate": 0.0002609787747562197, "loss": 0.001, "step": 5956 }, { "epoch": 1.21, "learning_rate": 0.00026096573208088793, "loss": 0.0031, "step": 5957 }, { "epoch": 1.21, "learning_rate": 0.00026095268755221894, "loss": 0.0202, "step": 5958 }, { "epoch": 1.21, "learning_rate": 0.0002609396411704307, "loss": 0.0015, "step": 5959 }, { "epoch": 1.21, "learning_rate": 0.00026092659293574095, "loss": 0.0123, "step": 5960 }, { "epoch": 1.21, "learning_rate": 0.00026091354284836775, "loss": 0.0094, "step": 5961 }, { "epoch": 1.21, "learning_rate": 0.00026090049090852905, "loss": 0.0237, "step": 5962 }, { "epoch": 1.21, "learning_rate": 0.00026088743711644277, "loss": 0.0243, "step": 5963 }, { "epoch": 1.21, "learning_rate": 0.000260874381472327, "loss": 0.0308, "step": 5964 }, { "epoch": 1.21, "learning_rate": 0.0002608613239763997, "loss": 0.0363, "step": 5965 }, { "epoch": 1.21, "learning_rate": 0.00026084826462887913, "loss": 0.0168, "step": 5966 }, { "epoch": 1.21, "learning_rate": 0.00026083520342998326, "loss": 0.0034, "step": 5967 }, { "epoch": 1.22, "learning_rate": 0.0002608221403799303, "loss": 0.015, "step": 5968 }, { "epoch": 1.22, "learning_rate": 0.00026080907547893834, "loss": 0.0114, "step": 5969 }, { "epoch": 1.22, "learning_rate": 0.0002607960087272257, "loss": 0.0118, "step": 5970 }, { "epoch": 1.22, "learning_rate": 0.00026078294012501054, "loss": 0.0082, "step": 5971 }, { "epoch": 1.22, "learning_rate": 0.00026076986967251125, "loss": 0.0275, "step": 5972 }, { "epoch": 1.22, "learning_rate": 0.00026075679736994596, "loss": 0.0161, "step": 5973 }, { "epoch": 1.22, "learning_rate": 0.0002607437232175331, "loss": 0.0182, "step": 5974 }, { "epoch": 1.22, "learning_rate": 0.000260730647215491, "loss": 0.0111, "step": 5975 }, { "epoch": 1.22, "learning_rate": 0.00026071756936403806, "loss": 0.0138, "step": 5976 }, { "epoch": 1.22, "learning_rate": 0.0002607044896633928, "loss": 0.0072, "step": 5977 }, { "epoch": 1.22, "learning_rate": 0.00026069140811377353, "loss": 0.0148, "step": 5978 }, { "epoch": 1.22, "learning_rate": 0.0002606783247153988, "loss": 0.0269, "step": 5979 }, { "epoch": 1.22, "learning_rate": 0.0002606652394684871, "loss": 0.0131, "step": 5980 }, { "epoch": 1.22, "learning_rate": 0.0002606521523732571, "loss": 0.0516, "step": 5981 }, { "epoch": 1.22, "learning_rate": 0.00026063906342992723, "loss": 0.0468, "step": 5982 }, { "epoch": 1.22, "learning_rate": 0.0002606259726387161, "loss": 0.0375, "step": 5983 }, { "epoch": 1.22, "learning_rate": 0.00026061287999984255, "loss": 0.0159, "step": 5984 }, { "epoch": 1.22, "learning_rate": 0.00026059978551352497, "loss": 0.0133, "step": 5985 }, { "epoch": 1.22, "learning_rate": 0.0002605866891799822, "loss": 0.0077, "step": 5986 }, { "epoch": 1.22, "learning_rate": 0.0002605735909994331, "loss": 0.0114, "step": 5987 }, { "epoch": 1.22, "learning_rate": 0.0002605604909720962, "loss": 0.0239, "step": 5988 }, { "epoch": 1.22, "learning_rate": 0.00026054738909819043, "loss": 0.0111, "step": 5989 }, { "epoch": 1.22, "learning_rate": 0.0002605342853779346, "loss": 0.0163, "step": 5990 }, { "epoch": 1.22, "learning_rate": 0.00026052117981154754, "loss": 0.0166, "step": 5991 }, { "epoch": 1.22, "learning_rate": 0.00026050807239924817, "loss": 0.014, "step": 5992 }, { "epoch": 1.22, "learning_rate": 0.0002604949631412554, "loss": 0.0265, "step": 5993 }, { "epoch": 1.22, "learning_rate": 0.0002604818520377881, "loss": 0.0072, "step": 5994 }, { "epoch": 1.22, "learning_rate": 0.0002604687390890654, "loss": 0.0118, "step": 5995 }, { "epoch": 1.22, "learning_rate": 0.00026045562429530625, "loss": 0.0123, "step": 5996 }, { "epoch": 1.22, "learning_rate": 0.0002604425076567296, "loss": 0.0209, "step": 5997 }, { "epoch": 1.22, "learning_rate": 0.00026042938917355467, "loss": 0.0188, "step": 5998 }, { "epoch": 1.22, "learning_rate": 0.0002604162688460004, "loss": 0.0295, "step": 5999 }, { "epoch": 1.22, "learning_rate": 0.0002604031466742861, "loss": 0.0181, "step": 6000 }, { "epoch": 1.22, "learning_rate": 0.00026039002265863077, "loss": 0.0154, "step": 6001 }, { "epoch": 1.22, "learning_rate": 0.0002603768967992537, "loss": 0.0432, "step": 6002 }, { "epoch": 1.22, "learning_rate": 0.0002603637690963742, "loss": 0.0156, "step": 6003 }, { "epoch": 1.22, "learning_rate": 0.00026035063955021136, "loss": 0.0377, "step": 6004 }, { "epoch": 1.22, "learning_rate": 0.00026033750816098456, "loss": 0.0182, "step": 6005 }, { "epoch": 1.22, "learning_rate": 0.00026032437492891304, "loss": 0.0059, "step": 6006 }, { "epoch": 1.22, "learning_rate": 0.00026031123985421624, "loss": 0.0138, "step": 6007 }, { "epoch": 1.22, "learning_rate": 0.0002602981029371135, "loss": 0.0257, "step": 6008 }, { "epoch": 1.22, "learning_rate": 0.0002602849641778243, "loss": 0.0088, "step": 6009 }, { "epoch": 1.22, "learning_rate": 0.00026027182357656796, "loss": 0.0176, "step": 6010 }, { "epoch": 1.22, "learning_rate": 0.000260258681133564, "loss": 0.0182, "step": 6011 }, { "epoch": 1.22, "learning_rate": 0.00026024553684903196, "loss": 0.0086, "step": 6012 }, { "epoch": 1.22, "learning_rate": 0.0002602323907231914, "loss": 0.0116, "step": 6013 }, { "epoch": 1.22, "learning_rate": 0.00026021924275626177, "loss": 0.0043, "step": 6014 }, { "epoch": 1.22, "learning_rate": 0.00026020609294846275, "loss": 0.0158, "step": 6015 }, { "epoch": 1.22, "learning_rate": 0.0002601929413000139, "loss": 0.0119, "step": 6016 }, { "epoch": 1.23, "learning_rate": 0.00026017978781113504, "loss": 0.0041, "step": 6017 }, { "epoch": 1.23, "learning_rate": 0.0002601666324820457, "loss": 0.0092, "step": 6018 }, { "epoch": 1.23, "learning_rate": 0.0002601534753129656, "loss": 0.016, "step": 6019 }, { "epoch": 1.23, "learning_rate": 0.00026014031630411453, "loss": 0.0083, "step": 6020 }, { "epoch": 1.23, "learning_rate": 0.00026012715545571235, "loss": 0.0054, "step": 6021 }, { "epoch": 1.23, "learning_rate": 0.0002601139927679787, "loss": 0.0391, "step": 6022 }, { "epoch": 1.23, "learning_rate": 0.0002601008282411336, "loss": 0.0028, "step": 6023 }, { "epoch": 1.23, "learning_rate": 0.00026008766187539677, "loss": 0.0067, "step": 6024 }, { "epoch": 1.23, "learning_rate": 0.0002600744936709882, "loss": 0.0128, "step": 6025 }, { "epoch": 1.23, "learning_rate": 0.00026006132362812784, "loss": 0.0292, "step": 6026 }, { "epoch": 1.23, "learning_rate": 0.0002600481517470356, "loss": 0.0112, "step": 6027 }, { "epoch": 1.23, "learning_rate": 0.00026003497802793145, "loss": 0.0028, "step": 6028 }, { "epoch": 1.23, "learning_rate": 0.00026002180247103557, "loss": 0.0323, "step": 6029 }, { "epoch": 1.23, "learning_rate": 0.0002600086250765678, "loss": 0.0109, "step": 6030 }, { "epoch": 1.23, "learning_rate": 0.0002599954458447484, "loss": 0.0329, "step": 6031 }, { "epoch": 1.23, "learning_rate": 0.00025998226477579734, "loss": 0.0137, "step": 6032 }, { "epoch": 1.23, "learning_rate": 0.00025996908186993496, "loss": 0.0148, "step": 6033 }, { "epoch": 1.23, "learning_rate": 0.00025995589712738125, "loss": 0.0051, "step": 6034 }, { "epoch": 1.23, "learning_rate": 0.0002599427105483566, "loss": 0.005, "step": 6035 }, { "epoch": 1.23, "learning_rate": 0.000259929522133081, "loss": 0.0147, "step": 6036 }, { "epoch": 1.23, "learning_rate": 0.000259916331881775, "loss": 0.0196, "step": 6037 }, { "epoch": 1.23, "learning_rate": 0.0002599031397946587, "loss": 0.0298, "step": 6038 }, { "epoch": 1.23, "learning_rate": 0.0002598899458719526, "loss": 0.0146, "step": 6039 }, { "epoch": 1.23, "learning_rate": 0.00025987675011387686, "loss": 0.0102, "step": 6040 }, { "epoch": 1.23, "learning_rate": 0.00025986355252065205, "loss": 0.0122, "step": 6041 }, { "epoch": 1.23, "learning_rate": 0.0002598503530924986, "loss": 0.012, "step": 6042 }, { "epoch": 1.23, "learning_rate": 0.00025983715182963677, "loss": 0.0153, "step": 6043 }, { "epoch": 1.23, "learning_rate": 0.00025982394873228724, "loss": 0.0173, "step": 6044 }, { "epoch": 1.23, "learning_rate": 0.0002598107438006704, "loss": 0.0195, "step": 6045 }, { "epoch": 1.23, "learning_rate": 0.00025979753703500694, "loss": 0.0158, "step": 6046 }, { "epoch": 1.23, "learning_rate": 0.00025978432843551727, "loss": 0.0076, "step": 6047 }, { "epoch": 1.23, "learning_rate": 0.00025977111800242213, "loss": 0.0238, "step": 6048 }, { "epoch": 1.23, "learning_rate": 0.0002597579057359421, "loss": 0.0113, "step": 6049 }, { "epoch": 1.23, "learning_rate": 0.0002597446916362979, "loss": 0.0251, "step": 6050 }, { "epoch": 1.23, "learning_rate": 0.00025973147570371017, "loss": 0.0068, "step": 6051 }, { "epoch": 1.23, "learning_rate": 0.0002597182579383996, "loss": 0.014, "step": 6052 }, { "epoch": 1.23, "learning_rate": 0.0002597050383405871, "loss": 0.0114, "step": 6053 }, { "epoch": 1.23, "learning_rate": 0.00025969181691049334, "loss": 0.0113, "step": 6054 }, { "epoch": 1.23, "learning_rate": 0.00025967859364833915, "loss": 0.0258, "step": 6055 }, { "epoch": 1.23, "learning_rate": 0.0002596653685543455, "loss": 0.0241, "step": 6056 }, { "epoch": 1.23, "learning_rate": 0.00025965214162873313, "loss": 0.0399, "step": 6057 }, { "epoch": 1.23, "learning_rate": 0.00025963891287172295, "loss": 0.0109, "step": 6058 }, { "epoch": 1.23, "learning_rate": 0.0002596256822835361, "loss": 0.0118, "step": 6059 }, { "epoch": 1.23, "learning_rate": 0.0002596124498643933, "loss": 0.0065, "step": 6060 }, { "epoch": 1.23, "learning_rate": 0.0002595992156145157, "loss": 0.0053, "step": 6061 }, { "epoch": 1.23, "learning_rate": 0.0002595859795341244, "loss": 0.009, "step": 6062 }, { "epoch": 1.23, "learning_rate": 0.00025957274162344035, "loss": 0.0197, "step": 6063 }, { "epoch": 1.23, "learning_rate": 0.00025955950188268464, "loss": 0.0175, "step": 6064 }, { "epoch": 1.23, "learning_rate": 0.00025954626031207846, "loss": 0.0049, "step": 6065 }, { "epoch": 1.24, "learning_rate": 0.00025953301691184296, "loss": 0.0215, "step": 6066 }, { "epoch": 1.24, "learning_rate": 0.0002595197716821993, "loss": 0.0043, "step": 6067 }, { "epoch": 1.24, "learning_rate": 0.0002595065246233688, "loss": 0.0067, "step": 6068 }, { "epoch": 1.24, "learning_rate": 0.0002594932757355725, "loss": 0.0101, "step": 6069 }, { "epoch": 1.24, "learning_rate": 0.0002594800250190319, "loss": 0.0341, "step": 6070 }, { "epoch": 1.24, "learning_rate": 0.00025946677247396817, "loss": 0.0197, "step": 6071 }, { "epoch": 1.24, "learning_rate": 0.00025945351810060277, "loss": 0.0151, "step": 6072 }, { "epoch": 1.24, "learning_rate": 0.0002594402618991569, "loss": 0.0059, "step": 6073 }, { "epoch": 1.24, "learning_rate": 0.0002594270038698522, "loss": 0.0206, "step": 6074 }, { "epoch": 1.24, "learning_rate": 0.00025941374401290993, "loss": 0.0019, "step": 6075 }, { "epoch": 1.24, "learning_rate": 0.00025940048232855163, "loss": 0.0136, "step": 6076 }, { "epoch": 1.24, "learning_rate": 0.0002593872188169987, "loss": 0.0397, "step": 6077 }, { "epoch": 1.24, "learning_rate": 0.0002593739534784728, "loss": 0.0082, "step": 6078 }, { "epoch": 1.24, "learning_rate": 0.00025936068631319533, "loss": 0.0085, "step": 6079 }, { "epoch": 1.24, "learning_rate": 0.000259347417321388, "loss": 0.0423, "step": 6080 }, { "epoch": 1.24, "learning_rate": 0.00025933414650327247, "loss": 0.0178, "step": 6081 }, { "epoch": 1.24, "learning_rate": 0.00025932087385907023, "loss": 0.0066, "step": 6082 }, { "epoch": 1.24, "learning_rate": 0.0002593075993890031, "loss": 0.0276, "step": 6083 }, { "epoch": 1.24, "learning_rate": 0.00025929432309329265, "loss": 0.0066, "step": 6084 }, { "epoch": 1.24, "learning_rate": 0.00025928104497216075, "loss": 0.003, "step": 6085 }, { "epoch": 1.24, "learning_rate": 0.0002592677650258291, "loss": 0.0091, "step": 6086 }, { "epoch": 1.24, "learning_rate": 0.0002592544832545195, "loss": 0.0295, "step": 6087 }, { "epoch": 1.24, "learning_rate": 0.00025924119965845384, "loss": 0.0386, "step": 6088 }, { "epoch": 1.24, "learning_rate": 0.00025922791423785394, "loss": 0.0078, "step": 6089 }, { "epoch": 1.24, "learning_rate": 0.0002592146269929417, "loss": 0.0011, "step": 6090 }, { "epoch": 1.24, "learning_rate": 0.00025920133792393897, "loss": 0.0055, "step": 6091 }, { "epoch": 1.24, "learning_rate": 0.0002591880470310678, "loss": 0.0236, "step": 6092 }, { "epoch": 1.24, "learning_rate": 0.00025917475431455015, "loss": 0.0208, "step": 6093 }, { "epoch": 1.24, "learning_rate": 0.000259161459774608, "loss": 0.0202, "step": 6094 }, { "epoch": 1.24, "learning_rate": 0.00025914816341146335, "loss": 0.0115, "step": 6095 }, { "epoch": 1.24, "learning_rate": 0.0002591348652253384, "loss": 0.022, "step": 6096 }, { "epoch": 1.24, "learning_rate": 0.00025912156521645525, "loss": 0.0161, "step": 6097 }, { "epoch": 1.24, "learning_rate": 0.0002591082633850359, "loss": 0.0149, "step": 6098 }, { "epoch": 1.24, "learning_rate": 0.0002590949597313027, "loss": 0.0246, "step": 6099 }, { "epoch": 1.24, "learning_rate": 0.00025908165425547763, "loss": 0.0069, "step": 6100 }, { "epoch": 1.24, "learning_rate": 0.000259068346957783, "loss": 0.0055, "step": 6101 }, { "epoch": 1.24, "learning_rate": 0.0002590550378384412, "loss": 0.0023, "step": 6102 }, { "epoch": 1.24, "learning_rate": 0.0002590417268976743, "loss": 0.0101, "step": 6103 }, { "epoch": 1.24, "learning_rate": 0.00025902841413570486, "loss": 0.0132, "step": 6104 }, { "epoch": 1.24, "learning_rate": 0.000259015099552755, "loss": 0.0069, "step": 6105 }, { "epoch": 1.24, "learning_rate": 0.00025900178314904726, "loss": 0.0324, "step": 6106 }, { "epoch": 1.24, "learning_rate": 0.000258988464924804, "loss": 0.0258, "step": 6107 }, { "epoch": 1.24, "learning_rate": 0.0002589751448802476, "loss": 0.092, "step": 6108 }, { "epoch": 1.24, "learning_rate": 0.0002589618230156006, "loss": 0.0247, "step": 6109 }, { "epoch": 1.24, "learning_rate": 0.00025894849933108543, "loss": 0.0127, "step": 6110 }, { "epoch": 1.24, "learning_rate": 0.0002589351738269247, "loss": 0.0019, "step": 6111 }, { "epoch": 1.24, "learning_rate": 0.00025892184650334096, "loss": 0.0249, "step": 6112 }, { "epoch": 1.24, "learning_rate": 0.0002589085173605567, "loss": 0.0214, "step": 6113 }, { "epoch": 1.24, "learning_rate": 0.00025889518639879465, "loss": 0.0068, "step": 6114 }, { "epoch": 1.25, "learning_rate": 0.0002588818536182775, "loss": 0.0103, "step": 6115 }, { "epoch": 1.25, "learning_rate": 0.0002588685190192278, "loss": 0.0087, "step": 6116 }, { "epoch": 1.25, "learning_rate": 0.00025885518260186836, "loss": 0.0153, "step": 6117 }, { "epoch": 1.25, "learning_rate": 0.0002588418443664219, "loss": 0.0238, "step": 6118 }, { "epoch": 1.25, "learning_rate": 0.00025882850431311114, "loss": 0.024, "step": 6119 }, { "epoch": 1.25, "learning_rate": 0.0002588151624421589, "loss": 0.0026, "step": 6120 }, { "epoch": 1.25, "learning_rate": 0.00025880181875378815, "loss": 0.0145, "step": 6121 }, { "epoch": 1.25, "learning_rate": 0.00025878847324822157, "loss": 0.0037, "step": 6122 }, { "epoch": 1.25, "learning_rate": 0.0002587751259256822, "loss": 0.0036, "step": 6123 }, { "epoch": 1.25, "learning_rate": 0.0002587617767863929, "loss": 0.0066, "step": 6124 }, { "epoch": 1.25, "learning_rate": 0.0002587484258305766, "loss": 0.0142, "step": 6125 }, { "epoch": 1.25, "learning_rate": 0.00025873507305845627, "loss": 0.0183, "step": 6126 }, { "epoch": 1.25, "learning_rate": 0.000258721718470255, "loss": 0.0363, "step": 6127 }, { "epoch": 1.25, "learning_rate": 0.0002587083620661958, "loss": 0.0105, "step": 6128 }, { "epoch": 1.25, "learning_rate": 0.00025869500384650176, "loss": 0.0067, "step": 6129 }, { "epoch": 1.25, "learning_rate": 0.00025868164381139593, "loss": 0.0175, "step": 6130 }, { "epoch": 1.25, "learning_rate": 0.00025866828196110153, "loss": 0.0037, "step": 6131 }, { "epoch": 1.25, "learning_rate": 0.00025865491829584175, "loss": 0.0051, "step": 6132 }, { "epoch": 1.25, "learning_rate": 0.00025864155281583965, "loss": 0.0121, "step": 6133 }, { "epoch": 1.25, "learning_rate": 0.0002586281855213186, "loss": 0.0207, "step": 6134 }, { "epoch": 1.25, "learning_rate": 0.0002586148164125018, "loss": 0.0174, "step": 6135 }, { "epoch": 1.25, "learning_rate": 0.0002586014454896125, "loss": 0.0242, "step": 6136 }, { "epoch": 1.25, "learning_rate": 0.00025858807275287406, "loss": 0.0171, "step": 6137 }, { "epoch": 1.25, "learning_rate": 0.0002585746982025098, "loss": 0.0312, "step": 6138 }, { "epoch": 1.25, "learning_rate": 0.0002585613218387433, "loss": 0.0328, "step": 6139 }, { "epoch": 1.25, "learning_rate": 0.0002585479436617976, "loss": 0.0136, "step": 6140 }, { "epoch": 1.25, "learning_rate": 0.0002585345636718965, "loss": 0.0038, "step": 6141 }, { "epoch": 1.25, "learning_rate": 0.0002585211818692632, "loss": 0.0088, "step": 6142 }, { "epoch": 1.25, "learning_rate": 0.0002585077982541214, "loss": 0.0073, "step": 6143 }, { "epoch": 1.25, "learning_rate": 0.0002584944128266945, "loss": 0.0106, "step": 6144 }, { "epoch": 1.25, "learning_rate": 0.0002584810255872061, "loss": 0.0082, "step": 6145 }, { "epoch": 1.25, "learning_rate": 0.0002584676365358798, "loss": 0.0105, "step": 6146 }, { "epoch": 1.25, "learning_rate": 0.0002584542456729392, "loss": 0.0097, "step": 6147 }, { "epoch": 1.25, "learning_rate": 0.000258440852998608, "loss": 0.0106, "step": 6148 }, { "epoch": 1.25, "learning_rate": 0.0002584274585131099, "loss": 0.0072, "step": 6149 }, { "epoch": 1.25, "learning_rate": 0.00025841406221666855, "loss": 0.005, "step": 6150 }, { "epoch": 1.25, "learning_rate": 0.00025840066410950767, "loss": 0.0088, "step": 6151 }, { "epoch": 1.25, "learning_rate": 0.0002583872641918511, "loss": 0.0038, "step": 6152 }, { "epoch": 1.25, "learning_rate": 0.00025837386246392265, "loss": 0.0168, "step": 6153 }, { "epoch": 1.25, "learning_rate": 0.00025836045892594614, "loss": 0.0074, "step": 6154 }, { "epoch": 1.25, "learning_rate": 0.0002583470535781454, "loss": 0.0062, "step": 6155 }, { "epoch": 1.25, "learning_rate": 0.0002583336464207443, "loss": 0.0126, "step": 6156 }, { "epoch": 1.25, "learning_rate": 0.00025832023745396684, "loss": 0.0288, "step": 6157 }, { "epoch": 1.25, "learning_rate": 0.000258306826678037, "loss": 0.0119, "step": 6158 }, { "epoch": 1.25, "learning_rate": 0.0002582934140931786, "loss": 0.0077, "step": 6159 }, { "epoch": 1.25, "learning_rate": 0.0002582799996996159, "loss": 0.0126, "step": 6160 }, { "epoch": 1.25, "learning_rate": 0.00025826658349757274, "loss": 0.0024, "step": 6161 }, { "epoch": 1.25, "learning_rate": 0.00025825316548727325, "loss": 0.0081, "step": 6162 }, { "epoch": 1.25, "learning_rate": 0.0002582397456689416, "loss": 0.0198, "step": 6163 }, { "epoch": 1.26, "learning_rate": 0.00025822632404280183, "loss": 0.0232, "step": 6164 }, { "epoch": 1.26, "learning_rate": 0.00025821290060907816, "loss": 0.008, "step": 6165 }, { "epoch": 1.26, "learning_rate": 0.00025819947536799483, "loss": 0.0215, "step": 6166 }, { "epoch": 1.26, "learning_rate": 0.000258186048319776, "loss": 0.039, "step": 6167 }, { "epoch": 1.26, "learning_rate": 0.0002581726194646459, "loss": 0.0234, "step": 6168 }, { "epoch": 1.26, "learning_rate": 0.00025815918880282894, "loss": 0.0342, "step": 6169 }, { "epoch": 1.26, "learning_rate": 0.00025814575633454934, "loss": 0.0039, "step": 6170 }, { "epoch": 1.26, "learning_rate": 0.0002581323220600314, "loss": 0.0054, "step": 6171 }, { "epoch": 1.26, "learning_rate": 0.00025811888597949967, "loss": 0.0112, "step": 6172 }, { "epoch": 1.26, "learning_rate": 0.00025810544809317846, "loss": 0.004, "step": 6173 }, { "epoch": 1.26, "learning_rate": 0.00025809200840129216, "loss": 0.0166, "step": 6174 }, { "epoch": 1.26, "learning_rate": 0.00025807856690406527, "loss": 0.015, "step": 6175 }, { "epoch": 1.26, "learning_rate": 0.0002580651236017223, "loss": 0.0024, "step": 6176 }, { "epoch": 1.26, "learning_rate": 0.0002580516784944878, "loss": 0.0294, "step": 6177 }, { "epoch": 1.26, "learning_rate": 0.00025803823158258626, "loss": 0.0074, "step": 6178 }, { "epoch": 1.26, "learning_rate": 0.00025802478286624235, "loss": 0.0212, "step": 6179 }, { "epoch": 1.26, "learning_rate": 0.00025801133234568065, "loss": 0.0236, "step": 6180 }, { "epoch": 1.26, "learning_rate": 0.00025799788002112584, "loss": 0.0065, "step": 6181 }, { "epoch": 1.26, "learning_rate": 0.0002579844258928025, "loss": 0.0316, "step": 6182 }, { "epoch": 1.26, "learning_rate": 0.0002579709699609355, "loss": 0.0251, "step": 6183 }, { "epoch": 1.26, "learning_rate": 0.00025795751222574946, "loss": 0.0188, "step": 6184 }, { "epoch": 1.26, "learning_rate": 0.00025794405268746916, "loss": 0.045, "step": 6185 }, { "epoch": 1.26, "learning_rate": 0.0002579305913463195, "loss": 0.0093, "step": 6186 }, { "epoch": 1.26, "learning_rate": 0.0002579171282025251, "loss": 0.0268, "step": 6187 }, { "epoch": 1.26, "learning_rate": 0.00025790366325631107, "loss": 0.0144, "step": 6188 }, { "epoch": 1.26, "learning_rate": 0.0002578901965079021, "loss": 0.01, "step": 6189 }, { "epoch": 1.26, "learning_rate": 0.00025787672795752324, "loss": 0.0072, "step": 6190 }, { "epoch": 1.26, "learning_rate": 0.0002578632576053994, "loss": 0.018, "step": 6191 }, { "epoch": 1.26, "learning_rate": 0.0002578497854517555, "loss": 0.0109, "step": 6192 }, { "epoch": 1.26, "learning_rate": 0.0002578363114968166, "loss": 0.008, "step": 6193 }, { "epoch": 1.26, "learning_rate": 0.0002578228357408078, "loss": 0.0196, "step": 6194 }, { "epoch": 1.26, "learning_rate": 0.000257809358183954, "loss": 0.0114, "step": 6195 }, { "epoch": 1.26, "learning_rate": 0.00025779587882648056, "loss": 0.0102, "step": 6196 }, { "epoch": 1.26, "learning_rate": 0.0002577823976686124, "loss": 0.012, "step": 6197 }, { "epoch": 1.26, "learning_rate": 0.00025776891471057477, "loss": 0.0093, "step": 6198 }, { "epoch": 1.26, "learning_rate": 0.0002577554299525928, "loss": 0.0123, "step": 6199 }, { "epoch": 1.26, "learning_rate": 0.0002577419433948918, "loss": 0.009, "step": 6200 }, { "epoch": 1.26, "learning_rate": 0.0002577284550376969, "loss": 0.0129, "step": 6201 }, { "epoch": 1.26, "learning_rate": 0.0002577149648812335, "loss": 0.0152, "step": 6202 }, { "epoch": 1.26, "learning_rate": 0.00025770147292572684, "loss": 0.0137, "step": 6203 }, { "epoch": 1.26, "learning_rate": 0.00025768797917140226, "loss": 0.019, "step": 6204 }, { "epoch": 1.26, "learning_rate": 0.0002576744836184851, "loss": 0.024, "step": 6205 }, { "epoch": 1.26, "learning_rate": 0.00025766098626720093, "loss": 0.0058, "step": 6206 }, { "epoch": 1.26, "learning_rate": 0.000257647487117775, "loss": 0.0087, "step": 6207 }, { "epoch": 1.26, "learning_rate": 0.0002576339861704329, "loss": 0.0144, "step": 6208 }, { "epoch": 1.26, "learning_rate": 0.0002576204834254, "loss": 0.0274, "step": 6209 }, { "epoch": 1.26, "learning_rate": 0.0002576069788829019, "loss": 0.0218, "step": 6210 }, { "epoch": 1.26, "learning_rate": 0.00025759347254316413, "loss": 0.0076, "step": 6211 }, { "epoch": 1.26, "learning_rate": 0.00025757996440641223, "loss": 0.0102, "step": 6212 }, { "epoch": 1.27, "learning_rate": 0.0002575664544728719, "loss": 0.0146, "step": 6213 }, { "epoch": 1.27, "learning_rate": 0.0002575529427427687, "loss": 0.0133, "step": 6214 }, { "epoch": 1.27, "learning_rate": 0.0002575394292163284, "loss": 0.0168, "step": 6215 }, { "epoch": 1.27, "learning_rate": 0.00025752591389377656, "loss": 0.0221, "step": 6216 }, { "epoch": 1.27, "learning_rate": 0.00025751239677533904, "loss": 0.0147, "step": 6217 }, { "epoch": 1.27, "learning_rate": 0.00025749887786124154, "loss": 0.0072, "step": 6218 }, { "epoch": 1.27, "learning_rate": 0.00025748535715170985, "loss": 0.0052, "step": 6219 }, { "epoch": 1.27, "learning_rate": 0.0002574718346469698, "loss": 0.0072, "step": 6220 }, { "epoch": 1.27, "learning_rate": 0.0002574583103472472, "loss": 0.0051, "step": 6221 }, { "epoch": 1.27, "learning_rate": 0.0002574447842527681, "loss": 0.0042, "step": 6222 }, { "epoch": 1.27, "learning_rate": 0.00025743125636375815, "loss": 0.0154, "step": 6223 }, { "epoch": 1.27, "learning_rate": 0.00025741772668044354, "loss": 0.0238, "step": 6224 }, { "epoch": 1.27, "learning_rate": 0.00025740419520305004, "loss": 0.0112, "step": 6225 }, { "epoch": 1.27, "learning_rate": 0.0002573906619318038, "loss": 0.0056, "step": 6226 }, { "epoch": 1.27, "learning_rate": 0.00025737712686693074, "loss": 0.0136, "step": 6227 }, { "epoch": 1.27, "learning_rate": 0.00025736359000865704, "loss": 0.0226, "step": 6228 }, { "epoch": 1.27, "learning_rate": 0.0002573500513572087, "loss": 0.0307, "step": 6229 }, { "epoch": 1.27, "learning_rate": 0.00025733651091281183, "loss": 0.0157, "step": 6230 }, { "epoch": 1.27, "learning_rate": 0.0002573229686756926, "loss": 0.0145, "step": 6231 }, { "epoch": 1.27, "learning_rate": 0.00025730942464607725, "loss": 0.0396, "step": 6232 }, { "epoch": 1.27, "learning_rate": 0.00025729587882419196, "loss": 0.008, "step": 6233 }, { "epoch": 1.27, "learning_rate": 0.00025728233121026295, "loss": 0.0092, "step": 6234 }, { "epoch": 1.27, "learning_rate": 0.0002572687818045165, "loss": 0.0196, "step": 6235 }, { "epoch": 1.27, "learning_rate": 0.0002572552306071789, "loss": 0.0098, "step": 6236 }, { "epoch": 1.27, "learning_rate": 0.0002572416776184765, "loss": 0.016, "step": 6237 }, { "epoch": 1.27, "learning_rate": 0.0002572281228386356, "loss": 0.009, "step": 6238 }, { "epoch": 1.27, "learning_rate": 0.0002572145662678827, "loss": 0.0105, "step": 6239 }, { "epoch": 1.27, "learning_rate": 0.00025720100790644414, "loss": 0.0041, "step": 6240 }, { "epoch": 1.27, "learning_rate": 0.00025718744775454636, "loss": 0.0486, "step": 6241 }, { "epoch": 1.27, "learning_rate": 0.00025717388581241596, "loss": 0.0051, "step": 6242 }, { "epoch": 1.27, "learning_rate": 0.00025716032208027926, "loss": 0.0121, "step": 6243 }, { "epoch": 1.27, "learning_rate": 0.000257146756558363, "loss": 0.0186, "step": 6244 }, { "epoch": 1.27, "learning_rate": 0.00025713318924689354, "loss": 0.0261, "step": 6245 }, { "epoch": 1.27, "learning_rate": 0.00025711962014609766, "loss": 0.019, "step": 6246 }, { "epoch": 1.27, "learning_rate": 0.00025710604925620193, "loss": 0.0123, "step": 6247 }, { "epoch": 1.27, "learning_rate": 0.00025709247657743295, "loss": 0.0188, "step": 6248 }, { "epoch": 1.27, "learning_rate": 0.00025707890211001754, "loss": 0.0079, "step": 6249 }, { "epoch": 1.27, "learning_rate": 0.0002570653258541823, "loss": 0.0108, "step": 6250 }, { "epoch": 1.27, "learning_rate": 0.00025705174781015397, "loss": 0.0108, "step": 6251 }, { "epoch": 1.27, "learning_rate": 0.0002570381679781594, "loss": 0.0025, "step": 6252 }, { "epoch": 1.27, "learning_rate": 0.0002570245863584254, "loss": 0.0108, "step": 6253 }, { "epoch": 1.27, "learning_rate": 0.0002570110029511788, "loss": 0.0182, "step": 6254 }, { "epoch": 1.27, "learning_rate": 0.00025699741775664646, "loss": 0.0073, "step": 6255 }, { "epoch": 1.27, "learning_rate": 0.0002569838307750552, "loss": 0.0118, "step": 6256 }, { "epoch": 1.27, "learning_rate": 0.00025697024200663205, "loss": 0.0239, "step": 6257 }, { "epoch": 1.27, "learning_rate": 0.00025695665145160395, "loss": 0.0187, "step": 6258 }, { "epoch": 1.27, "learning_rate": 0.0002569430591101979, "loss": 0.0205, "step": 6259 }, { "epoch": 1.27, "learning_rate": 0.00025692946498264086, "loss": 0.0175, "step": 6260 }, { "epoch": 1.27, "learning_rate": 0.00025691586906915993, "loss": 0.0377, "step": 6261 }, { "epoch": 1.28, "learning_rate": 0.00025690227136998214, "loss": 0.0064, "step": 6262 }, { "epoch": 1.28, "learning_rate": 0.0002568886718853346, "loss": 0.0046, "step": 6263 }, { "epoch": 1.28, "learning_rate": 0.0002568750706154446, "loss": 0.0251, "step": 6264 }, { "epoch": 1.28, "learning_rate": 0.0002568614675605391, "loss": 0.0323, "step": 6265 }, { "epoch": 1.28, "learning_rate": 0.0002568478627208453, "loss": 0.0143, "step": 6266 }, { "epoch": 1.28, "learning_rate": 0.0002568342560965906, "loss": 0.0063, "step": 6267 }, { "epoch": 1.28, "learning_rate": 0.0002568206476880022, "loss": 0.0186, "step": 6268 }, { "epoch": 1.28, "learning_rate": 0.00025680703749530727, "loss": 0.0107, "step": 6269 }, { "epoch": 1.28, "learning_rate": 0.00025679342551873316, "loss": 0.0129, "step": 6270 }, { "epoch": 1.28, "learning_rate": 0.00025677981175850737, "loss": 0.0013, "step": 6271 }, { "epoch": 1.28, "learning_rate": 0.0002567661962148571, "loss": 0.0269, "step": 6272 }, { "epoch": 1.28, "learning_rate": 0.0002567525788880098, "loss": 0.0144, "step": 6273 }, { "epoch": 1.28, "learning_rate": 0.0002567389597781929, "loss": 0.0197, "step": 6274 }, { "epoch": 1.28, "learning_rate": 0.000256725338885634, "loss": 0.0184, "step": 6275 }, { "epoch": 1.28, "learning_rate": 0.0002567117162105604, "loss": 0.015, "step": 6276 }, { "epoch": 1.28, "learning_rate": 0.0002566980917531997, "loss": 0.0098, "step": 6277 }, { "epoch": 1.28, "learning_rate": 0.00025668446551377946, "loss": 0.0082, "step": 6278 }, { "epoch": 1.28, "learning_rate": 0.0002566708374925273, "loss": 0.0085, "step": 6279 }, { "epoch": 1.28, "learning_rate": 0.0002566572076896708, "loss": 0.0093, "step": 6280 }, { "epoch": 1.28, "learning_rate": 0.0002566435761054376, "loss": 0.0309, "step": 6281 }, { "epoch": 1.28, "learning_rate": 0.0002566299427400553, "loss": 0.0042, "step": 6282 }, { "epoch": 1.28, "learning_rate": 0.0002566163075937517, "loss": 0.0127, "step": 6283 }, { "epoch": 1.28, "learning_rate": 0.0002566026706667546, "loss": 0.0187, "step": 6284 }, { "epoch": 1.28, "learning_rate": 0.00025658903195929165, "loss": 0.0024, "step": 6285 }, { "epoch": 1.28, "learning_rate": 0.0002565753914715906, "loss": 0.0049, "step": 6286 }, { "epoch": 1.28, "learning_rate": 0.00025656174920387937, "loss": 0.0216, "step": 6287 }, { "epoch": 1.28, "learning_rate": 0.00025654810515638577, "loss": 0.0022, "step": 6288 }, { "epoch": 1.28, "learning_rate": 0.00025653445932933774, "loss": 0.0211, "step": 6289 }, { "epoch": 1.28, "learning_rate": 0.0002565208117229631, "loss": 0.0335, "step": 6290 }, { "epoch": 1.28, "learning_rate": 0.00025650716233748986, "loss": 0.0154, "step": 6291 }, { "epoch": 1.28, "learning_rate": 0.0002564935111731459, "loss": 0.0151, "step": 6292 }, { "epoch": 1.28, "learning_rate": 0.0002564798582301593, "loss": 0.0095, "step": 6293 }, { "epoch": 1.28, "learning_rate": 0.00025646620350875814, "loss": 0.0098, "step": 6294 }, { "epoch": 1.28, "learning_rate": 0.00025645254700917033, "loss": 0.015, "step": 6295 }, { "epoch": 1.28, "learning_rate": 0.0002564388887316241, "loss": 0.0045, "step": 6296 }, { "epoch": 1.28, "learning_rate": 0.00025642522867634746, "loss": 0.0102, "step": 6297 }, { "epoch": 1.28, "learning_rate": 0.0002564115668435687, "loss": 0.0115, "step": 6298 }, { "epoch": 1.28, "learning_rate": 0.0002563979032335158, "loss": 0.0051, "step": 6299 }, { "epoch": 1.28, "learning_rate": 0.0002563842378464171, "loss": 0.0214, "step": 6300 }, { "epoch": 1.28, "learning_rate": 0.00025637057068250084, "loss": 0.032, "step": 6301 }, { "epoch": 1.28, "learning_rate": 0.00025635690174199527, "loss": 0.0422, "step": 6302 }, { "epoch": 1.28, "learning_rate": 0.0002563432310251287, "loss": 0.0169, "step": 6303 }, { "epoch": 1.28, "learning_rate": 0.00025632955853212937, "loss": 0.0091, "step": 6304 }, { "epoch": 1.28, "learning_rate": 0.00025631588426322575, "loss": 0.0253, "step": 6305 }, { "epoch": 1.28, "learning_rate": 0.00025630220821864613, "loss": 0.0038, "step": 6306 }, { "epoch": 1.28, "learning_rate": 0.000256288530398619, "loss": 0.0085, "step": 6307 }, { "epoch": 1.28, "learning_rate": 0.00025627485080337276, "loss": 0.0258, "step": 6308 }, { "epoch": 1.28, "learning_rate": 0.0002562611694331359, "loss": 0.0116, "step": 6309 }, { "epoch": 1.28, "learning_rate": 0.000256247486288137, "loss": 0.0062, "step": 6310 }, { "epoch": 1.29, "learning_rate": 0.0002562338013686045, "loss": 0.0049, "step": 6311 }, { "epoch": 1.29, "learning_rate": 0.0002562201146747669, "loss": 0.0201, "step": 6312 }, { "epoch": 1.29, "learning_rate": 0.00025620642620685294, "loss": 0.0201, "step": 6313 }, { "epoch": 1.29, "learning_rate": 0.0002561927359650912, "loss": 0.0319, "step": 6314 }, { "epoch": 1.29, "learning_rate": 0.0002561790439497103, "loss": 0.0097, "step": 6315 }, { "epoch": 1.29, "learning_rate": 0.00025616535016093897, "loss": 0.0051, "step": 6316 }, { "epoch": 1.29, "learning_rate": 0.00025615165459900584, "loss": 0.0085, "step": 6317 }, { "epoch": 1.29, "learning_rate": 0.00025613795726413973, "loss": 0.011, "step": 6318 }, { "epoch": 1.29, "learning_rate": 0.00025612425815656935, "loss": 0.0213, "step": 6319 }, { "epoch": 1.29, "learning_rate": 0.0002561105572765235, "loss": 0.0363, "step": 6320 }, { "epoch": 1.29, "learning_rate": 0.0002560968546242312, "loss": 0.0138, "step": 6321 }, { "epoch": 1.29, "learning_rate": 0.000256083150199921, "loss": 0.0112, "step": 6322 }, { "epoch": 1.29, "learning_rate": 0.00025606944400382203, "loss": 0.0246, "step": 6323 }, { "epoch": 1.29, "learning_rate": 0.0002560557360361631, "loss": 0.0117, "step": 6324 }, { "epoch": 1.29, "learning_rate": 0.0002560420262971732, "loss": 0.0066, "step": 6325 }, { "epoch": 1.29, "learning_rate": 0.00025602831478708127, "loss": 0.0068, "step": 6326 }, { "epoch": 1.29, "learning_rate": 0.0002560146015061164, "loss": 0.0098, "step": 6327 }, { "epoch": 1.29, "learning_rate": 0.0002560008864545075, "loss": 0.0069, "step": 6328 }, { "epoch": 1.29, "learning_rate": 0.0002559871696324837, "loss": 0.015, "step": 6329 }, { "epoch": 1.29, "learning_rate": 0.00025597345104027414, "loss": 0.0193, "step": 6330 }, { "epoch": 1.29, "learning_rate": 0.00025595973067810786, "loss": 0.0305, "step": 6331 }, { "epoch": 1.29, "learning_rate": 0.00025594600854621414, "loss": 0.0189, "step": 6332 }, { "epoch": 1.29, "learning_rate": 0.00025593228464482204, "loss": 0.0182, "step": 6333 }, { "epoch": 1.29, "learning_rate": 0.0002559185589741608, "loss": 0.0129, "step": 6334 }, { "epoch": 1.29, "learning_rate": 0.0002559048315344597, "loss": 0.0048, "step": 6335 }, { "epoch": 1.29, "learning_rate": 0.00025589110232594807, "loss": 0.01, "step": 6336 }, { "epoch": 1.29, "learning_rate": 0.0002558773713488551, "loss": 0.0165, "step": 6337 }, { "epoch": 1.29, "learning_rate": 0.00025586363860341017, "loss": 0.0259, "step": 6338 }, { "epoch": 1.29, "learning_rate": 0.00025584990408984265, "loss": 0.0156, "step": 6339 }, { "epoch": 1.29, "learning_rate": 0.0002558361678083819, "loss": 0.0102, "step": 6340 }, { "epoch": 1.29, "learning_rate": 0.00025582242975925743, "loss": 0.0094, "step": 6341 }, { "epoch": 1.29, "learning_rate": 0.0002558086899426986, "loss": 0.0068, "step": 6342 }, { "epoch": 1.29, "learning_rate": 0.0002557949483589349, "loss": 0.014, "step": 6343 }, { "epoch": 1.29, "learning_rate": 0.00025578120500819587, "loss": 0.0172, "step": 6344 }, { "epoch": 1.29, "learning_rate": 0.000255767459890711, "loss": 0.0209, "step": 6345 }, { "epoch": 1.29, "learning_rate": 0.00025575371300671, "loss": 0.0171, "step": 6346 }, { "epoch": 1.29, "learning_rate": 0.0002557399643564223, "loss": 0.0203, "step": 6347 }, { "epoch": 1.29, "learning_rate": 0.0002557262139400776, "loss": 0.0227, "step": 6348 }, { "epoch": 1.29, "learning_rate": 0.0002557124617579056, "loss": 0.0064, "step": 6349 }, { "epoch": 1.29, "learning_rate": 0.00025569870781013586, "loss": 0.0121, "step": 6350 }, { "epoch": 1.29, "learning_rate": 0.0002556849520969982, "loss": 0.0052, "step": 6351 }, { "epoch": 1.29, "learning_rate": 0.0002556711946187224, "loss": 0.0351, "step": 6352 }, { "epoch": 1.29, "learning_rate": 0.00025565743537553815, "loss": 0.0058, "step": 6353 }, { "epoch": 1.29, "learning_rate": 0.00025564367436767526, "loss": 0.0246, "step": 6354 }, { "epoch": 1.29, "learning_rate": 0.00025562991159536365, "loss": 0.0098, "step": 6355 }, { "epoch": 1.29, "learning_rate": 0.00025561614705883306, "loss": 0.0421, "step": 6356 }, { "epoch": 1.29, "learning_rate": 0.0002556023807583135, "loss": 0.0078, "step": 6357 }, { "epoch": 1.29, "learning_rate": 0.00025558861269403484, "loss": 0.0078, "step": 6358 }, { "epoch": 1.29, "learning_rate": 0.00025557484286622696, "loss": 0.0234, "step": 6359 }, { "epoch": 1.3, "learning_rate": 0.00025556107127512004, "loss": 0.0052, "step": 6360 }, { "epoch": 1.3, "learning_rate": 0.0002555472979209439, "loss": 0.0145, "step": 6361 }, { "epoch": 1.3, "learning_rate": 0.00025553352280392863, "loss": 0.0066, "step": 6362 }, { "epoch": 1.3, "learning_rate": 0.00025551974592430437, "loss": 0.0189, "step": 6363 }, { "epoch": 1.3, "learning_rate": 0.00025550596728230113, "loss": 0.0125, "step": 6364 }, { "epoch": 1.3, "learning_rate": 0.00025549218687814914, "loss": 0.0163, "step": 6365 }, { "epoch": 1.3, "learning_rate": 0.0002554784047120784, "loss": 0.0233, "step": 6366 }, { "epoch": 1.3, "learning_rate": 0.00025546462078431925, "loss": 0.0181, "step": 6367 }, { "epoch": 1.3, "learning_rate": 0.0002554508350951019, "loss": 0.0337, "step": 6368 }, { "epoch": 1.3, "learning_rate": 0.00025543704764465646, "loss": 0.0464, "step": 6369 }, { "epoch": 1.3, "learning_rate": 0.0002554232584332134, "loss": 0.0088, "step": 6370 }, { "epoch": 1.3, "learning_rate": 0.00025540946746100286, "loss": 0.0085, "step": 6371 }, { "epoch": 1.3, "learning_rate": 0.00025539567472825526, "loss": 0.0232, "step": 6372 }, { "epoch": 1.3, "learning_rate": 0.0002553818802352009, "loss": 0.0144, "step": 6373 }, { "epoch": 1.3, "learning_rate": 0.0002553680839820703, "loss": 0.0365, "step": 6374 }, { "epoch": 1.3, "learning_rate": 0.00025535428596909374, "loss": 0.0129, "step": 6375 }, { "epoch": 1.3, "learning_rate": 0.00025534048619650174, "loss": 0.0102, "step": 6376 }, { "epoch": 1.3, "learning_rate": 0.00025532668466452473, "loss": 0.0115, "step": 6377 }, { "epoch": 1.3, "learning_rate": 0.0002553128813733934, "loss": 0.0433, "step": 6378 }, { "epoch": 1.3, "learning_rate": 0.00025529907632333807, "loss": 0.032, "step": 6379 }, { "epoch": 1.3, "learning_rate": 0.00025528526951458936, "loss": 0.0034, "step": 6380 }, { "epoch": 1.3, "learning_rate": 0.000255271460947378, "loss": 0.045, "step": 6381 }, { "epoch": 1.3, "learning_rate": 0.0002552576506219345, "loss": 0.0057, "step": 6382 }, { "epoch": 1.3, "learning_rate": 0.0002552438385384895, "loss": 0.0059, "step": 6383 }, { "epoch": 1.3, "learning_rate": 0.00025523002469727375, "loss": 0.0264, "step": 6384 }, { "epoch": 1.3, "learning_rate": 0.00025521620909851796, "loss": 0.0035, "step": 6385 }, { "epoch": 1.3, "learning_rate": 0.00025520239174245293, "loss": 0.0024, "step": 6386 }, { "epoch": 1.3, "learning_rate": 0.00025518857262930926, "loss": 0.0071, "step": 6387 }, { "epoch": 1.3, "learning_rate": 0.000255174751759318, "loss": 0.0082, "step": 6388 }, { "epoch": 1.3, "learning_rate": 0.0002551609291327098, "loss": 0.0318, "step": 6389 }, { "epoch": 1.3, "learning_rate": 0.0002551471047497155, "loss": 0.0145, "step": 6390 }, { "epoch": 1.3, "learning_rate": 0.00025513327861056615, "loss": 0.0299, "step": 6391 }, { "epoch": 1.3, "learning_rate": 0.0002551194507154926, "loss": 0.0525, "step": 6392 }, { "epoch": 1.3, "learning_rate": 0.00025510562106472573, "loss": 0.0272, "step": 6393 }, { "epoch": 1.3, "learning_rate": 0.0002550917896584967, "loss": 0.0253, "step": 6394 }, { "epoch": 1.3, "learning_rate": 0.0002550779564970363, "loss": 0.0201, "step": 6395 }, { "epoch": 1.3, "learning_rate": 0.0002550641215805757, "loss": 0.0068, "step": 6396 }, { "epoch": 1.3, "learning_rate": 0.000255050284909346, "loss": 0.0058, "step": 6397 }, { "epoch": 1.3, "learning_rate": 0.0002550364464835782, "loss": 0.0211, "step": 6398 }, { "epoch": 1.3, "learning_rate": 0.0002550226063035035, "loss": 0.0206, "step": 6399 }, { "epoch": 1.3, "learning_rate": 0.000255008764369353, "loss": 0.006, "step": 6400 }, { "epoch": 1.3, "learning_rate": 0.0002549949206813579, "loss": 0.0187, "step": 6401 }, { "epoch": 1.3, "learning_rate": 0.0002549810752397495, "loss": 0.0286, "step": 6402 }, { "epoch": 1.3, "learning_rate": 0.00025496722804475895, "loss": 0.0162, "step": 6403 }, { "epoch": 1.3, "learning_rate": 0.0002549533790966175, "loss": 0.0074, "step": 6404 }, { "epoch": 1.3, "learning_rate": 0.00025493952839555656, "loss": 0.0138, "step": 6405 }, { "epoch": 1.3, "learning_rate": 0.0002549256759418074, "loss": 0.0106, "step": 6406 }, { "epoch": 1.3, "learning_rate": 0.0002549118217356014, "loss": 0.0077, "step": 6407 }, { "epoch": 1.3, "learning_rate": 0.0002548979657771699, "loss": 0.034, "step": 6408 }, { "epoch": 1.3, "learning_rate": 0.0002548841080667444, "loss": 0.0309, "step": 6409 }, { "epoch": 1.31, "learning_rate": 0.00025487024860455635, "loss": 0.0116, "step": 6410 }, { "epoch": 1.31, "learning_rate": 0.00025485638739083716, "loss": 0.0202, "step": 6411 }, { "epoch": 1.31, "learning_rate": 0.0002548425244258183, "loss": 0.0045, "step": 6412 }, { "epoch": 1.31, "learning_rate": 0.00025482865970973147, "loss": 0.0198, "step": 6413 }, { "epoch": 1.31, "learning_rate": 0.0002548147932428081, "loss": 0.0339, "step": 6414 }, { "epoch": 1.31, "learning_rate": 0.00025480092502527986, "loss": 0.0143, "step": 6415 }, { "epoch": 1.31, "learning_rate": 0.00025478705505737833, "loss": 0.0064, "step": 6416 }, { "epoch": 1.31, "learning_rate": 0.00025477318333933516, "loss": 0.0077, "step": 6417 }, { "epoch": 1.31, "learning_rate": 0.00025475930987138204, "loss": 0.012, "step": 6418 }, { "epoch": 1.31, "learning_rate": 0.0002547454346537507, "loss": 0.0069, "step": 6419 }, { "epoch": 1.31, "learning_rate": 0.00025473155768667295, "loss": 0.0122, "step": 6420 }, { "epoch": 1.31, "learning_rate": 0.00025471767897038047, "loss": 0.0234, "step": 6421 }, { "epoch": 1.31, "learning_rate": 0.0002547037985051051, "loss": 0.0102, "step": 6422 }, { "epoch": 1.31, "learning_rate": 0.0002546899162910786, "loss": 0.0096, "step": 6423 }, { "epoch": 1.31, "learning_rate": 0.0002546760323285329, "loss": 0.0189, "step": 6424 }, { "epoch": 1.31, "learning_rate": 0.0002546621466176998, "loss": 0.0047, "step": 6425 }, { "epoch": 1.31, "learning_rate": 0.0002546482591588114, "loss": 0.0103, "step": 6426 }, { "epoch": 1.31, "learning_rate": 0.0002546343699520995, "loss": 0.0069, "step": 6427 }, { "epoch": 1.31, "learning_rate": 0.00025462047899779607, "loss": 0.0162, "step": 6428 }, { "epoch": 1.31, "learning_rate": 0.0002546065862961332, "loss": 0.0054, "step": 6429 }, { "epoch": 1.31, "learning_rate": 0.00025459269184734286, "loss": 0.0349, "step": 6430 }, { "epoch": 1.31, "learning_rate": 0.0002545787956516572, "loss": 0.0029, "step": 6431 }, { "epoch": 1.31, "learning_rate": 0.0002545648977093082, "loss": 0.0053, "step": 6432 }, { "epoch": 1.31, "learning_rate": 0.00025455099802052796, "loss": 0.0219, "step": 6433 }, { "epoch": 1.31, "learning_rate": 0.00025453709658554874, "loss": 0.0183, "step": 6434 }, { "epoch": 1.31, "learning_rate": 0.00025452319340460276, "loss": 0.0448, "step": 6435 }, { "epoch": 1.31, "learning_rate": 0.00025450928847792204, "loss": 0.0066, "step": 6436 }, { "epoch": 1.31, "learning_rate": 0.00025449538180573897, "loss": 0.0183, "step": 6437 }, { "epoch": 1.31, "learning_rate": 0.0002544814733882858, "loss": 0.0114, "step": 6438 }, { "epoch": 1.31, "learning_rate": 0.00025446756322579475, "loss": 0.0122, "step": 6439 }, { "epoch": 1.31, "learning_rate": 0.00025445365131849824, "loss": 0.005, "step": 6440 }, { "epoch": 1.31, "learning_rate": 0.00025443973766662854, "loss": 0.0479, "step": 6441 }, { "epoch": 1.31, "learning_rate": 0.0002544258222704181, "loss": 0.0071, "step": 6442 }, { "epoch": 1.31, "learning_rate": 0.00025441190513009936, "loss": 0.0245, "step": 6443 }, { "epoch": 1.31, "learning_rate": 0.0002543979862459046, "loss": 0.0112, "step": 6444 }, { "epoch": 1.31, "learning_rate": 0.0002543840656180665, "loss": 0.0139, "step": 6445 }, { "epoch": 1.31, "learning_rate": 0.0002543701432468174, "loss": 0.0153, "step": 6446 }, { "epoch": 1.31, "learning_rate": 0.00025435621913239, "loss": 0.0063, "step": 6447 }, { "epoch": 1.31, "learning_rate": 0.00025434229327501664, "loss": 0.0146, "step": 6448 }, { "epoch": 1.31, "learning_rate": 0.00025432836567493007, "loss": 0.0119, "step": 6449 }, { "epoch": 1.31, "learning_rate": 0.0002543144363323629, "loss": 0.0224, "step": 6450 }, { "epoch": 1.31, "learning_rate": 0.0002543005052475477, "loss": 0.0227, "step": 6451 }, { "epoch": 1.31, "learning_rate": 0.00025428657242071716, "loss": 0.0262, "step": 6452 }, { "epoch": 1.31, "learning_rate": 0.000254272637852104, "loss": 0.0343, "step": 6453 }, { "epoch": 1.31, "learning_rate": 0.00025425870154194096, "loss": 0.0169, "step": 6454 }, { "epoch": 1.31, "learning_rate": 0.00025424476349046084, "loss": 0.0145, "step": 6455 }, { "epoch": 1.31, "learning_rate": 0.0002542308236978964, "loss": 0.0218, "step": 6456 }, { "epoch": 1.31, "learning_rate": 0.00025421688216448044, "loss": 0.0064, "step": 6457 }, { "epoch": 1.31, "learning_rate": 0.0002542029388904458, "loss": 0.031, "step": 6458 }, { "epoch": 1.32, "learning_rate": 0.00025418899387602534, "loss": 0.0043, "step": 6459 }, { "epoch": 1.32, "learning_rate": 0.0002541750471214521, "loss": 0.0261, "step": 6460 }, { "epoch": 1.32, "learning_rate": 0.0002541610986269589, "loss": 0.0072, "step": 6461 }, { "epoch": 1.32, "learning_rate": 0.00025414714839277873, "loss": 0.0077, "step": 6462 }, { "epoch": 1.32, "learning_rate": 0.0002541331964191446, "loss": 0.0015, "step": 6463 }, { "epoch": 1.32, "learning_rate": 0.00025411924270628955, "loss": 0.0136, "step": 6464 }, { "epoch": 1.32, "learning_rate": 0.00025410528725444654, "loss": 0.014, "step": 6465 }, { "epoch": 1.32, "learning_rate": 0.0002540913300638488, "loss": 0.0092, "step": 6466 }, { "epoch": 1.32, "learning_rate": 0.0002540773711347293, "loss": 0.0132, "step": 6467 }, { "epoch": 1.32, "learning_rate": 0.0002540634104673213, "loss": 0.0203, "step": 6468 }, { "epoch": 1.32, "learning_rate": 0.0002540494480618578, "loss": 0.02, "step": 6469 }, { "epoch": 1.32, "learning_rate": 0.0002540354839185722, "loss": 0.0154, "step": 6470 }, { "epoch": 1.32, "learning_rate": 0.00025402151803769764, "loss": 0.0216, "step": 6471 }, { "epoch": 1.32, "learning_rate": 0.0002540075504194673, "loss": 0.0142, "step": 6472 }, { "epoch": 1.32, "learning_rate": 0.0002539935810641146, "loss": 0.0066, "step": 6473 }, { "epoch": 1.32, "learning_rate": 0.0002539796099718728, "loss": 0.0138, "step": 6474 }, { "epoch": 1.32, "learning_rate": 0.00025396563714297525, "loss": 0.0067, "step": 6475 }, { "epoch": 1.32, "learning_rate": 0.00025395166257765527, "loss": 0.0279, "step": 6476 }, { "epoch": 1.32, "learning_rate": 0.00025393768627614635, "loss": 0.0224, "step": 6477 }, { "epoch": 1.32, "learning_rate": 0.0002539237082386818, "loss": 0.0124, "step": 6478 }, { "epoch": 1.32, "learning_rate": 0.0002539097284654952, "loss": 0.0153, "step": 6479 }, { "epoch": 1.32, "learning_rate": 0.00025389574695682004, "loss": 0.0142, "step": 6480 }, { "epoch": 1.32, "learning_rate": 0.0002538817637128897, "loss": 0.005, "step": 6481 }, { "epoch": 1.32, "learning_rate": 0.00025386777873393786, "loss": 0.0065, "step": 6482 }, { "epoch": 1.32, "learning_rate": 0.000253853792020198, "loss": 0.0122, "step": 6483 }, { "epoch": 1.32, "learning_rate": 0.00025383980357190385, "loss": 0.0078, "step": 6484 }, { "epoch": 1.32, "learning_rate": 0.0002538258133892889, "loss": 0.0109, "step": 6485 }, { "epoch": 1.32, "learning_rate": 0.00025381182147258695, "loss": 0.016, "step": 6486 }, { "epoch": 1.32, "learning_rate": 0.00025379782782203157, "loss": 0.0205, "step": 6487 }, { "epoch": 1.32, "learning_rate": 0.00025378383243785654, "loss": 0.0155, "step": 6488 }, { "epoch": 1.32, "learning_rate": 0.0002537698353202956, "loss": 0.0153, "step": 6489 }, { "epoch": 1.32, "learning_rate": 0.00025375583646958255, "loss": 0.0314, "step": 6490 }, { "epoch": 1.32, "learning_rate": 0.0002537418358859512, "loss": 0.0153, "step": 6491 }, { "epoch": 1.32, "learning_rate": 0.00025372783356963533, "loss": 0.0046, "step": 6492 }, { "epoch": 1.32, "learning_rate": 0.00025371382952086885, "loss": 0.0081, "step": 6493 }, { "epoch": 1.32, "learning_rate": 0.0002536998237398856, "loss": 0.0063, "step": 6494 }, { "epoch": 1.32, "learning_rate": 0.0002536858162269196, "loss": 0.0226, "step": 6495 }, { "epoch": 1.32, "learning_rate": 0.00025367180698220476, "loss": 0.01, "step": 6496 }, { "epoch": 1.32, "learning_rate": 0.000253657796005975, "loss": 0.0021, "step": 6497 }, { "epoch": 1.32, "learning_rate": 0.0002536437832984644, "loss": 0.0166, "step": 6498 }, { "epoch": 1.32, "learning_rate": 0.000253629768859907, "loss": 0.0126, "step": 6499 }, { "epoch": 1.32, "learning_rate": 0.0002536157526905368, "loss": 0.024, "step": 6500 }, { "epoch": 1.32, "learning_rate": 0.00025360173479058797, "loss": 0.0051, "step": 6501 }, { "epoch": 1.32, "learning_rate": 0.0002535877151602946, "loss": 0.0208, "step": 6502 }, { "epoch": 1.32, "learning_rate": 0.0002535736937998909, "loss": 0.0043, "step": 6503 }, { "epoch": 1.32, "learning_rate": 0.00025355967070961094, "loss": 0.0101, "step": 6504 }, { "epoch": 1.32, "learning_rate": 0.000253545645889689, "loss": 0.0161, "step": 6505 }, { "epoch": 1.32, "learning_rate": 0.0002535316193403593, "loss": 0.0103, "step": 6506 }, { "epoch": 1.32, "learning_rate": 0.0002535175910618562, "loss": 0.0034, "step": 6507 }, { "epoch": 1.33, "learning_rate": 0.0002535035610544139, "loss": 0.0201, "step": 6508 }, { "epoch": 1.33, "learning_rate": 0.0002534895293182667, "loss": 0.0143, "step": 6509 }, { "epoch": 1.33, "learning_rate": 0.00025347549585364907, "loss": 0.0131, "step": 6510 }, { "epoch": 1.33, "learning_rate": 0.0002534614606607953, "loss": 0.0246, "step": 6511 }, { "epoch": 1.33, "learning_rate": 0.00025344742373993985, "loss": 0.0207, "step": 6512 }, { "epoch": 1.33, "learning_rate": 0.0002534333850913172, "loss": 0.0034, "step": 6513 }, { "epoch": 1.33, "learning_rate": 0.0002534193447151617, "loss": 0.0062, "step": 6514 }, { "epoch": 1.33, "learning_rate": 0.000253405302611708, "loss": 0.0133, "step": 6515 }, { "epoch": 1.33, "learning_rate": 0.0002533912587811905, "loss": 0.0114, "step": 6516 }, { "epoch": 1.33, "learning_rate": 0.0002533772132238438, "loss": 0.0138, "step": 6517 }, { "epoch": 1.33, "learning_rate": 0.0002533631659399025, "loss": 0.0185, "step": 6518 }, { "epoch": 1.33, "learning_rate": 0.00025334911692960125, "loss": 0.0209, "step": 6519 }, { "epoch": 1.33, "learning_rate": 0.0002533350661931747, "loss": 0.0174, "step": 6520 }, { "epoch": 1.33, "learning_rate": 0.00025332101373085736, "loss": 0.0194, "step": 6521 }, { "epoch": 1.33, "learning_rate": 0.0002533069595428842, "loss": 0.0193, "step": 6522 }, { "epoch": 1.33, "learning_rate": 0.0002532929036294897, "loss": 0.0252, "step": 6523 }, { "epoch": 1.33, "learning_rate": 0.0002532788459909088, "loss": 0.0088, "step": 6524 }, { "epoch": 1.33, "learning_rate": 0.0002532647866273762, "loss": 0.0125, "step": 6525 }, { "epoch": 1.33, "learning_rate": 0.0002532507255391267, "loss": 0.016, "step": 6526 }, { "epoch": 1.33, "learning_rate": 0.00025323666272639525, "loss": 0.0224, "step": 6527 }, { "epoch": 1.33, "learning_rate": 0.0002532225981894166, "loss": 0.0106, "step": 6528 }, { "epoch": 1.33, "learning_rate": 0.0002532085319284258, "loss": 0.0178, "step": 6529 }, { "epoch": 1.33, "learning_rate": 0.00025319446394365757, "loss": 0.0083, "step": 6530 }, { "epoch": 1.33, "learning_rate": 0.0002531803942353471, "loss": 0.0093, "step": 6531 }, { "epoch": 1.33, "learning_rate": 0.00025316632280372926, "loss": 0.0106, "step": 6532 }, { "epoch": 1.33, "learning_rate": 0.00025315224964903905, "loss": 0.0123, "step": 6533 }, { "epoch": 1.33, "learning_rate": 0.0002531381747715116, "loss": 0.0116, "step": 6534 }, { "epoch": 1.33, "learning_rate": 0.00025312409817138196, "loss": 0.0157, "step": 6535 }, { "epoch": 1.33, "learning_rate": 0.00025311001984888514, "loss": 0.0045, "step": 6536 }, { "epoch": 1.33, "learning_rate": 0.00025309593980425645, "loss": 0.0114, "step": 6537 }, { "epoch": 1.33, "learning_rate": 0.00025308185803773087, "loss": 0.0064, "step": 6538 }, { "epoch": 1.33, "learning_rate": 0.00025306777454954375, "loss": 0.0137, "step": 6539 }, { "epoch": 1.33, "learning_rate": 0.00025305368933993024, "loss": 0.0041, "step": 6540 }, { "epoch": 1.33, "learning_rate": 0.00025303960240912555, "loss": 0.0331, "step": 6541 }, { "epoch": 1.33, "learning_rate": 0.000253025513757365, "loss": 0.0016, "step": 6542 }, { "epoch": 1.33, "learning_rate": 0.0002530114233848839, "loss": 0.0375, "step": 6543 }, { "epoch": 1.33, "learning_rate": 0.0002529973312919176, "loss": 0.0052, "step": 6544 }, { "epoch": 1.33, "learning_rate": 0.0002529832374787014, "loss": 0.0184, "step": 6545 }, { "epoch": 1.33, "learning_rate": 0.0002529691419454708, "loss": 0.0201, "step": 6546 }, { "epoch": 1.33, "learning_rate": 0.0002529550446924611, "loss": 0.035, "step": 6547 }, { "epoch": 1.33, "learning_rate": 0.0002529409457199079, "loss": 0.0154, "step": 6548 }, { "epoch": 1.33, "learning_rate": 0.0002529268450280465, "loss": 0.0273, "step": 6549 }, { "epoch": 1.33, "learning_rate": 0.00025291274261711255, "loss": 0.0177, "step": 6550 }, { "epoch": 1.33, "learning_rate": 0.00025289863848734155, "loss": 0.0185, "step": 6551 }, { "epoch": 1.33, "learning_rate": 0.000252884532638969, "loss": 0.0026, "step": 6552 }, { "epoch": 1.33, "learning_rate": 0.0002528704250722306, "loss": 0.0259, "step": 6553 }, { "epoch": 1.33, "learning_rate": 0.0002528563157873619, "loss": 0.0096, "step": 6554 }, { "epoch": 1.33, "learning_rate": 0.00025284220478459854, "loss": 0.0128, "step": 6555 }, { "epoch": 1.33, "learning_rate": 0.00025282809206417624, "loss": 0.0064, "step": 6556 }, { "epoch": 1.34, "learning_rate": 0.0002528139776263307, "loss": 0.0146, "step": 6557 }, { "epoch": 1.34, "learning_rate": 0.00025279986147129773, "loss": 0.0067, "step": 6558 }, { "epoch": 1.34, "learning_rate": 0.00025278574359931293, "loss": 0.0159, "step": 6559 }, { "epoch": 1.34, "learning_rate": 0.0002527716240106122, "loss": 0.0146, "step": 6560 }, { "epoch": 1.34, "learning_rate": 0.0002527575027054315, "loss": 0.0148, "step": 6561 }, { "epoch": 1.34, "learning_rate": 0.00025274337968400634, "loss": 0.0066, "step": 6562 }, { "epoch": 1.34, "learning_rate": 0.0002527292549465729, "loss": 0.0167, "step": 6563 }, { "epoch": 1.34, "learning_rate": 0.00025271512849336697, "loss": 0.016, "step": 6564 }, { "epoch": 1.34, "learning_rate": 0.0002527010003246245, "loss": 0.0076, "step": 6565 }, { "epoch": 1.34, "learning_rate": 0.00025268687044058144, "loss": 0.0069, "step": 6566 }, { "epoch": 1.34, "learning_rate": 0.00025267273884147385, "loss": 0.0093, "step": 6567 }, { "epoch": 1.34, "learning_rate": 0.0002526586055275377, "loss": 0.0066, "step": 6568 }, { "epoch": 1.34, "learning_rate": 0.00025264447049900906, "loss": 0.0178, "step": 6569 }, { "epoch": 1.34, "learning_rate": 0.000252630333756124, "loss": 0.0053, "step": 6570 }, { "epoch": 1.34, "learning_rate": 0.0002526161952991186, "loss": 0.037, "step": 6571 }, { "epoch": 1.34, "learning_rate": 0.0002526020551282291, "loss": 0.0174, "step": 6572 }, { "epoch": 1.34, "learning_rate": 0.0002525879132436916, "loss": 0.0411, "step": 6573 }, { "epoch": 1.34, "learning_rate": 0.00025257376964574223, "loss": 0.0102, "step": 6574 }, { "epoch": 1.34, "learning_rate": 0.00025255962433461734, "loss": 0.0071, "step": 6575 }, { "epoch": 1.34, "learning_rate": 0.00025254547731055313, "loss": 0.0171, "step": 6576 }, { "epoch": 1.34, "learning_rate": 0.00025253132857378587, "loss": 0.0189, "step": 6577 }, { "epoch": 1.34, "learning_rate": 0.0002525171781245519, "loss": 0.0109, "step": 6578 }, { "epoch": 1.34, "learning_rate": 0.00025250302596308753, "loss": 0.0133, "step": 6579 }, { "epoch": 1.34, "learning_rate": 0.0002524888720896291, "loss": 0.0079, "step": 6580 }, { "epoch": 1.34, "learning_rate": 0.0002524747165044131, "loss": 0.0161, "step": 6581 }, { "epoch": 1.34, "learning_rate": 0.00025246055920767586, "loss": 0.0176, "step": 6582 }, { "epoch": 1.34, "learning_rate": 0.00025244640019965394, "loss": 0.0086, "step": 6583 }, { "epoch": 1.34, "learning_rate": 0.00025243223948058366, "loss": 0.0112, "step": 6584 }, { "epoch": 1.34, "learning_rate": 0.00025241807705070167, "loss": 0.0054, "step": 6585 }, { "epoch": 1.34, "learning_rate": 0.00025240391291024447, "loss": 0.0242, "step": 6586 }, { "epoch": 1.34, "learning_rate": 0.00025238974705944864, "loss": 0.0069, "step": 6587 }, { "epoch": 1.34, "learning_rate": 0.00025237557949855076, "loss": 0.0116, "step": 6588 }, { "epoch": 1.34, "learning_rate": 0.0002523614102277874, "loss": 0.0173, "step": 6589 }, { "epoch": 1.34, "learning_rate": 0.0002523472392473953, "loss": 0.0182, "step": 6590 }, { "epoch": 1.34, "learning_rate": 0.00025233306655761113, "loss": 0.0133, "step": 6591 }, { "epoch": 1.34, "learning_rate": 0.00025231889215867156, "loss": 0.0185, "step": 6592 }, { "epoch": 1.34, "learning_rate": 0.00025230471605081333, "loss": 0.016, "step": 6593 }, { "epoch": 1.34, "learning_rate": 0.00025229053823427324, "loss": 0.0014, "step": 6594 }, { "epoch": 1.34, "learning_rate": 0.0002522763587092881, "loss": 0.0177, "step": 6595 }, { "epoch": 1.34, "learning_rate": 0.0002522621774760947, "loss": 0.0019, "step": 6596 }, { "epoch": 1.34, "learning_rate": 0.0002522479945349299, "loss": 0.0113, "step": 6597 }, { "epoch": 1.34, "learning_rate": 0.00025223380988603056, "loss": 0.0037, "step": 6598 }, { "epoch": 1.34, "learning_rate": 0.00025221962352963367, "loss": 0.0199, "step": 6599 }, { "epoch": 1.34, "learning_rate": 0.0002522054354659761, "loss": 0.0148, "step": 6600 }, { "epoch": 1.34, "learning_rate": 0.0002521912456952948, "loss": 0.0069, "step": 6601 }, { "epoch": 1.34, "learning_rate": 0.0002521770542178268, "loss": 0.0102, "step": 6602 }, { "epoch": 1.34, "learning_rate": 0.00025216286103380914, "loss": 0.0244, "step": 6603 }, { "epoch": 1.34, "learning_rate": 0.00025214866614347886, "loss": 0.0207, "step": 6604 }, { "epoch": 1.34, "learning_rate": 0.00025213446954707304, "loss": 0.0035, "step": 6605 }, { "epoch": 1.35, "learning_rate": 0.00025212027124482873, "loss": 0.0167, "step": 6606 }, { "epoch": 1.35, "learning_rate": 0.00025210607123698315, "loss": 0.0104, "step": 6607 }, { "epoch": 1.35, "learning_rate": 0.0002520918695237735, "loss": 0.0083, "step": 6608 }, { "epoch": 1.35, "learning_rate": 0.00025207766610543683, "loss": 0.0158, "step": 6609 }, { "epoch": 1.35, "learning_rate": 0.00025206346098221054, "loss": 0.0149, "step": 6610 }, { "epoch": 1.35, "learning_rate": 0.0002520492541543317, "loss": 0.0117, "step": 6611 }, { "epoch": 1.35, "learning_rate": 0.00025203504562203773, "loss": 0.0486, "step": 6612 }, { "epoch": 1.35, "learning_rate": 0.00025202083538556594, "loss": 0.0079, "step": 6613 }, { "epoch": 1.35, "learning_rate": 0.00025200662344515356, "loss": 0.0269, "step": 6614 }, { "epoch": 1.35, "learning_rate": 0.00025199240980103803, "loss": 0.0091, "step": 6615 }, { "epoch": 1.35, "learning_rate": 0.00025197819445345673, "loss": 0.0118, "step": 6616 }, { "epoch": 1.35, "learning_rate": 0.00025196397740264706, "loss": 0.0262, "step": 6617 }, { "epoch": 1.35, "learning_rate": 0.00025194975864884655, "loss": 0.016, "step": 6618 }, { "epoch": 1.35, "learning_rate": 0.0002519355381922926, "loss": 0.0035, "step": 6619 }, { "epoch": 1.35, "learning_rate": 0.00025192131603322276, "loss": 0.0126, "step": 6620 }, { "epoch": 1.35, "learning_rate": 0.0002519070921718745, "loss": 0.0016, "step": 6621 }, { "epoch": 1.35, "learning_rate": 0.0002518928666084855, "loss": 0.0074, "step": 6622 }, { "epoch": 1.35, "learning_rate": 0.0002518786393432933, "loss": 0.0051, "step": 6623 }, { "epoch": 1.35, "learning_rate": 0.00025186441037653546, "loss": 0.0054, "step": 6624 }, { "epoch": 1.35, "learning_rate": 0.0002518501797084497, "loss": 0.0237, "step": 6625 }, { "epoch": 1.35, "learning_rate": 0.00025183594733927365, "loss": 0.0234, "step": 6626 }, { "epoch": 1.35, "learning_rate": 0.00025182171326924515, "loss": 0.0144, "step": 6627 }, { "epoch": 1.35, "learning_rate": 0.0002518074774986018, "loss": 0.0129, "step": 6628 }, { "epoch": 1.35, "learning_rate": 0.00025179324002758135, "loss": 0.0386, "step": 6629 }, { "epoch": 1.35, "learning_rate": 0.0002517790008564217, "loss": 0.0077, "step": 6630 }, { "epoch": 1.35, "learning_rate": 0.0002517647599853606, "loss": 0.0124, "step": 6631 }, { "epoch": 1.35, "learning_rate": 0.00025175051741463584, "loss": 0.0086, "step": 6632 }, { "epoch": 1.35, "learning_rate": 0.00025173627314448545, "loss": 0.0406, "step": 6633 }, { "epoch": 1.35, "learning_rate": 0.00025172202717514724, "loss": 0.0096, "step": 6634 }, { "epoch": 1.35, "learning_rate": 0.0002517077795068591, "loss": 0.023, "step": 6635 }, { "epoch": 1.35, "learning_rate": 0.00025169353013985914, "loss": 0.0268, "step": 6636 }, { "epoch": 1.35, "learning_rate": 0.0002516792790743853, "loss": 0.0045, "step": 6637 }, { "epoch": 1.35, "learning_rate": 0.00025166502631067546, "loss": 0.0354, "step": 6638 }, { "epoch": 1.35, "learning_rate": 0.00025165077184896784, "loss": 0.0139, "step": 6639 }, { "epoch": 1.35, "learning_rate": 0.0002516365156895004, "loss": 0.0121, "step": 6640 }, { "epoch": 1.35, "learning_rate": 0.0002516222578325113, "loss": 0.0115, "step": 6641 }, { "epoch": 1.35, "learning_rate": 0.00025160799827823876, "loss": 0.0105, "step": 6642 }, { "epoch": 1.35, "learning_rate": 0.00025159373702692076, "loss": 0.0108, "step": 6643 }, { "epoch": 1.35, "learning_rate": 0.0002515794740787956, "loss": 0.0156, "step": 6644 }, { "epoch": 1.35, "learning_rate": 0.0002515652094341015, "loss": 0.0065, "step": 6645 }, { "epoch": 1.35, "learning_rate": 0.0002515509430930767, "loss": 0.0041, "step": 6646 }, { "epoch": 1.35, "learning_rate": 0.00025153667505595944, "loss": 0.0318, "step": 6647 }, { "epoch": 1.35, "learning_rate": 0.00025152240532298796, "loss": 0.0172, "step": 6648 }, { "epoch": 1.35, "learning_rate": 0.0002515081338944008, "loss": 0.0075, "step": 6649 }, { "epoch": 1.35, "learning_rate": 0.0002514938607704361, "loss": 0.0214, "step": 6650 }, { "epoch": 1.35, "learning_rate": 0.00025147958595133236, "loss": 0.0086, "step": 6651 }, { "epoch": 1.35, "learning_rate": 0.00025146530943732806, "loss": 0.0099, "step": 6652 }, { "epoch": 1.35, "learning_rate": 0.00025145103122866145, "loss": 0.0042, "step": 6653 }, { "epoch": 1.35, "learning_rate": 0.0002514367513255712, "loss": 0.0085, "step": 6654 }, { "epoch": 1.36, "learning_rate": 0.00025142246972829565, "loss": 0.0124, "step": 6655 }, { "epoch": 1.36, "learning_rate": 0.0002514081864370735, "loss": 0.0234, "step": 6656 }, { "epoch": 1.36, "learning_rate": 0.00025139390145214317, "loss": 0.0356, "step": 6657 }, { "epoch": 1.36, "learning_rate": 0.0002513796147737433, "loss": 0.0119, "step": 6658 }, { "epoch": 1.36, "learning_rate": 0.00025136532640211245, "loss": 0.0067, "step": 6659 }, { "epoch": 1.36, "learning_rate": 0.00025135103633748936, "loss": 0.0179, "step": 6660 }, { "epoch": 1.36, "learning_rate": 0.00025133674458011263, "loss": 0.0047, "step": 6661 }, { "epoch": 1.36, "learning_rate": 0.00025132245113022097, "loss": 0.0178, "step": 6662 }, { "epoch": 1.36, "learning_rate": 0.00025130815598805315, "loss": 0.0114, "step": 6663 }, { "epoch": 1.36, "learning_rate": 0.0002512938591538478, "loss": 0.0104, "step": 6664 }, { "epoch": 1.36, "learning_rate": 0.00025127956062784393, "loss": 0.0177, "step": 6665 }, { "epoch": 1.36, "learning_rate": 0.0002512652604102802, "loss": 0.0221, "step": 6666 }, { "epoch": 1.36, "learning_rate": 0.00025125095850139534, "loss": 0.0166, "step": 6667 }, { "epoch": 1.36, "learning_rate": 0.00025123665490142845, "loss": 0.0047, "step": 6668 }, { "epoch": 1.36, "learning_rate": 0.0002512223496106183, "loss": 0.0441, "step": 6669 }, { "epoch": 1.36, "learning_rate": 0.0002512080426292039, "loss": 0.0094, "step": 6670 }, { "epoch": 1.36, "learning_rate": 0.00025119373395742406, "loss": 0.0142, "step": 6671 }, { "epoch": 1.36, "learning_rate": 0.0002511794235955179, "loss": 0.0092, "step": 6672 }, { "epoch": 1.36, "learning_rate": 0.0002511651115437243, "loss": 0.0063, "step": 6673 }, { "epoch": 1.36, "learning_rate": 0.00025115079780228247, "loss": 0.0117, "step": 6674 }, { "epoch": 1.36, "learning_rate": 0.0002511364823714313, "loss": 0.0156, "step": 6675 }, { "epoch": 1.36, "learning_rate": 0.00025112216525141005, "loss": 0.032, "step": 6676 }, { "epoch": 1.36, "learning_rate": 0.0002511078464424577, "loss": 0.0439, "step": 6677 }, { "epoch": 1.36, "learning_rate": 0.0002510935259448135, "loss": 0.0255, "step": 6678 }, { "epoch": 1.36, "learning_rate": 0.0002510792037587166, "loss": 0.0162, "step": 6679 }, { "epoch": 1.36, "learning_rate": 0.0002510648798844061, "loss": 0.0083, "step": 6680 }, { "epoch": 1.36, "learning_rate": 0.0002510505543221214, "loss": 0.0101, "step": 6681 }, { "epoch": 1.36, "learning_rate": 0.0002510362270721017, "loss": 0.0201, "step": 6682 }, { "epoch": 1.36, "learning_rate": 0.00025102189813458627, "loss": 0.0164, "step": 6683 }, { "epoch": 1.36, "learning_rate": 0.00025100756750981446, "loss": 0.0127, "step": 6684 }, { "epoch": 1.36, "learning_rate": 0.0002509932351980256, "loss": 0.035, "step": 6685 }, { "epoch": 1.36, "learning_rate": 0.0002509789011994591, "loss": 0.0121, "step": 6686 }, { "epoch": 1.36, "learning_rate": 0.00025096456551435426, "loss": 0.0207, "step": 6687 }, { "epoch": 1.36, "learning_rate": 0.0002509502281429507, "loss": 0.0205, "step": 6688 }, { "epoch": 1.36, "learning_rate": 0.0002509358890854877, "loss": 0.0146, "step": 6689 }, { "epoch": 1.36, "learning_rate": 0.00025092154834220485, "loss": 0.0083, "step": 6690 }, { "epoch": 1.36, "learning_rate": 0.00025090720591334164, "loss": 0.0038, "step": 6691 }, { "epoch": 1.36, "learning_rate": 0.0002508928617991376, "loss": 0.0031, "step": 6692 }, { "epoch": 1.36, "learning_rate": 0.00025087851599983233, "loss": 0.0081, "step": 6693 }, { "epoch": 1.36, "learning_rate": 0.00025086416851566545, "loss": 0.025, "step": 6694 }, { "epoch": 1.36, "learning_rate": 0.0002508498193468765, "loss": 0.0322, "step": 6695 }, { "epoch": 1.36, "learning_rate": 0.00025083546849370524, "loss": 0.0142, "step": 6696 }, { "epoch": 1.36, "learning_rate": 0.0002508211159563913, "loss": 0.0085, "step": 6697 }, { "epoch": 1.36, "learning_rate": 0.00025080676173517446, "loss": 0.0095, "step": 6698 }, { "epoch": 1.36, "learning_rate": 0.00025079240583029434, "loss": 0.0084, "step": 6699 }, { "epoch": 1.36, "learning_rate": 0.0002507780482419908, "loss": 0.0073, "step": 6700 }, { "epoch": 1.36, "learning_rate": 0.0002507636889705036, "loss": 0.016, "step": 6701 }, { "epoch": 1.36, "learning_rate": 0.0002507493280160727, "loss": 0.0252, "step": 6702 }, { "epoch": 1.36, "learning_rate": 0.0002507349653789378, "loss": 0.0382, "step": 6703 }, { "epoch": 1.37, "learning_rate": 0.0002507206010593387, "loss": 0.0177, "step": 6704 }, { "epoch": 1.37, "learning_rate": 0.00025070623505751556, "loss": 0.0323, "step": 6705 }, { "epoch": 1.37, "learning_rate": 0.00025069186737370817, "loss": 0.0049, "step": 6706 }, { "epoch": 1.37, "learning_rate": 0.00025067749800815656, "loss": 0.0134, "step": 6707 }, { "epoch": 1.37, "learning_rate": 0.00025066312696110063, "loss": 0.006, "step": 6708 }, { "epoch": 1.37, "learning_rate": 0.0002506487542327805, "loss": 0.0382, "step": 6709 }, { "epoch": 1.37, "learning_rate": 0.00025063437982343617, "loss": 0.0064, "step": 6710 }, { "epoch": 1.37, "learning_rate": 0.0002506200037333077, "loss": 0.0119, "step": 6711 }, { "epoch": 1.37, "learning_rate": 0.00025060562596263534, "loss": 0.0047, "step": 6712 }, { "epoch": 1.37, "learning_rate": 0.00025059124651165905, "loss": 0.0114, "step": 6713 }, { "epoch": 1.37, "learning_rate": 0.0002505768653806191, "loss": 0.0142, "step": 6714 }, { "epoch": 1.37, "learning_rate": 0.0002505624825697556, "loss": 0.0162, "step": 6715 }, { "epoch": 1.37, "learning_rate": 0.00025054809807930885, "loss": 0.0125, "step": 6716 }, { "epoch": 1.37, "learning_rate": 0.00025053371190951907, "loss": 0.0105, "step": 6717 }, { "epoch": 1.37, "learning_rate": 0.00025051932406062647, "loss": 0.0203, "step": 6718 }, { "epoch": 1.37, "learning_rate": 0.00025050493453287147, "loss": 0.0254, "step": 6719 }, { "epoch": 1.37, "learning_rate": 0.0002504905433264944, "loss": 0.0096, "step": 6720 }, { "epoch": 1.37, "learning_rate": 0.0002504761504417354, "loss": 0.0087, "step": 6721 }, { "epoch": 1.37, "learning_rate": 0.00025046175587883516, "loss": 0.022, "step": 6722 }, { "epoch": 1.37, "learning_rate": 0.0002504473596380339, "loss": 0.018, "step": 6723 }, { "epoch": 1.37, "learning_rate": 0.0002504329617195722, "loss": 0.0108, "step": 6724 }, { "epoch": 1.37, "learning_rate": 0.0002504185621236904, "loss": 0.0223, "step": 6725 }, { "epoch": 1.37, "learning_rate": 0.00025040416085062906, "loss": 0.0237, "step": 6726 }, { "epoch": 1.37, "learning_rate": 0.0002503897579006287, "loss": 0.0098, "step": 6727 }, { "epoch": 1.37, "learning_rate": 0.0002503753532739299, "loss": 0.0214, "step": 6728 }, { "epoch": 1.37, "learning_rate": 0.00025036094697077326, "loss": 0.0132, "step": 6729 }, { "epoch": 1.37, "learning_rate": 0.00025034653899139934, "loss": 0.0225, "step": 6730 }, { "epoch": 1.37, "learning_rate": 0.0002503321293360488, "loss": 0.0054, "step": 6731 }, { "epoch": 1.37, "learning_rate": 0.00025031771800496224, "loss": 0.0063, "step": 6732 }, { "epoch": 1.37, "learning_rate": 0.0002503033049983805, "loss": 0.0157, "step": 6733 }, { "epoch": 1.37, "learning_rate": 0.0002502888903165442, "loss": 0.0057, "step": 6734 }, { "epoch": 1.37, "learning_rate": 0.0002502744739596942, "loss": 0.0212, "step": 6735 }, { "epoch": 1.37, "learning_rate": 0.0002502600559280711, "loss": 0.0231, "step": 6736 }, { "epoch": 1.37, "learning_rate": 0.0002502456362219159, "loss": 0.0115, "step": 6737 }, { "epoch": 1.37, "learning_rate": 0.0002502312148414693, "loss": 0.0084, "step": 6738 }, { "epoch": 1.37, "learning_rate": 0.0002502167917869722, "loss": 0.0087, "step": 6739 }, { "epoch": 1.37, "learning_rate": 0.00025020236705866557, "loss": 0.011, "step": 6740 }, { "epoch": 1.37, "learning_rate": 0.00025018794065679017, "loss": 0.0082, "step": 6741 }, { "epoch": 1.37, "learning_rate": 0.00025017351258158706, "loss": 0.023, "step": 6742 }, { "epoch": 1.37, "learning_rate": 0.0002501590828332972, "loss": 0.0021, "step": 6743 }, { "epoch": 1.37, "learning_rate": 0.0002501446514121617, "loss": 0.0121, "step": 6744 }, { "epoch": 1.37, "learning_rate": 0.0002501302183184214, "loss": 0.0013, "step": 6745 }, { "epoch": 1.37, "learning_rate": 0.0002501157835523174, "loss": 0.0175, "step": 6746 }, { "epoch": 1.37, "learning_rate": 0.0002501013471140909, "loss": 0.0323, "step": 6747 }, { "epoch": 1.37, "learning_rate": 0.00025008690900398293, "loss": 0.0222, "step": 6748 }, { "epoch": 1.37, "learning_rate": 0.0002500724692222347, "loss": 0.0146, "step": 6749 }, { "epoch": 1.37, "learning_rate": 0.00025005802776908727, "loss": 0.0186, "step": 6750 }, { "epoch": 1.37, "learning_rate": 0.0002500435846447819, "loss": 0.0185, "step": 6751 }, { "epoch": 1.37, "learning_rate": 0.00025002913984955986, "loss": 0.0214, "step": 6752 }, { "epoch": 1.38, "learning_rate": 0.00025001469338366234, "loss": 0.0064, "step": 6753 }, { "epoch": 1.38, "learning_rate": 0.00025000024524733064, "loss": 0.0107, "step": 6754 }, { "epoch": 1.38, "learning_rate": 0.00024998579544080614, "loss": 0.0059, "step": 6755 }, { "epoch": 1.38, "learning_rate": 0.00024997134396433004, "loss": 0.0068, "step": 6756 }, { "epoch": 1.38, "learning_rate": 0.0002499568908181439, "loss": 0.0057, "step": 6757 }, { "epoch": 1.38, "learning_rate": 0.0002499424360024889, "loss": 0.0132, "step": 6758 }, { "epoch": 1.38, "learning_rate": 0.00024992797951760656, "loss": 0.0111, "step": 6759 }, { "epoch": 1.38, "learning_rate": 0.00024991352136373836, "loss": 0.0135, "step": 6760 }, { "epoch": 1.38, "learning_rate": 0.00024989906154112575, "loss": 0.0054, "step": 6761 }, { "epoch": 1.38, "learning_rate": 0.0002498846000500103, "loss": 0.0084, "step": 6762 }, { "epoch": 1.38, "learning_rate": 0.0002498701368906334, "loss": 0.011, "step": 6763 }, { "epoch": 1.38, "learning_rate": 0.0002498556720632367, "loss": 0.0364, "step": 6764 }, { "epoch": 1.38, "learning_rate": 0.0002498412055680618, "loss": 0.0234, "step": 6765 }, { "epoch": 1.38, "learning_rate": 0.00024982673740535035, "loss": 0.0091, "step": 6766 }, { "epoch": 1.38, "learning_rate": 0.00024981226757534396, "loss": 0.0186, "step": 6767 }, { "epoch": 1.38, "learning_rate": 0.0002497977960782842, "loss": 0.0033, "step": 6768 }, { "epoch": 1.38, "learning_rate": 0.00024978332291441293, "loss": 0.0203, "step": 6769 }, { "epoch": 1.38, "learning_rate": 0.00024976884808397174, "loss": 0.0065, "step": 6770 }, { "epoch": 1.38, "learning_rate": 0.00024975437158720256, "loss": 0.0116, "step": 6771 }, { "epoch": 1.38, "learning_rate": 0.000249739893424347, "loss": 0.0082, "step": 6772 }, { "epoch": 1.38, "learning_rate": 0.000249725413595647, "loss": 0.0284, "step": 6773 }, { "epoch": 1.38, "learning_rate": 0.0002497109321013443, "loss": 0.025, "step": 6774 }, { "epoch": 1.38, "learning_rate": 0.00024969644894168086, "loss": 0.047, "step": 6775 }, { "epoch": 1.38, "learning_rate": 0.00024968196411689854, "loss": 0.0089, "step": 6776 }, { "epoch": 1.38, "learning_rate": 0.0002496674776272392, "loss": 0.014, "step": 6777 }, { "epoch": 1.38, "learning_rate": 0.0002496529894729449, "loss": 0.0182, "step": 6778 }, { "epoch": 1.38, "learning_rate": 0.00024963849965425753, "loss": 0.0211, "step": 6779 }, { "epoch": 1.38, "learning_rate": 0.00024962400817141916, "loss": 0.014, "step": 6780 }, { "epoch": 1.38, "learning_rate": 0.00024960951502467176, "loss": 0.0204, "step": 6781 }, { "epoch": 1.38, "learning_rate": 0.0002495950202142575, "loss": 0.0094, "step": 6782 }, { "epoch": 1.38, "learning_rate": 0.00024958052374041834, "loss": 0.0088, "step": 6783 }, { "epoch": 1.38, "learning_rate": 0.00024956602560339647, "loss": 0.0165, "step": 6784 }, { "epoch": 1.38, "learning_rate": 0.0002495515258034341, "loss": 0.0262, "step": 6785 }, { "epoch": 1.38, "learning_rate": 0.00024953702434077325, "loss": 0.0112, "step": 6786 }, { "epoch": 1.38, "learning_rate": 0.0002495225212156562, "loss": 0.0333, "step": 6787 }, { "epoch": 1.38, "learning_rate": 0.00024950801642832524, "loss": 0.0115, "step": 6788 }, { "epoch": 1.38, "learning_rate": 0.0002494935099790225, "loss": 0.039, "step": 6789 }, { "epoch": 1.38, "learning_rate": 0.00024947900186799045, "loss": 0.0092, "step": 6790 }, { "epoch": 1.38, "learning_rate": 0.0002494644920954712, "loss": 0.0091, "step": 6791 }, { "epoch": 1.38, "learning_rate": 0.00024944998066170717, "loss": 0.0101, "step": 6792 }, { "epoch": 1.38, "learning_rate": 0.0002494354675669408, "loss": 0.0051, "step": 6793 }, { "epoch": 1.38, "learning_rate": 0.0002494209528114144, "loss": 0.0173, "step": 6794 }, { "epoch": 1.38, "learning_rate": 0.0002494064363953704, "loss": 0.0029, "step": 6795 }, { "epoch": 1.38, "learning_rate": 0.0002493919183190513, "loss": 0.0106, "step": 6796 }, { "epoch": 1.38, "learning_rate": 0.00024937739858269946, "loss": 0.0106, "step": 6797 }, { "epoch": 1.38, "learning_rate": 0.00024936287718655754, "loss": 0.0018, "step": 6798 }, { "epoch": 1.38, "learning_rate": 0.00024934835413086806, "loss": 0.0104, "step": 6799 }, { "epoch": 1.38, "learning_rate": 0.0002493338294158735, "loss": 0.0359, "step": 6800 }, { "epoch": 1.38, "learning_rate": 0.0002493193030418165, "loss": 0.0268, "step": 6801 }, { "epoch": 1.39, "learning_rate": 0.00024930477500893956, "loss": 0.018, "step": 6802 }, { "epoch": 1.39, "learning_rate": 0.0002492902453174855, "loss": 0.0187, "step": 6803 }, { "epoch": 1.39, "learning_rate": 0.00024927571396769695, "loss": 0.0247, "step": 6804 }, { "epoch": 1.39, "learning_rate": 0.00024926118095981655, "loss": 0.0153, "step": 6805 }, { "epoch": 1.39, "learning_rate": 0.00024924664629408705, "loss": 0.0112, "step": 6806 }, { "epoch": 1.39, "learning_rate": 0.0002492321099707512, "loss": 0.009, "step": 6807 }, { "epoch": 1.39, "learning_rate": 0.0002492175719900518, "loss": 0.0833, "step": 6808 }, { "epoch": 1.39, "learning_rate": 0.0002492030323522317, "loss": 0.0077, "step": 6809 }, { "epoch": 1.39, "learning_rate": 0.0002491884910575337, "loss": 0.0069, "step": 6810 }, { "epoch": 1.39, "learning_rate": 0.00024917394810620064, "loss": 0.0236, "step": 6811 }, { "epoch": 1.39, "learning_rate": 0.00024915940349847545, "loss": 0.02, "step": 6812 }, { "epoch": 1.39, "learning_rate": 0.00024914485723460104, "loss": 0.003, "step": 6813 }, { "epoch": 1.39, "learning_rate": 0.0002491303093148204, "loss": 0.0135, "step": 6814 }, { "epoch": 1.39, "learning_rate": 0.00024911575973937645, "loss": 0.0099, "step": 6815 }, { "epoch": 1.39, "learning_rate": 0.00024910120850851216, "loss": 0.0026, "step": 6816 }, { "epoch": 1.39, "learning_rate": 0.00024908665562247074, "loss": 0.0291, "step": 6817 }, { "epoch": 1.39, "learning_rate": 0.00024907210108149504, "loss": 0.0084, "step": 6818 }, { "epoch": 1.39, "learning_rate": 0.00024905754488582825, "loss": 0.0175, "step": 6819 }, { "epoch": 1.39, "learning_rate": 0.0002490429870357135, "loss": 0.0116, "step": 6820 }, { "epoch": 1.39, "learning_rate": 0.0002490284275313939, "loss": 0.0147, "step": 6821 }, { "epoch": 1.39, "learning_rate": 0.00024901386637311265, "loss": 0.012, "step": 6822 }, { "epoch": 1.39, "learning_rate": 0.0002489993035611129, "loss": 0.0086, "step": 6823 }, { "epoch": 1.39, "learning_rate": 0.00024898473909563794, "loss": 0.0078, "step": 6824 }, { "epoch": 1.39, "learning_rate": 0.00024897017297693095, "loss": 0.021, "step": 6825 }, { "epoch": 1.39, "learning_rate": 0.00024895560520523524, "loss": 0.0172, "step": 6826 }, { "epoch": 1.39, "learning_rate": 0.0002489410357807942, "loss": 0.007, "step": 6827 }, { "epoch": 1.39, "learning_rate": 0.00024892646470385104, "loss": 0.0111, "step": 6828 }, { "epoch": 1.39, "learning_rate": 0.00024891189197464924, "loss": 0.0294, "step": 6829 }, { "epoch": 1.39, "learning_rate": 0.00024889731759343206, "loss": 0.0123, "step": 6830 }, { "epoch": 1.39, "learning_rate": 0.00024888274156044306, "loss": 0.0097, "step": 6831 }, { "epoch": 1.39, "learning_rate": 0.0002488681638759256, "loss": 0.0044, "step": 6832 }, { "epoch": 1.39, "learning_rate": 0.0002488535845401231, "loss": 0.0099, "step": 6833 }, { "epoch": 1.39, "learning_rate": 0.0002488390035532793, "loss": 0.0029, "step": 6834 }, { "epoch": 1.39, "learning_rate": 0.00024882442091563744, "loss": 0.0353, "step": 6835 }, { "epoch": 1.39, "learning_rate": 0.00024880983662744127, "loss": 0.0082, "step": 6836 }, { "epoch": 1.39, "learning_rate": 0.00024879525068893424, "loss": 0.0185, "step": 6837 }, { "epoch": 1.39, "learning_rate": 0.0002487806631003601, "loss": 0.0246, "step": 6838 }, { "epoch": 1.39, "learning_rate": 0.00024876607386196243, "loss": 0.005, "step": 6839 }, { "epoch": 1.39, "learning_rate": 0.0002487514829739848, "loss": 0.0132, "step": 6840 }, { "epoch": 1.39, "learning_rate": 0.0002487368904366711, "loss": 0.0244, "step": 6841 }, { "epoch": 1.39, "learning_rate": 0.00024872229625026493, "loss": 0.045, "step": 6842 }, { "epoch": 1.39, "learning_rate": 0.00024870770041501004, "loss": 0.033, "step": 6843 }, { "epoch": 1.39, "learning_rate": 0.00024869310293115023, "loss": 0.0194, "step": 6844 }, { "epoch": 1.39, "learning_rate": 0.00024867850379892934, "loss": 0.0113, "step": 6845 }, { "epoch": 1.39, "learning_rate": 0.0002486639030185911, "loss": 0.0115, "step": 6846 }, { "epoch": 1.39, "learning_rate": 0.0002486493005903795, "loss": 0.0045, "step": 6847 }, { "epoch": 1.39, "learning_rate": 0.00024863469651453834, "loss": 0.0024, "step": 6848 }, { "epoch": 1.39, "learning_rate": 0.00024862009079131155, "loss": 0.0037, "step": 6849 }, { "epoch": 1.39, "learning_rate": 0.0002486054834209431, "loss": 0.0139, "step": 6850 }, { "epoch": 1.39, "learning_rate": 0.00024859087440367694, "loss": 0.0315, "step": 6851 }, { "epoch": 1.4, "learning_rate": 0.0002485762637397571, "loss": 0.0287, "step": 6852 }, { "epoch": 1.4, "learning_rate": 0.0002485616514294275, "loss": 0.0148, "step": 6853 }, { "epoch": 1.4, "learning_rate": 0.00024854703747293237, "loss": 0.0068, "step": 6854 }, { "epoch": 1.4, "learning_rate": 0.00024853242187051567, "loss": 0.0118, "step": 6855 }, { "epoch": 1.4, "learning_rate": 0.0002485178046224215, "loss": 0.013, "step": 6856 }, { "epoch": 1.4, "learning_rate": 0.00024850318572889403, "loss": 0.0034, "step": 6857 }, { "epoch": 1.4, "learning_rate": 0.0002484885651901774, "loss": 0.0108, "step": 6858 }, { "epoch": 1.4, "learning_rate": 0.0002484739430065159, "loss": 0.0125, "step": 6859 }, { "epoch": 1.4, "learning_rate": 0.0002484593191781536, "loss": 0.016, "step": 6860 }, { "epoch": 1.4, "learning_rate": 0.0002484446937053349, "loss": 0.0145, "step": 6861 }, { "epoch": 1.4, "learning_rate": 0.0002484300665883039, "loss": 0.0253, "step": 6862 }, { "epoch": 1.4, "learning_rate": 0.000248415437827305, "loss": 0.0165, "step": 6863 }, { "epoch": 1.4, "learning_rate": 0.00024840080742258254, "loss": 0.0058, "step": 6864 }, { "epoch": 1.4, "learning_rate": 0.00024838617537438083, "loss": 0.0418, "step": 6865 }, { "epoch": 1.4, "learning_rate": 0.0002483715416829443, "loss": 0.01, "step": 6866 }, { "epoch": 1.4, "learning_rate": 0.0002483569063485173, "loss": 0.0099, "step": 6867 }, { "epoch": 1.4, "learning_rate": 0.0002483422693713443, "loss": 0.0125, "step": 6868 }, { "epoch": 1.4, "learning_rate": 0.0002483276307516698, "loss": 0.01, "step": 6869 }, { "epoch": 1.4, "learning_rate": 0.00024831299048973823, "loss": 0.0119, "step": 6870 }, { "epoch": 1.4, "learning_rate": 0.00024829834858579417, "loss": 0.014, "step": 6871 }, { "epoch": 1.4, "learning_rate": 0.00024828370504008216, "loss": 0.0212, "step": 6872 }, { "epoch": 1.4, "learning_rate": 0.00024826905985284676, "loss": 0.011, "step": 6873 }, { "epoch": 1.4, "learning_rate": 0.0002482544130243325, "loss": 0.017, "step": 6874 }, { "epoch": 1.4, "learning_rate": 0.0002482397645547841, "loss": 0.008, "step": 6875 }, { "epoch": 1.4, "learning_rate": 0.0002482251144444462, "loss": 0.0273, "step": 6876 }, { "epoch": 1.4, "learning_rate": 0.00024821046269356343, "loss": 0.0101, "step": 6877 }, { "epoch": 1.4, "learning_rate": 0.0002481958093023806, "loss": 0.0076, "step": 6878 }, { "epoch": 1.4, "learning_rate": 0.00024818115427114234, "loss": 0.0283, "step": 6879 }, { "epoch": 1.4, "learning_rate": 0.00024816649760009353, "loss": 0.0053, "step": 6880 }, { "epoch": 1.4, "learning_rate": 0.0002481518392894789, "loss": 0.0239, "step": 6881 }, { "epoch": 1.4, "learning_rate": 0.00024813717933954327, "loss": 0.0075, "step": 6882 }, { "epoch": 1.4, "learning_rate": 0.0002481225177505315, "loss": 0.0147, "step": 6883 }, { "epoch": 1.4, "learning_rate": 0.00024810785452268846, "loss": 0.0097, "step": 6884 }, { "epoch": 1.4, "learning_rate": 0.0002480931896562591, "loss": 0.0096, "step": 6885 }, { "epoch": 1.4, "learning_rate": 0.0002480785231514882, "loss": 0.0099, "step": 6886 }, { "epoch": 1.4, "learning_rate": 0.00024806385500862095, "loss": 0.0099, "step": 6887 }, { "epoch": 1.4, "learning_rate": 0.00024804918522790216, "loss": 0.0192, "step": 6888 }, { "epoch": 1.4, "learning_rate": 0.00024803451380957687, "loss": 0.0115, "step": 6889 }, { "epoch": 1.4, "learning_rate": 0.00024801984075389016, "loss": 0.0239, "step": 6890 }, { "epoch": 1.4, "learning_rate": 0.0002480051660610871, "loss": 0.0117, "step": 6891 }, { "epoch": 1.4, "learning_rate": 0.0002479904897314128, "loss": 0.0096, "step": 6892 }, { "epoch": 1.4, "learning_rate": 0.00024797581176511227, "loss": 0.0277, "step": 6893 }, { "epoch": 1.4, "learning_rate": 0.0002479611321624308, "loss": 0.0231, "step": 6894 }, { "epoch": 1.4, "learning_rate": 0.00024794645092361347, "loss": 0.0096, "step": 6895 }, { "epoch": 1.4, "learning_rate": 0.00024793176804890557, "loss": 0.0034, "step": 6896 }, { "epoch": 1.4, "learning_rate": 0.0002479170835385522, "loss": 0.0182, "step": 6897 }, { "epoch": 1.4, "learning_rate": 0.0002479023973927988, "loss": 0.0124, "step": 6898 }, { "epoch": 1.4, "learning_rate": 0.00024788770961189054, "loss": 0.0268, "step": 6899 }, { "epoch": 1.4, "learning_rate": 0.00024787302019607275, "loss": 0.0103, "step": 6900 }, { "epoch": 1.41, "learning_rate": 0.00024785832914559077, "loss": 0.0017, "step": 6901 }, { "epoch": 1.41, "learning_rate": 0.00024784363646068996, "loss": 0.0257, "step": 6902 }, { "epoch": 1.41, "learning_rate": 0.0002478289421416157, "loss": 0.0159, "step": 6903 }, { "epoch": 1.41, "learning_rate": 0.0002478142461886135, "loss": 0.0181, "step": 6904 }, { "epoch": 1.41, "learning_rate": 0.0002477995486019287, "loss": 0.0048, "step": 6905 }, { "epoch": 1.41, "learning_rate": 0.00024778484938180683, "loss": 0.0146, "step": 6906 }, { "epoch": 1.41, "learning_rate": 0.00024777014852849345, "loss": 0.0088, "step": 6907 }, { "epoch": 1.41, "learning_rate": 0.00024775544604223397, "loss": 0.0229, "step": 6908 }, { "epoch": 1.41, "learning_rate": 0.0002477407419232741, "loss": 0.0129, "step": 6909 }, { "epoch": 1.41, "learning_rate": 0.00024772603617185927, "loss": 0.0043, "step": 6910 }, { "epoch": 1.41, "learning_rate": 0.0002477113287882352, "loss": 0.004, "step": 6911 }, { "epoch": 1.41, "learning_rate": 0.0002476966197726475, "loss": 0.027, "step": 6912 }, { "epoch": 1.41, "learning_rate": 0.00024768190912534177, "loss": 0.0077, "step": 6913 }, { "epoch": 1.41, "learning_rate": 0.00024766719684656376, "loss": 0.0089, "step": 6914 }, { "epoch": 1.41, "learning_rate": 0.0002476524829365593, "loss": 0.0095, "step": 6915 }, { "epoch": 1.41, "learning_rate": 0.000247637767395574, "loss": 0.0299, "step": 6916 }, { "epoch": 1.41, "learning_rate": 0.00024762305022385365, "loss": 0.0417, "step": 6917 }, { "epoch": 1.41, "learning_rate": 0.00024760833142164416, "loss": 0.0265, "step": 6918 }, { "epoch": 1.41, "learning_rate": 0.0002475936109891912, "loss": 0.0259, "step": 6919 }, { "epoch": 1.41, "learning_rate": 0.00024757888892674074, "loss": 0.0077, "step": 6920 }, { "epoch": 1.41, "learning_rate": 0.0002475641652345387, "loss": 0.0238, "step": 6921 }, { "epoch": 1.41, "learning_rate": 0.00024754943991283084, "loss": 0.0118, "step": 6922 }, { "epoch": 1.41, "learning_rate": 0.00024753471296186326, "loss": 0.0006, "step": 6923 }, { "epoch": 1.41, "learning_rate": 0.0002475199843818819, "loss": 0.0091, "step": 6924 }, { "epoch": 1.41, "learning_rate": 0.00024750525417313265, "loss": 0.0117, "step": 6925 }, { "epoch": 1.41, "learning_rate": 0.00024749052233586163, "loss": 0.0066, "step": 6926 }, { "epoch": 1.41, "learning_rate": 0.0002474757888703148, "loss": 0.0037, "step": 6927 }, { "epoch": 1.41, "learning_rate": 0.00024746105377673836, "loss": 0.02, "step": 6928 }, { "epoch": 1.41, "learning_rate": 0.0002474463170553784, "loss": 0.005, "step": 6929 }, { "epoch": 1.41, "learning_rate": 0.0002474315787064809, "loss": 0.0074, "step": 6930 }, { "epoch": 1.41, "learning_rate": 0.00024741683873029217, "loss": 0.0264, "step": 6931 }, { "epoch": 1.41, "learning_rate": 0.0002474020971270583, "loss": 0.0125, "step": 6932 }, { "epoch": 1.41, "learning_rate": 0.0002473873538970256, "loss": 0.0082, "step": 6933 }, { "epoch": 1.41, "learning_rate": 0.00024737260904044025, "loss": 0.0218, "step": 6934 }, { "epoch": 1.41, "learning_rate": 0.0002473578625575485, "loss": 0.02, "step": 6935 }, { "epoch": 1.41, "learning_rate": 0.0002473431144485967, "loss": 0.0188, "step": 6936 }, { "epoch": 1.41, "learning_rate": 0.0002473283647138312, "loss": 0.0136, "step": 6937 }, { "epoch": 1.41, "learning_rate": 0.0002473136133534982, "loss": 0.0142, "step": 6938 }, { "epoch": 1.41, "learning_rate": 0.00024729886036784415, "loss": 0.0052, "step": 6939 }, { "epoch": 1.41, "learning_rate": 0.00024728410575711553, "loss": 0.0128, "step": 6940 }, { "epoch": 1.41, "learning_rate": 0.00024726934952155866, "loss": 0.0142, "step": 6941 }, { "epoch": 1.41, "learning_rate": 0.0002472545916614201, "loss": 0.0399, "step": 6942 }, { "epoch": 1.41, "learning_rate": 0.00024723983217694623, "loss": 0.0113, "step": 6943 }, { "epoch": 1.41, "learning_rate": 0.0002472250710683836, "loss": 0.0082, "step": 6944 }, { "epoch": 1.41, "learning_rate": 0.0002472103083359788, "loss": 0.0093, "step": 6945 }, { "epoch": 1.41, "learning_rate": 0.00024719554397997827, "loss": 0.0202, "step": 6946 }, { "epoch": 1.41, "learning_rate": 0.00024718077800062877, "loss": 0.0136, "step": 6947 }, { "epoch": 1.41, "learning_rate": 0.00024716601039817684, "loss": 0.02, "step": 6948 }, { "epoch": 1.41, "learning_rate": 0.0002471512411728691, "loss": 0.0179, "step": 6949 }, { "epoch": 1.42, "learning_rate": 0.00024713647032495223, "loss": 0.0165, "step": 6950 }, { "epoch": 1.42, "learning_rate": 0.0002471216978546729, "loss": 0.012, "step": 6951 }, { "epoch": 1.42, "learning_rate": 0.00024710692376227796, "loss": 0.0101, "step": 6952 }, { "epoch": 1.42, "learning_rate": 0.00024709214804801414, "loss": 0.0477, "step": 6953 }, { "epoch": 1.42, "learning_rate": 0.0002470773707121281, "loss": 0.0037, "step": 6954 }, { "epoch": 1.42, "learning_rate": 0.0002470625917548667, "loss": 0.0246, "step": 6955 }, { "epoch": 1.42, "learning_rate": 0.00024704781117647687, "loss": 0.0142, "step": 6956 }, { "epoch": 1.42, "learning_rate": 0.00024703302897720536, "loss": 0.0284, "step": 6957 }, { "epoch": 1.42, "learning_rate": 0.0002470182451572991, "loss": 0.0084, "step": 6958 }, { "epoch": 1.42, "learning_rate": 0.000247003459717005, "loss": 0.0142, "step": 6959 }, { "epoch": 1.42, "learning_rate": 0.00024698867265657, "loss": 0.0058, "step": 6960 }, { "epoch": 1.42, "learning_rate": 0.00024697388397624116, "loss": 0.0091, "step": 6961 }, { "epoch": 1.42, "learning_rate": 0.00024695909367626536, "loss": 0.0168, "step": 6962 }, { "epoch": 1.42, "learning_rate": 0.0002469443017568897, "loss": 0.0095, "step": 6963 }, { "epoch": 1.42, "learning_rate": 0.0002469295082183612, "loss": 0.0301, "step": 6964 }, { "epoch": 1.42, "learning_rate": 0.0002469147130609269, "loss": 0.0123, "step": 6965 }, { "epoch": 1.42, "learning_rate": 0.000246899916284834, "loss": 0.0163, "step": 6966 }, { "epoch": 1.42, "learning_rate": 0.00024688511789032957, "loss": 0.0143, "step": 6967 }, { "epoch": 1.42, "learning_rate": 0.00024687031787766077, "loss": 0.0085, "step": 6968 }, { "epoch": 1.42, "learning_rate": 0.0002468555162470748, "loss": 0.0162, "step": 6969 }, { "epoch": 1.42, "learning_rate": 0.00024684071299881896, "loss": 0.0175, "step": 6970 }, { "epoch": 1.42, "learning_rate": 0.00024682590813314035, "loss": 0.0207, "step": 6971 }, { "epoch": 1.42, "learning_rate": 0.0002468111016502863, "loss": 0.0236, "step": 6972 }, { "epoch": 1.42, "learning_rate": 0.00024679629355050414, "loss": 0.0097, "step": 6973 }, { "epoch": 1.42, "learning_rate": 0.0002467814838340411, "loss": 0.0415, "step": 6974 }, { "epoch": 1.42, "learning_rate": 0.00024676667250114466, "loss": 0.0125, "step": 6975 }, { "epoch": 1.42, "learning_rate": 0.00024675185955206204, "loss": 0.0031, "step": 6976 }, { "epoch": 1.42, "learning_rate": 0.0002467370449870408, "loss": 0.0038, "step": 6977 }, { "epoch": 1.42, "learning_rate": 0.0002467222288063283, "loss": 0.0071, "step": 6978 }, { "epoch": 1.42, "learning_rate": 0.000246707411010172, "loss": 0.0181, "step": 6979 }, { "epoch": 1.42, "learning_rate": 0.0002466925915988194, "loss": 0.0175, "step": 6980 }, { "epoch": 1.42, "learning_rate": 0.000246677770572518, "loss": 0.0166, "step": 6981 }, { "epoch": 1.42, "learning_rate": 0.0002466629479315153, "loss": 0.007, "step": 6982 }, { "epoch": 1.42, "learning_rate": 0.00024664812367605895, "loss": 0.0052, "step": 6983 }, { "epoch": 1.42, "learning_rate": 0.00024663329780639647, "loss": 0.0111, "step": 6984 }, { "epoch": 1.42, "learning_rate": 0.00024661847032277556, "loss": 0.0226, "step": 6985 }, { "epoch": 1.42, "learning_rate": 0.00024660364122544375, "loss": 0.0334, "step": 6986 }, { "epoch": 1.42, "learning_rate": 0.00024658881051464884, "loss": 0.0316, "step": 6987 }, { "epoch": 1.42, "learning_rate": 0.0002465739781906384, "loss": 0.0127, "step": 6988 }, { "epoch": 1.42, "learning_rate": 0.00024655914425366027, "loss": 0.0118, "step": 6989 }, { "epoch": 1.42, "learning_rate": 0.00024654430870396215, "loss": 0.0154, "step": 6990 }, { "epoch": 1.42, "learning_rate": 0.00024652947154179183, "loss": 0.0101, "step": 6991 }, { "epoch": 1.42, "learning_rate": 0.00024651463276739716, "loss": 0.0031, "step": 6992 }, { "epoch": 1.42, "learning_rate": 0.00024649979238102593, "loss": 0.0255, "step": 6993 }, { "epoch": 1.42, "learning_rate": 0.00024648495038292594, "loss": 0.0144, "step": 6994 }, { "epoch": 1.42, "learning_rate": 0.00024647010677334526, "loss": 0.0231, "step": 6995 }, { "epoch": 1.42, "learning_rate": 0.0002464552615525316, "loss": 0.0143, "step": 6996 }, { "epoch": 1.42, "learning_rate": 0.000246440414720733, "loss": 0.0107, "step": 6997 }, { "epoch": 1.42, "learning_rate": 0.0002464255662781975, "loss": 0.0332, "step": 6998 }, { "epoch": 1.43, "learning_rate": 0.000246410716225173, "loss": 0.0066, "step": 6999 }, { "epoch": 1.43, "learning_rate": 0.0002463958645619075, "loss": 0.006, "step": 7000 }, { "epoch": 1.43, "learning_rate": 0.00024638101128864916, "loss": 0.0061, "step": 7001 }, { "epoch": 1.43, "learning_rate": 0.000246366156405646, "loss": 0.0062, "step": 7002 }, { "epoch": 1.43, "learning_rate": 0.00024635129991314614, "loss": 0.0189, "step": 7003 }, { "epoch": 1.43, "learning_rate": 0.0002463364418113977, "loss": 0.0154, "step": 7004 }, { "epoch": 1.43, "learning_rate": 0.0002463215821006488, "loss": 0.0365, "step": 7005 }, { "epoch": 1.43, "learning_rate": 0.0002463067207811476, "loss": 0.0155, "step": 7006 }, { "epoch": 1.43, "learning_rate": 0.0002462918578531425, "loss": 0.008, "step": 7007 }, { "epoch": 1.43, "learning_rate": 0.0002462769933168815, "loss": 0.0109, "step": 7008 }, { "epoch": 1.43, "learning_rate": 0.000246262127172613, "loss": 0.0321, "step": 7009 }, { "epoch": 1.43, "learning_rate": 0.0002462472594205853, "loss": 0.0104, "step": 7010 }, { "epoch": 1.43, "learning_rate": 0.0002462323900610467, "loss": 0.0238, "step": 7011 }, { "epoch": 1.43, "learning_rate": 0.0002462175190942455, "loss": 0.0092, "step": 7012 }, { "epoch": 1.43, "learning_rate": 0.0002462026465204301, "loss": 0.0104, "step": 7013 }, { "epoch": 1.43, "learning_rate": 0.00024618777233984896, "loss": 0.012, "step": 7014 }, { "epoch": 1.43, "learning_rate": 0.0002461728965527504, "loss": 0.0239, "step": 7015 }, { "epoch": 1.43, "learning_rate": 0.00024615801915938297, "loss": 0.0106, "step": 7016 }, { "epoch": 1.43, "learning_rate": 0.0002461431401599951, "loss": 0.0175, "step": 7017 }, { "epoch": 1.43, "learning_rate": 0.0002461282595548353, "loss": 0.0168, "step": 7018 }, { "epoch": 1.43, "learning_rate": 0.0002461133773441521, "loss": 0.0193, "step": 7019 }, { "epoch": 1.43, "learning_rate": 0.000246098493528194, "loss": 0.0267, "step": 7020 }, { "epoch": 1.43, "learning_rate": 0.0002460836081072098, "loss": 0.0082, "step": 7021 }, { "epoch": 1.43, "learning_rate": 0.00024606872108144786, "loss": 0.02, "step": 7022 }, { "epoch": 1.43, "learning_rate": 0.00024605383245115704, "loss": 0.0056, "step": 7023 }, { "epoch": 1.43, "learning_rate": 0.0002460389422165858, "loss": 0.0089, "step": 7024 }, { "epoch": 1.43, "learning_rate": 0.000246024050377983, "loss": 0.0017, "step": 7025 }, { "epoch": 1.43, "learning_rate": 0.00024600915693559727, "loss": 0.0087, "step": 7026 }, { "epoch": 1.43, "learning_rate": 0.0002459942618896774, "loss": 0.0171, "step": 7027 }, { "epoch": 1.43, "learning_rate": 0.00024597936524047215, "loss": 0.0205, "step": 7028 }, { "epoch": 1.43, "learning_rate": 0.00024596446698823036, "loss": 0.0017, "step": 7029 }, { "epoch": 1.43, "learning_rate": 0.0002459495671332008, "loss": 0.0567, "step": 7030 }, { "epoch": 1.43, "learning_rate": 0.00024593466567563235, "loss": 0.0107, "step": 7031 }, { "epoch": 1.43, "learning_rate": 0.0002459197626157739, "loss": 0.016, "step": 7032 }, { "epoch": 1.43, "learning_rate": 0.00024590485795387436, "loss": 0.0066, "step": 7033 }, { "epoch": 1.43, "learning_rate": 0.0002458899516901826, "loss": 0.0477, "step": 7034 }, { "epoch": 1.43, "learning_rate": 0.00024587504382494774, "loss": 0.0098, "step": 7035 }, { "epoch": 1.43, "learning_rate": 0.0002458601343584186, "loss": 0.0338, "step": 7036 }, { "epoch": 1.43, "learning_rate": 0.00024584522329084427, "loss": 0.0154, "step": 7037 }, { "epoch": 1.43, "learning_rate": 0.0002458303106224738, "loss": 0.0151, "step": 7038 }, { "epoch": 1.43, "learning_rate": 0.0002458153963535563, "loss": 0.0292, "step": 7039 }, { "epoch": 1.43, "learning_rate": 0.0002458004804843408, "loss": 0.0089, "step": 7040 }, { "epoch": 1.43, "learning_rate": 0.0002457855630150764, "loss": 0.0038, "step": 7041 }, { "epoch": 1.43, "learning_rate": 0.00024577064394601226, "loss": 0.0133, "step": 7042 }, { "epoch": 1.43, "learning_rate": 0.0002457557232773976, "loss": 0.0144, "step": 7043 }, { "epoch": 1.43, "learning_rate": 0.0002457408010094817, "loss": 0.0052, "step": 7044 }, { "epoch": 1.43, "learning_rate": 0.00024572587714251365, "loss": 0.0134, "step": 7045 }, { "epoch": 1.43, "learning_rate": 0.00024571095167674273, "loss": 0.0101, "step": 7046 }, { "epoch": 1.43, "learning_rate": 0.0002456960246124182, "loss": 0.0193, "step": 7047 }, { "epoch": 1.44, "learning_rate": 0.00024568109594978954, "loss": 0.0041, "step": 7048 }, { "epoch": 1.44, "learning_rate": 0.00024566616568910595, "loss": 0.0085, "step": 7049 }, { "epoch": 1.44, "learning_rate": 0.00024565123383061676, "loss": 0.0174, "step": 7050 }, { "epoch": 1.44, "learning_rate": 0.00024563630037457144, "loss": 0.0058, "step": 7051 }, { "epoch": 1.44, "learning_rate": 0.0002456213653212193, "loss": 0.0164, "step": 7052 }, { "epoch": 1.44, "learning_rate": 0.00024560642867080994, "loss": 0.0108, "step": 7053 }, { "epoch": 1.44, "learning_rate": 0.00024559149042359277, "loss": 0.018, "step": 7054 }, { "epoch": 1.44, "learning_rate": 0.0002455765505798172, "loss": 0.0115, "step": 7055 }, { "epoch": 1.44, "learning_rate": 0.0002455616091397329, "loss": 0.0123, "step": 7056 }, { "epoch": 1.44, "learning_rate": 0.00024554666610358925, "loss": 0.0086, "step": 7057 }, { "epoch": 1.44, "learning_rate": 0.00024553172147163596, "loss": 0.0178, "step": 7058 }, { "epoch": 1.44, "learning_rate": 0.0002455167752441226, "loss": 0.0107, "step": 7059 }, { "epoch": 1.44, "learning_rate": 0.0002455018274212988, "loss": 0.037, "step": 7060 }, { "epoch": 1.44, "learning_rate": 0.0002454868780034142, "loss": 0.0099, "step": 7061 }, { "epoch": 1.44, "learning_rate": 0.0002454719269907185, "loss": 0.0085, "step": 7062 }, { "epoch": 1.44, "learning_rate": 0.0002454569743834614, "loss": 0.0372, "step": 7063 }, { "epoch": 1.44, "learning_rate": 0.00024544202018189263, "loss": 0.0115, "step": 7064 }, { "epoch": 1.44, "learning_rate": 0.00024542706438626194, "loss": 0.0037, "step": 7065 }, { "epoch": 1.44, "learning_rate": 0.0002454121069968192, "loss": 0.0018, "step": 7066 }, { "epoch": 1.44, "learning_rate": 0.00024539714801381416, "loss": 0.0036, "step": 7067 }, { "epoch": 1.44, "learning_rate": 0.0002453821874374966, "loss": 0.0203, "step": 7068 }, { "epoch": 1.44, "learning_rate": 0.0002453672252681165, "loss": 0.0338, "step": 7069 }, { "epoch": 1.44, "learning_rate": 0.0002453522615059238, "loss": 0.0145, "step": 7070 }, { "epoch": 1.44, "learning_rate": 0.0002453372961511683, "loss": 0.0124, "step": 7071 }, { "epoch": 1.44, "learning_rate": 0.00024532232920409993, "loss": 0.0115, "step": 7072 }, { "epoch": 1.44, "learning_rate": 0.0002453073606649688, "loss": 0.0087, "step": 7073 }, { "epoch": 1.44, "learning_rate": 0.0002452923905340248, "loss": 0.0197, "step": 7074 }, { "epoch": 1.44, "learning_rate": 0.00024527741881151803, "loss": 0.0179, "step": 7075 }, { "epoch": 1.44, "learning_rate": 0.0002452624454976985, "loss": 0.0168, "step": 7076 }, { "epoch": 1.44, "learning_rate": 0.0002452474705928163, "loss": 0.0125, "step": 7077 }, { "epoch": 1.44, "learning_rate": 0.0002452324940971216, "loss": 0.019, "step": 7078 }, { "epoch": 1.44, "learning_rate": 0.0002452175160108644, "loss": 0.0039, "step": 7079 }, { "epoch": 1.44, "learning_rate": 0.000245202536334295, "loss": 0.0073, "step": 7080 }, { "epoch": 1.44, "learning_rate": 0.00024518755506766355, "loss": 0.0116, "step": 7081 }, { "epoch": 1.44, "learning_rate": 0.00024517257221122024, "loss": 0.0257, "step": 7082 }, { "epoch": 1.44, "learning_rate": 0.00024515758776521527, "loss": 0.025, "step": 7083 }, { "epoch": 1.44, "learning_rate": 0.000245142601729899, "loss": 0.0197, "step": 7084 }, { "epoch": 1.44, "learning_rate": 0.0002451276141055217, "loss": 0.0216, "step": 7085 }, { "epoch": 1.44, "learning_rate": 0.0002451126248923337, "loss": 0.004, "step": 7086 }, { "epoch": 1.44, "learning_rate": 0.00024509763409058527, "loss": 0.0153, "step": 7087 }, { "epoch": 1.44, "learning_rate": 0.00024508264170052684, "loss": 0.0065, "step": 7088 }, { "epoch": 1.44, "learning_rate": 0.0002450676477224089, "loss": 0.0156, "step": 7089 }, { "epoch": 1.44, "learning_rate": 0.0002450526521564817, "loss": 0.0045, "step": 7090 }, { "epoch": 1.44, "learning_rate": 0.0002450376550029958, "loss": 0.0147, "step": 7091 }, { "epoch": 1.44, "learning_rate": 0.0002450226562622017, "loss": 0.0121, "step": 7092 }, { "epoch": 1.44, "learning_rate": 0.0002450076559343498, "loss": 0.0115, "step": 7093 }, { "epoch": 1.44, "learning_rate": 0.0002449926540196908, "loss": 0.0221, "step": 7094 }, { "epoch": 1.44, "learning_rate": 0.0002449776505184751, "loss": 0.0046, "step": 7095 }, { "epoch": 1.44, "learning_rate": 0.0002449626454309534, "loss": 0.007, "step": 7096 }, { "epoch": 1.45, "learning_rate": 0.00024494763875737623, "loss": 0.0199, "step": 7097 }, { "epoch": 1.45, "learning_rate": 0.00024493263049799426, "loss": 0.0006, "step": 7098 }, { "epoch": 1.45, "learning_rate": 0.0002449176206530582, "loss": 0.0174, "step": 7099 }, { "epoch": 1.45, "learning_rate": 0.0002449026092228187, "loss": 0.0272, "step": 7100 }, { "epoch": 1.45, "learning_rate": 0.00024488759620752644, "loss": 0.023, "step": 7101 }, { "epoch": 1.45, "learning_rate": 0.0002448725816074323, "loss": 0.0158, "step": 7102 }, { "epoch": 1.45, "learning_rate": 0.00024485756542278684, "loss": 0.0069, "step": 7103 }, { "epoch": 1.45, "learning_rate": 0.00024484254765384106, "loss": 0.021, "step": 7104 }, { "epoch": 1.45, "learning_rate": 0.0002448275283008457, "loss": 0.0099, "step": 7105 }, { "epoch": 1.45, "learning_rate": 0.0002448125073640516, "loss": 0.0088, "step": 7106 }, { "epoch": 1.45, "learning_rate": 0.0002447974848437097, "loss": 0.0082, "step": 7107 }, { "epoch": 1.45, "learning_rate": 0.0002447824607400708, "loss": 0.0089, "step": 7108 }, { "epoch": 1.45, "learning_rate": 0.0002447674350533859, "loss": 0.0164, "step": 7109 }, { "epoch": 1.45, "learning_rate": 0.00024475240778390597, "loss": 0.0089, "step": 7110 }, { "epoch": 1.45, "learning_rate": 0.000244737378931882, "loss": 0.0054, "step": 7111 }, { "epoch": 1.45, "learning_rate": 0.0002447223484975649, "loss": 0.0289, "step": 7112 }, { "epoch": 1.45, "learning_rate": 0.0002447073164812058, "loss": 0.0057, "step": 7113 }, { "epoch": 1.45, "learning_rate": 0.0002446922828830558, "loss": 0.0049, "step": 7114 }, { "epoch": 1.45, "learning_rate": 0.00024467724770336585, "loss": 0.0078, "step": 7115 }, { "epoch": 1.45, "learning_rate": 0.00024466221094238724, "loss": 0.0459, "step": 7116 }, { "epoch": 1.45, "learning_rate": 0.00024464717260037097, "loss": 0.0119, "step": 7117 }, { "epoch": 1.45, "learning_rate": 0.00024463213267756826, "loss": 0.0121, "step": 7118 }, { "epoch": 1.45, "learning_rate": 0.0002446170911742303, "loss": 0.0144, "step": 7119 }, { "epoch": 1.45, "learning_rate": 0.00024460204809060833, "loss": 0.0089, "step": 7120 }, { "epoch": 1.45, "learning_rate": 0.00024458700342695354, "loss": 0.0051, "step": 7121 }, { "epoch": 1.45, "learning_rate": 0.00024457195718351725, "loss": 0.0137, "step": 7122 }, { "epoch": 1.45, "learning_rate": 0.00024455690936055083, "loss": 0.0155, "step": 7123 }, { "epoch": 1.45, "learning_rate": 0.00024454185995830544, "loss": 0.0124, "step": 7124 }, { "epoch": 1.45, "learning_rate": 0.0002445268089770326, "loss": 0.0148, "step": 7125 }, { "epoch": 1.45, "learning_rate": 0.0002445117564169836, "loss": 0.0063, "step": 7126 }, { "epoch": 1.45, "learning_rate": 0.0002444967022784099, "loss": 0.0251, "step": 7127 }, { "epoch": 1.45, "learning_rate": 0.0002444816465615628, "loss": 0.0058, "step": 7128 }, { "epoch": 1.45, "learning_rate": 0.00024446658926669397, "loss": 0.0079, "step": 7129 }, { "epoch": 1.45, "learning_rate": 0.0002444515303940547, "loss": 0.0163, "step": 7130 }, { "epoch": 1.45, "learning_rate": 0.0002444364699438966, "loss": 0.025, "step": 7131 }, { "epoch": 1.45, "learning_rate": 0.0002444214079164712, "loss": 0.037, "step": 7132 }, { "epoch": 1.45, "learning_rate": 0.00024440634431203, "loss": 0.0094, "step": 7133 }, { "epoch": 1.45, "learning_rate": 0.00024439127913082474, "loss": 0.0113, "step": 7134 }, { "epoch": 1.45, "learning_rate": 0.0002443762123731069, "loss": 0.0299, "step": 7135 }, { "epoch": 1.45, "learning_rate": 0.00024436114403912813, "loss": 0.0133, "step": 7136 }, { "epoch": 1.45, "learning_rate": 0.0002443460741291402, "loss": 0.0274, "step": 7137 }, { "epoch": 1.45, "learning_rate": 0.0002443310026433947, "loss": 0.0109, "step": 7138 }, { "epoch": 1.45, "learning_rate": 0.0002443159295821434, "loss": 0.0389, "step": 7139 }, { "epoch": 1.45, "learning_rate": 0.0002443008549456381, "loss": 0.013, "step": 7140 }, { "epoch": 1.45, "learning_rate": 0.0002442857787341304, "loss": 0.0306, "step": 7141 }, { "epoch": 1.45, "learning_rate": 0.0002442707009478723, "loss": 0.0165, "step": 7142 }, { "epoch": 1.45, "learning_rate": 0.0002442556215871155, "loss": 0.028, "step": 7143 }, { "epoch": 1.45, "learning_rate": 0.00024424054065211195, "loss": 0.0197, "step": 7144 }, { "epoch": 1.45, "learning_rate": 0.0002442254581431135, "loss": 0.0195, "step": 7145 }, { "epoch": 1.46, "learning_rate": 0.00024421037406037195, "loss": 0.0469, "step": 7146 }, { "epoch": 1.46, "learning_rate": 0.0002441952884041394, "loss": 0.0154, "step": 7147 }, { "epoch": 1.46, "learning_rate": 0.0002441802011746677, "loss": 0.0187, "step": 7148 }, { "epoch": 1.46, "learning_rate": 0.0002441651123722088, "loss": 0.0394, "step": 7149 }, { "epoch": 1.46, "learning_rate": 0.00024415002199701483, "loss": 0.0132, "step": 7150 }, { "epoch": 1.46, "learning_rate": 0.00024413493004933777, "loss": 0.0114, "step": 7151 }, { "epoch": 1.46, "learning_rate": 0.00024411983652942965, "loss": 0.0158, "step": 7152 }, { "epoch": 1.46, "learning_rate": 0.00024410474143754266, "loss": 0.0306, "step": 7153 }, { "epoch": 1.46, "learning_rate": 0.0002440896447739288, "loss": 0.0081, "step": 7154 }, { "epoch": 1.46, "learning_rate": 0.00024407454653884028, "loss": 0.009, "step": 7155 }, { "epoch": 1.46, "learning_rate": 0.00024405944673252928, "loss": 0.0096, "step": 7156 }, { "epoch": 1.46, "learning_rate": 0.00024404434535524796, "loss": 0.0096, "step": 7157 }, { "epoch": 1.46, "learning_rate": 0.00024402924240724856, "loss": 0.0126, "step": 7158 }, { "epoch": 1.46, "learning_rate": 0.00024401413788878326, "loss": 0.0456, "step": 7159 }, { "epoch": 1.46, "learning_rate": 0.00024399903180010444, "loss": 0.0179, "step": 7160 }, { "epoch": 1.46, "learning_rate": 0.00024398392414146436, "loss": 0.0278, "step": 7161 }, { "epoch": 1.46, "learning_rate": 0.00024396881491311532, "loss": 0.0265, "step": 7162 }, { "epoch": 1.46, "learning_rate": 0.0002439537041153097, "loss": 0.0111, "step": 7163 }, { "epoch": 1.46, "learning_rate": 0.00024393859174829985, "loss": 0.0062, "step": 7164 }, { "epoch": 1.46, "learning_rate": 0.00024392347781233825, "loss": 0.0125, "step": 7165 }, { "epoch": 1.46, "learning_rate": 0.0002439083623076772, "loss": 0.0137, "step": 7166 }, { "epoch": 1.46, "learning_rate": 0.0002438932452345693, "loss": 0.0319, "step": 7167 }, { "epoch": 1.46, "learning_rate": 0.00024387812659326695, "loss": 0.0055, "step": 7168 }, { "epoch": 1.46, "learning_rate": 0.00024386300638402268, "loss": 0.0145, "step": 7169 }, { "epoch": 1.46, "learning_rate": 0.00024384788460708902, "loss": 0.0145, "step": 7170 }, { "epoch": 1.46, "learning_rate": 0.00024383276126271856, "loss": 0.0191, "step": 7171 }, { "epoch": 1.46, "learning_rate": 0.0002438176363511638, "loss": 0.0162, "step": 7172 }, { "epoch": 1.46, "learning_rate": 0.00024380250987267747, "loss": 0.0017, "step": 7173 }, { "epoch": 1.46, "learning_rate": 0.00024378738182751216, "loss": 0.0058, "step": 7174 }, { "epoch": 1.46, "learning_rate": 0.00024377225221592055, "loss": 0.0173, "step": 7175 }, { "epoch": 1.46, "learning_rate": 0.0002437571210381553, "loss": 0.0233, "step": 7176 }, { "epoch": 1.46, "learning_rate": 0.0002437419882944691, "loss": 0.0167, "step": 7177 }, { "epoch": 1.46, "learning_rate": 0.00024372685398511485, "loss": 0.0101, "step": 7178 }, { "epoch": 1.46, "learning_rate": 0.00024371171811034514, "loss": 0.0152, "step": 7179 }, { "epoch": 1.46, "learning_rate": 0.00024369658067041285, "loss": 0.0136, "step": 7180 }, { "epoch": 1.46, "learning_rate": 0.00024368144166557083, "loss": 0.0226, "step": 7181 }, { "epoch": 1.46, "learning_rate": 0.00024366630109607187, "loss": 0.0233, "step": 7182 }, { "epoch": 1.46, "learning_rate": 0.0002436511589621689, "loss": 0.0297, "step": 7183 }, { "epoch": 1.46, "learning_rate": 0.00024363601526411477, "loss": 0.0346, "step": 7184 }, { "epoch": 1.46, "learning_rate": 0.00024362087000216244, "loss": 0.0044, "step": 7185 }, { "epoch": 1.46, "learning_rate": 0.00024360572317656487, "loss": 0.0255, "step": 7186 }, { "epoch": 1.46, "learning_rate": 0.000243590574787575, "loss": 0.0229, "step": 7187 }, { "epoch": 1.46, "learning_rate": 0.00024357542483544593, "loss": 0.0067, "step": 7188 }, { "epoch": 1.46, "learning_rate": 0.00024356027332043056, "loss": 0.0365, "step": 7189 }, { "epoch": 1.46, "learning_rate": 0.00024354512024278203, "loss": 0.0083, "step": 7190 }, { "epoch": 1.46, "learning_rate": 0.00024352996560275344, "loss": 0.0189, "step": 7191 }, { "epoch": 1.46, "learning_rate": 0.00024351480940059788, "loss": 0.0191, "step": 7192 }, { "epoch": 1.46, "learning_rate": 0.00024349965163656843, "loss": 0.0109, "step": 7193 }, { "epoch": 1.46, "learning_rate": 0.00024348449231091838, "loss": 0.0346, "step": 7194 }, { "epoch": 1.47, "learning_rate": 0.00024346933142390078, "loss": 0.0198, "step": 7195 }, { "epoch": 1.47, "learning_rate": 0.00024345416897576894, "loss": 0.0057, "step": 7196 }, { "epoch": 1.47, "learning_rate": 0.00024343900496677607, "loss": 0.0058, "step": 7197 }, { "epoch": 1.47, "learning_rate": 0.00024342383939717543, "loss": 0.0047, "step": 7198 }, { "epoch": 1.47, "learning_rate": 0.00024340867226722032, "loss": 0.0093, "step": 7199 }, { "epoch": 1.47, "learning_rate": 0.00024339350357716408, "loss": 0.0073, "step": 7200 }, { "epoch": 1.47, "learning_rate": 0.00024337833332726, "loss": 0.005, "step": 7201 }, { "epoch": 1.47, "learning_rate": 0.00024336316151776153, "loss": 0.0092, "step": 7202 }, { "epoch": 1.47, "learning_rate": 0.00024334798814892202, "loss": 0.0129, "step": 7203 }, { "epoch": 1.47, "learning_rate": 0.00024333281322099488, "loss": 0.0195, "step": 7204 }, { "epoch": 1.47, "learning_rate": 0.00024331763673423362, "loss": 0.0133, "step": 7205 }, { "epoch": 1.47, "learning_rate": 0.00024330245868889165, "loss": 0.0158, "step": 7206 }, { "epoch": 1.47, "learning_rate": 0.00024328727908522248, "loss": 0.0143, "step": 7207 }, { "epoch": 1.47, "learning_rate": 0.00024327209792347968, "loss": 0.012, "step": 7208 }, { "epoch": 1.47, "learning_rate": 0.00024325691520391676, "loss": 0.0249, "step": 7209 }, { "epoch": 1.47, "learning_rate": 0.00024324173092678733, "loss": 0.0111, "step": 7210 }, { "epoch": 1.47, "learning_rate": 0.000243226545092345, "loss": 0.0195, "step": 7211 }, { "epoch": 1.47, "learning_rate": 0.00024321135770084338, "loss": 0.0113, "step": 7212 }, { "epoch": 1.47, "learning_rate": 0.00024319616875253616, "loss": 0.015, "step": 7213 }, { "epoch": 1.47, "learning_rate": 0.00024318097824767697, "loss": 0.0089, "step": 7214 }, { "epoch": 1.47, "learning_rate": 0.0002431657861865196, "loss": 0.0202, "step": 7215 }, { "epoch": 1.47, "learning_rate": 0.0002431505925693177, "loss": 0.0084, "step": 7216 }, { "epoch": 1.47, "learning_rate": 0.00024313539739632506, "loss": 0.0113, "step": 7217 }, { "epoch": 1.47, "learning_rate": 0.0002431202006677955, "loss": 0.0277, "step": 7218 }, { "epoch": 1.47, "learning_rate": 0.00024310500238398277, "loss": 0.0112, "step": 7219 }, { "epoch": 1.47, "learning_rate": 0.00024308980254514082, "loss": 0.005, "step": 7220 }, { "epoch": 1.47, "learning_rate": 0.00024307460115152341, "loss": 0.0155, "step": 7221 }, { "epoch": 1.47, "learning_rate": 0.00024305939820338444, "loss": 0.0078, "step": 7222 }, { "epoch": 1.47, "learning_rate": 0.0002430441937009779, "loss": 0.0211, "step": 7223 }, { "epoch": 1.47, "learning_rate": 0.00024302898764455772, "loss": 0.0067, "step": 7224 }, { "epoch": 1.47, "learning_rate": 0.00024301378003437776, "loss": 0.0069, "step": 7225 }, { "epoch": 1.47, "learning_rate": 0.00024299857087069216, "loss": 0.0078, "step": 7226 }, { "epoch": 1.47, "learning_rate": 0.00024298336015375486, "loss": 0.0113, "step": 7227 }, { "epoch": 1.47, "learning_rate": 0.00024296814788381992, "loss": 0.0088, "step": 7228 }, { "epoch": 1.47, "learning_rate": 0.00024295293406114145, "loss": 0.0363, "step": 7229 }, { "epoch": 1.47, "learning_rate": 0.0002429377186859735, "loss": 0.0044, "step": 7230 }, { "epoch": 1.47, "learning_rate": 0.0002429225017585702, "loss": 0.0058, "step": 7231 }, { "epoch": 1.47, "learning_rate": 0.00024290728327918575, "loss": 0.02, "step": 7232 }, { "epoch": 1.47, "learning_rate": 0.00024289206324807426, "loss": 0.0056, "step": 7233 }, { "epoch": 1.47, "learning_rate": 0.00024287684166548999, "loss": 0.0083, "step": 7234 }, { "epoch": 1.47, "learning_rate": 0.00024286161853168716, "loss": 0.0077, "step": 7235 }, { "epoch": 1.47, "learning_rate": 0.00024284639384691996, "loss": 0.0089, "step": 7236 }, { "epoch": 1.47, "learning_rate": 0.00024283116761144276, "loss": 0.0306, "step": 7237 }, { "epoch": 1.47, "learning_rate": 0.0002428159398255098, "loss": 0.0101, "step": 7238 }, { "epoch": 1.47, "learning_rate": 0.0002428007104893755, "loss": 0.0139, "step": 7239 }, { "epoch": 1.47, "learning_rate": 0.00024278547960329412, "loss": 0.0066, "step": 7240 }, { "epoch": 1.47, "learning_rate": 0.00024277024716752007, "loss": 0.0074, "step": 7241 }, { "epoch": 1.47, "learning_rate": 0.00024275501318230783, "loss": 0.0153, "step": 7242 }, { "epoch": 1.47, "learning_rate": 0.00024273977764791176, "loss": 0.0178, "step": 7243 }, { "epoch": 1.48, "learning_rate": 0.00024272454056458635, "loss": 0.0123, "step": 7244 }, { "epoch": 1.48, "learning_rate": 0.00024270930193258603, "loss": 0.0115, "step": 7245 }, { "epoch": 1.48, "learning_rate": 0.00024269406175216542, "loss": 0.015, "step": 7246 }, { "epoch": 1.48, "learning_rate": 0.00024267882002357898, "loss": 0.0156, "step": 7247 }, { "epoch": 1.48, "learning_rate": 0.00024266357674708136, "loss": 0.0211, "step": 7248 }, { "epoch": 1.48, "learning_rate": 0.00024264833192292704, "loss": 0.0033, "step": 7249 }, { "epoch": 1.48, "learning_rate": 0.00024263308555137064, "loss": 0.0056, "step": 7250 }, { "epoch": 1.48, "learning_rate": 0.0002426178376326669, "loss": 0.0092, "step": 7251 }, { "epoch": 1.48, "learning_rate": 0.0002426025881670705, "loss": 0.0052, "step": 7252 }, { "epoch": 1.48, "learning_rate": 0.00024258733715483603, "loss": 0.0088, "step": 7253 }, { "epoch": 1.48, "learning_rate": 0.00024257208459621828, "loss": 0.0224, "step": 7254 }, { "epoch": 1.48, "learning_rate": 0.00024255683049147195, "loss": 0.0147, "step": 7255 }, { "epoch": 1.48, "learning_rate": 0.00024254157484085185, "loss": 0.0186, "step": 7256 }, { "epoch": 1.48, "learning_rate": 0.00024252631764461278, "loss": 0.0283, "step": 7257 }, { "epoch": 1.48, "learning_rate": 0.0002425110589030095, "loss": 0.0078, "step": 7258 }, { "epoch": 1.48, "learning_rate": 0.00024249579861629691, "loss": 0.0058, "step": 7259 }, { "epoch": 1.48, "learning_rate": 0.00024248053678472992, "loss": 0.0099, "step": 7260 }, { "epoch": 1.48, "learning_rate": 0.0002424652734085634, "loss": 0.0231, "step": 7261 }, { "epoch": 1.48, "learning_rate": 0.00024245000848805226, "loss": 0.0027, "step": 7262 }, { "epoch": 1.48, "learning_rate": 0.0002424347420234515, "loss": 0.0142, "step": 7263 }, { "epoch": 1.48, "learning_rate": 0.00024241947401501602, "loss": 0.0301, "step": 7264 }, { "epoch": 1.48, "learning_rate": 0.00024240420446300088, "loss": 0.0042, "step": 7265 }, { "epoch": 1.48, "learning_rate": 0.0002423889333676611, "loss": 0.0111, "step": 7266 }, { "epoch": 1.48, "learning_rate": 0.00024237366072925174, "loss": 0.007, "step": 7267 }, { "epoch": 1.48, "learning_rate": 0.0002423583865480279, "loss": 0.0047, "step": 7268 }, { "epoch": 1.48, "learning_rate": 0.0002423431108242446, "loss": 0.0028, "step": 7269 }, { "epoch": 1.48, "learning_rate": 0.00024232783355815707, "loss": 0.0155, "step": 7270 }, { "epoch": 1.48, "learning_rate": 0.0002423125547500205, "loss": 0.0125, "step": 7271 }, { "epoch": 1.48, "learning_rate": 0.00024229727440008996, "loss": 0.0208, "step": 7272 }, { "epoch": 1.48, "learning_rate": 0.0002422819925086207, "loss": 0.0043, "step": 7273 }, { "epoch": 1.48, "learning_rate": 0.000242266709075868, "loss": 0.0086, "step": 7274 }, { "epoch": 1.48, "learning_rate": 0.00024225142410208708, "loss": 0.0192, "step": 7275 }, { "epoch": 1.48, "learning_rate": 0.00024223613758753325, "loss": 0.0475, "step": 7276 }, { "epoch": 1.48, "learning_rate": 0.0002422208495324618, "loss": 0.014, "step": 7277 }, { "epoch": 1.48, "learning_rate": 0.0002422055599371281, "loss": 0.0067, "step": 7278 }, { "epoch": 1.48, "learning_rate": 0.0002421902688017875, "loss": 0.0134, "step": 7279 }, { "epoch": 1.48, "learning_rate": 0.0002421749761266954, "loss": 0.0208, "step": 7280 }, { "epoch": 1.48, "learning_rate": 0.00024215968191210717, "loss": 0.0117, "step": 7281 }, { "epoch": 1.48, "learning_rate": 0.00024214438615827828, "loss": 0.0081, "step": 7282 }, { "epoch": 1.48, "learning_rate": 0.00024212908886546425, "loss": 0.0183, "step": 7283 }, { "epoch": 1.48, "learning_rate": 0.0002421137900339205, "loss": 0.005, "step": 7284 }, { "epoch": 1.48, "learning_rate": 0.0002420984896639026, "loss": 0.0225, "step": 7285 }, { "epoch": 1.48, "learning_rate": 0.00024208318775566606, "loss": 0.0066, "step": 7286 }, { "epoch": 1.48, "learning_rate": 0.00024206788430946647, "loss": 0.008, "step": 7287 }, { "epoch": 1.48, "learning_rate": 0.00024205257932555943, "loss": 0.014, "step": 7288 }, { "epoch": 1.48, "learning_rate": 0.00024203727280420058, "loss": 0.0087, "step": 7289 }, { "epoch": 1.48, "learning_rate": 0.0002420219647456455, "loss": 0.0073, "step": 7290 }, { "epoch": 1.48, "learning_rate": 0.00024200665515014988, "loss": 0.0053, "step": 7291 }, { "epoch": 1.48, "learning_rate": 0.00024199134401796946, "loss": 0.0086, "step": 7292 }, { "epoch": 1.48, "learning_rate": 0.00024197603134935999, "loss": 0.0077, "step": 7293 }, { "epoch": 1.49, "learning_rate": 0.00024196071714457717, "loss": 0.0116, "step": 7294 }, { "epoch": 1.49, "learning_rate": 0.00024194540140387675, "loss": 0.0312, "step": 7295 }, { "epoch": 1.49, "learning_rate": 0.00024193008412751456, "loss": 0.0059, "step": 7296 }, { "epoch": 1.49, "learning_rate": 0.00024191476531574646, "loss": 0.0186, "step": 7297 }, { "epoch": 1.49, "learning_rate": 0.00024189944496882829, "loss": 0.0109, "step": 7298 }, { "epoch": 1.49, "learning_rate": 0.0002418841230870159, "loss": 0.0303, "step": 7299 }, { "epoch": 1.49, "learning_rate": 0.00024186879967056524, "loss": 0.006, "step": 7300 }, { "epoch": 1.49, "learning_rate": 0.0002418534747197322, "loss": 0.0079, "step": 7301 }, { "epoch": 1.49, "learning_rate": 0.0002418381482347727, "loss": 0.0085, "step": 7302 }, { "epoch": 1.49, "learning_rate": 0.00024182282021594284, "loss": 0.0018, "step": 7303 }, { "epoch": 1.49, "learning_rate": 0.00024180749066349852, "loss": 0.0208, "step": 7304 }, { "epoch": 1.49, "learning_rate": 0.0002417921595776958, "loss": 0.0116, "step": 7305 }, { "epoch": 1.49, "learning_rate": 0.00024177682695879075, "loss": 0.0054, "step": 7306 }, { "epoch": 1.49, "learning_rate": 0.0002417614928070394, "loss": 0.0116, "step": 7307 }, { "epoch": 1.49, "learning_rate": 0.00024174615712269795, "loss": 0.0127, "step": 7308 }, { "epoch": 1.49, "learning_rate": 0.00024173081990602256, "loss": 0.0106, "step": 7309 }, { "epoch": 1.49, "learning_rate": 0.00024171548115726923, "loss": 0.0227, "step": 7310 }, { "epoch": 1.49, "learning_rate": 0.00024170014087669426, "loss": 0.0505, "step": 7311 }, { "epoch": 1.49, "learning_rate": 0.00024168479906455385, "loss": 0.0163, "step": 7312 }, { "epoch": 1.49, "learning_rate": 0.00024166945572110427, "loss": 0.0064, "step": 7313 }, { "epoch": 1.49, "learning_rate": 0.00024165411084660167, "loss": 0.0121, "step": 7314 }, { "epoch": 1.49, "learning_rate": 0.00024163876444130246, "loss": 0.0981, "step": 7315 }, { "epoch": 1.49, "learning_rate": 0.00024162341650546285, "loss": 0.0258, "step": 7316 }, { "epoch": 1.49, "learning_rate": 0.00024160806703933928, "loss": 0.0061, "step": 7317 }, { "epoch": 1.49, "learning_rate": 0.00024159271604318804, "loss": 0.0093, "step": 7318 }, { "epoch": 1.49, "learning_rate": 0.00024157736351726556, "loss": 0.0118, "step": 7319 }, { "epoch": 1.49, "learning_rate": 0.00024156200946182828, "loss": 0.02, "step": 7320 }, { "epoch": 1.49, "learning_rate": 0.00024154665387713257, "loss": 0.011, "step": 7321 }, { "epoch": 1.49, "learning_rate": 0.00024153129676343491, "loss": 0.0197, "step": 7322 }, { "epoch": 1.49, "learning_rate": 0.0002415159381209919, "loss": 0.0213, "step": 7323 }, { "epoch": 1.49, "learning_rate": 0.0002415005779500599, "loss": 0.0135, "step": 7324 }, { "epoch": 1.49, "learning_rate": 0.00024148521625089552, "loss": 0.0279, "step": 7325 }, { "epoch": 1.49, "learning_rate": 0.00024146985302375538, "loss": 0.0097, "step": 7326 }, { "epoch": 1.49, "learning_rate": 0.00024145448826889604, "loss": 0.005, "step": 7327 }, { "epoch": 1.49, "learning_rate": 0.00024143912198657406, "loss": 0.0014, "step": 7328 }, { "epoch": 1.49, "learning_rate": 0.0002414237541770462, "loss": 0.0094, "step": 7329 }, { "epoch": 1.49, "learning_rate": 0.00024140838484056903, "loss": 0.0048, "step": 7330 }, { "epoch": 1.49, "learning_rate": 0.0002413930139773993, "loss": 0.0073, "step": 7331 }, { "epoch": 1.49, "learning_rate": 0.00024137764158779372, "loss": 0.0146, "step": 7332 }, { "epoch": 1.49, "learning_rate": 0.00024136226767200903, "loss": 0.0205, "step": 7333 }, { "epoch": 1.49, "learning_rate": 0.00024134689223030201, "loss": 0.0033, "step": 7334 }, { "epoch": 1.49, "learning_rate": 0.00024133151526292948, "loss": 0.0279, "step": 7335 }, { "epoch": 1.49, "learning_rate": 0.00024131613677014826, "loss": 0.0219, "step": 7336 }, { "epoch": 1.49, "learning_rate": 0.00024130075675221513, "loss": 0.0121, "step": 7337 }, { "epoch": 1.49, "learning_rate": 0.00024128537520938704, "loss": 0.0499, "step": 7338 }, { "epoch": 1.49, "learning_rate": 0.00024126999214192088, "loss": 0.0107, "step": 7339 }, { "epoch": 1.49, "learning_rate": 0.0002412546075500736, "loss": 0.0084, "step": 7340 }, { "epoch": 1.49, "learning_rate": 0.0002412392214341021, "loss": 0.0036, "step": 7341 }, { "epoch": 1.49, "learning_rate": 0.00024122383379426333, "loss": 0.0282, "step": 7342 }, { "epoch": 1.5, "learning_rate": 0.00024120844463081437, "loss": 0.0145, "step": 7343 }, { "epoch": 1.5, "learning_rate": 0.00024119305394401221, "loss": 0.0337, "step": 7344 }, { "epoch": 1.5, "learning_rate": 0.00024117766173411395, "loss": 0.0083, "step": 7345 }, { "epoch": 1.5, "learning_rate": 0.00024116226800137658, "loss": 0.031, "step": 7346 }, { "epoch": 1.5, "learning_rate": 0.00024114687274605725, "loss": 0.0125, "step": 7347 }, { "epoch": 1.5, "learning_rate": 0.00024113147596841313, "loss": 0.0154, "step": 7348 }, { "epoch": 1.5, "learning_rate": 0.00024111607766870132, "loss": 0.0071, "step": 7349 }, { "epoch": 1.5, "learning_rate": 0.00024110067784717903, "loss": 0.0163, "step": 7350 }, { "epoch": 1.5, "learning_rate": 0.00024108527650410343, "loss": 0.0229, "step": 7351 }, { "epoch": 1.5, "learning_rate": 0.0002410698736397318, "loss": 0.0252, "step": 7352 }, { "epoch": 1.5, "learning_rate": 0.00024105446925432137, "loss": 0.0038, "step": 7353 }, { "epoch": 1.5, "learning_rate": 0.00024103906334812942, "loss": 0.0217, "step": 7354 }, { "epoch": 1.5, "learning_rate": 0.00024102365592141325, "loss": 0.0198, "step": 7355 }, { "epoch": 1.5, "learning_rate": 0.00024100824697443024, "loss": 0.0083, "step": 7356 }, { "epoch": 1.5, "learning_rate": 0.00024099283650743769, "loss": 0.0094, "step": 7357 }, { "epoch": 1.5, "learning_rate": 0.000240977424520693, "loss": 0.0116, "step": 7358 }, { "epoch": 1.5, "learning_rate": 0.00024096201101445362, "loss": 0.0127, "step": 7359 }, { "epoch": 1.5, "learning_rate": 0.00024094659598897694, "loss": 0.0155, "step": 7360 }, { "epoch": 1.5, "learning_rate": 0.00024093117944452041, "loss": 0.0078, "step": 7361 }, { "epoch": 1.5, "learning_rate": 0.00024091576138134157, "loss": 0.0167, "step": 7362 }, { "epoch": 1.5, "learning_rate": 0.0002409003417996979, "loss": 0.0313, "step": 7363 }, { "epoch": 1.5, "learning_rate": 0.0002408849206998469, "loss": 0.0487, "step": 7364 }, { "epoch": 1.5, "learning_rate": 0.0002408694980820462, "loss": 0.0089, "step": 7365 }, { "epoch": 1.5, "learning_rate": 0.00024085407394655334, "loss": 0.0116, "step": 7366 }, { "epoch": 1.5, "learning_rate": 0.00024083864829362592, "loss": 0.0056, "step": 7367 }, { "epoch": 1.5, "learning_rate": 0.00024082322112352168, "loss": 0.0075, "step": 7368 }, { "epoch": 1.5, "learning_rate": 0.00024080779243649815, "loss": 0.0055, "step": 7369 }, { "epoch": 1.5, "learning_rate": 0.00024079236223281306, "loss": 0.0176, "step": 7370 }, { "epoch": 1.5, "learning_rate": 0.00024077693051272416, "loss": 0.007, "step": 7371 }, { "epoch": 1.5, "learning_rate": 0.00024076149727648917, "loss": 0.0273, "step": 7372 }, { "epoch": 1.5, "learning_rate": 0.0002407460625243659, "loss": 0.0226, "step": 7373 }, { "epoch": 1.5, "learning_rate": 0.000240730626256612, "loss": 0.0042, "step": 7374 }, { "epoch": 1.5, "learning_rate": 0.00024071518847348542, "loss": 0.0126, "step": 7375 }, { "epoch": 1.5, "learning_rate": 0.00024069974917524396, "loss": 0.0086, "step": 7376 }, { "epoch": 1.5, "learning_rate": 0.00024068430836214548, "loss": 0.0074, "step": 7377 }, { "epoch": 1.5, "learning_rate": 0.00024066886603444786, "loss": 0.0062, "step": 7378 }, { "epoch": 1.5, "learning_rate": 0.00024065342219240903, "loss": 0.0052, "step": 7379 }, { "epoch": 1.5, "learning_rate": 0.0002406379768362869, "loss": 0.0106, "step": 7380 }, { "epoch": 1.5, "learning_rate": 0.0002406225299663395, "loss": 0.008, "step": 7381 }, { "epoch": 1.5, "learning_rate": 0.0002406070815828248, "loss": 0.0172, "step": 7382 }, { "epoch": 1.5, "learning_rate": 0.00024059163168600078, "loss": 0.0098, "step": 7383 }, { "epoch": 1.5, "learning_rate": 0.00024057618027612554, "loss": 0.0371, "step": 7384 }, { "epoch": 1.5, "learning_rate": 0.00024056072735345707, "loss": 0.0251, "step": 7385 }, { "epoch": 1.5, "learning_rate": 0.0002405452729182535, "loss": 0.0086, "step": 7386 }, { "epoch": 1.5, "learning_rate": 0.00024052981697077303, "loss": 0.0189, "step": 7387 }, { "epoch": 1.5, "learning_rate": 0.0002405143595112737, "loss": 0.0328, "step": 7388 }, { "epoch": 1.5, "learning_rate": 0.0002404989005400137, "loss": 0.0029, "step": 7389 }, { "epoch": 1.5, "learning_rate": 0.00024048344005725119, "loss": 0.013, "step": 7390 }, { "epoch": 1.5, "learning_rate": 0.00024046797806324445, "loss": 0.0065, "step": 7391 }, { "epoch": 1.51, "learning_rate": 0.00024045251455825174, "loss": 0.0167, "step": 7392 }, { "epoch": 1.51, "learning_rate": 0.00024043704954253127, "loss": 0.0074, "step": 7393 }, { "epoch": 1.51, "learning_rate": 0.00024042158301634136, "loss": 0.0088, "step": 7394 }, { "epoch": 1.51, "learning_rate": 0.00024040611497994037, "loss": 0.0225, "step": 7395 }, { "epoch": 1.51, "learning_rate": 0.00024039064543358653, "loss": 0.0043, "step": 7396 }, { "epoch": 1.51, "learning_rate": 0.00024037517437753832, "loss": 0.0145, "step": 7397 }, { "epoch": 1.51, "learning_rate": 0.00024035970181205416, "loss": 0.0189, "step": 7398 }, { "epoch": 1.51, "learning_rate": 0.00024034422773739231, "loss": 0.0286, "step": 7399 }, { "epoch": 1.51, "learning_rate": 0.00024032875215381142, "loss": 0.0139, "step": 7400 }, { "epoch": 1.51, "learning_rate": 0.00024031327506156982, "loss": 0.0245, "step": 7401 }, { "epoch": 1.51, "learning_rate": 0.000240297796460926, "loss": 0.027, "step": 7402 }, { "epoch": 1.51, "learning_rate": 0.0002402823163521386, "loss": 0.0196, "step": 7403 }, { "epoch": 1.51, "learning_rate": 0.00024026683473546607, "loss": 0.0221, "step": 7404 }, { "epoch": 1.51, "learning_rate": 0.00024025135161116702, "loss": 0.0054, "step": 7405 }, { "epoch": 1.51, "learning_rate": 0.00024023586697950007, "loss": 0.0132, "step": 7406 }, { "epoch": 1.51, "learning_rate": 0.00024022038084072373, "loss": 0.0179, "step": 7407 }, { "epoch": 1.51, "learning_rate": 0.00024020489319509674, "loss": 0.0091, "step": 7408 }, { "epoch": 1.51, "learning_rate": 0.0002401894040428778, "loss": 0.0087, "step": 7409 }, { "epoch": 1.51, "learning_rate": 0.00024017391338432558, "loss": 0.0107, "step": 7410 }, { "epoch": 1.51, "learning_rate": 0.00024015842121969874, "loss": 0.0081, "step": 7411 }, { "epoch": 1.51, "learning_rate": 0.00024014292754925612, "loss": 0.0077, "step": 7412 }, { "epoch": 1.51, "learning_rate": 0.00024012743237325642, "loss": 0.0073, "step": 7413 }, { "epoch": 1.51, "learning_rate": 0.0002401119356919585, "loss": 0.029, "step": 7414 }, { "epoch": 1.51, "learning_rate": 0.00024009643750562114, "loss": 0.0035, "step": 7415 }, { "epoch": 1.51, "learning_rate": 0.00024008093781450324, "loss": 0.0228, "step": 7416 }, { "epoch": 1.51, "learning_rate": 0.0002400654366188636, "loss": 0.0115, "step": 7417 }, { "epoch": 1.51, "learning_rate": 0.00024004993391896115, "loss": 0.0198, "step": 7418 }, { "epoch": 1.51, "learning_rate": 0.00024003442971505485, "loss": 0.0266, "step": 7419 }, { "epoch": 1.51, "learning_rate": 0.0002400189240074036, "loss": 0.0123, "step": 7420 }, { "epoch": 1.51, "learning_rate": 0.0002400034167962664, "loss": 0.0183, "step": 7421 }, { "epoch": 1.51, "learning_rate": 0.00023998790808190225, "loss": 0.0184, "step": 7422 }, { "epoch": 1.51, "learning_rate": 0.00023997239786457017, "loss": 0.0045, "step": 7423 }, { "epoch": 1.51, "learning_rate": 0.00023995688614452922, "loss": 0.0139, "step": 7424 }, { "epoch": 1.51, "learning_rate": 0.00023994137292203846, "loss": 0.0252, "step": 7425 }, { "epoch": 1.51, "learning_rate": 0.000239925858197357, "loss": 0.024, "step": 7426 }, { "epoch": 1.51, "learning_rate": 0.00023991034197074393, "loss": 0.0239, "step": 7427 }, { "epoch": 1.51, "learning_rate": 0.00023989482424245848, "loss": 0.0221, "step": 7428 }, { "epoch": 1.51, "learning_rate": 0.00023987930501275978, "loss": 0.0208, "step": 7429 }, { "epoch": 1.51, "learning_rate": 0.000239863784281907, "loss": 0.0111, "step": 7430 }, { "epoch": 1.51, "learning_rate": 0.00023984826205015937, "loss": 0.0101, "step": 7431 }, { "epoch": 1.51, "learning_rate": 0.00023983273831777618, "loss": 0.0188, "step": 7432 }, { "epoch": 1.51, "learning_rate": 0.0002398172130850167, "loss": 0.0224, "step": 7433 }, { "epoch": 1.51, "learning_rate": 0.0002398016863521402, "loss": 0.0156, "step": 7434 }, { "epoch": 1.51, "learning_rate": 0.00023978615811940605, "loss": 0.0292, "step": 7435 }, { "epoch": 1.51, "learning_rate": 0.0002397706283870736, "loss": 0.027, "step": 7436 }, { "epoch": 1.51, "learning_rate": 0.00023975509715540216, "loss": 0.0102, "step": 7437 }, { "epoch": 1.51, "learning_rate": 0.00023973956442465116, "loss": 0.0087, "step": 7438 }, { "epoch": 1.51, "learning_rate": 0.00023972403019508008, "loss": 0.0229, "step": 7439 }, { "epoch": 1.51, "learning_rate": 0.00023970849446694825, "loss": 0.0059, "step": 7440 }, { "epoch": 1.52, "learning_rate": 0.00023969295724051532, "loss": 0.0166, "step": 7441 }, { "epoch": 1.52, "learning_rate": 0.00023967741851604066, "loss": 0.0052, "step": 7442 }, { "epoch": 1.52, "learning_rate": 0.00023966187829378385, "loss": 0.0497, "step": 7443 }, { "epoch": 1.52, "learning_rate": 0.00023964633657400441, "loss": 0.0232, "step": 7444 }, { "epoch": 1.52, "learning_rate": 0.0002396307933569619, "loss": 0.0197, "step": 7445 }, { "epoch": 1.52, "learning_rate": 0.00023961524864291598, "loss": 0.0121, "step": 7446 }, { "epoch": 1.52, "learning_rate": 0.00023959970243212625, "loss": 0.0053, "step": 7447 }, { "epoch": 1.52, "learning_rate": 0.00023958415472485236, "loss": 0.0054, "step": 7448 }, { "epoch": 1.52, "learning_rate": 0.00023956860552135396, "loss": 0.0052, "step": 7449 }, { "epoch": 1.52, "learning_rate": 0.00023955305482189083, "loss": 0.0015, "step": 7450 }, { "epoch": 1.52, "learning_rate": 0.0002395375026267226, "loss": 0.0214, "step": 7451 }, { "epoch": 1.52, "learning_rate": 0.00023952194893610905, "loss": 0.0325, "step": 7452 }, { "epoch": 1.52, "learning_rate": 0.00023950639375030998, "loss": 0.022, "step": 7453 }, { "epoch": 1.52, "learning_rate": 0.00023949083706958517, "loss": 0.0046, "step": 7454 }, { "epoch": 1.52, "learning_rate": 0.0002394752788941945, "loss": 0.0518, "step": 7455 }, { "epoch": 1.52, "learning_rate": 0.00023945971922439776, "loss": 0.0194, "step": 7456 }, { "epoch": 1.52, "learning_rate": 0.00023944415806045481, "loss": 0.0251, "step": 7457 }, { "epoch": 1.52, "learning_rate": 0.00023942859540262558, "loss": 0.0057, "step": 7458 }, { "epoch": 1.52, "learning_rate": 0.00023941303125117, "loss": 0.0273, "step": 7459 }, { "epoch": 1.52, "learning_rate": 0.00023939746560634804, "loss": 0.0209, "step": 7460 }, { "epoch": 1.52, "learning_rate": 0.00023938189846841966, "loss": 0.0198, "step": 7461 }, { "epoch": 1.52, "learning_rate": 0.00023936632983764485, "loss": 0.0194, "step": 7462 }, { "epoch": 1.52, "learning_rate": 0.0002393507597142836, "loss": 0.004, "step": 7463 }, { "epoch": 1.52, "learning_rate": 0.00023933518809859608, "loss": 0.0139, "step": 7464 }, { "epoch": 1.52, "learning_rate": 0.00023931961499084226, "loss": 0.0128, "step": 7465 }, { "epoch": 1.52, "learning_rate": 0.00023930404039128222, "loss": 0.0197, "step": 7466 }, { "epoch": 1.52, "learning_rate": 0.00023928846430017618, "loss": 0.0235, "step": 7467 }, { "epoch": 1.52, "learning_rate": 0.00023927288671778422, "loss": 0.0069, "step": 7468 }, { "epoch": 1.52, "learning_rate": 0.00023925730764436651, "loss": 0.0035, "step": 7469 }, { "epoch": 1.52, "learning_rate": 0.00023924172708018334, "loss": 0.014, "step": 7470 }, { "epoch": 1.52, "learning_rate": 0.00023922614502549486, "loss": 0.0149, "step": 7471 }, { "epoch": 1.52, "learning_rate": 0.0002392105614805613, "loss": 0.0136, "step": 7472 }, { "epoch": 1.52, "learning_rate": 0.00023919497644564298, "loss": 0.0201, "step": 7473 }, { "epoch": 1.52, "learning_rate": 0.0002391793899210002, "loss": 0.0122, "step": 7474 }, { "epoch": 1.52, "learning_rate": 0.00023916380190689327, "loss": 0.0118, "step": 7475 }, { "epoch": 1.52, "learning_rate": 0.0002391482124035825, "loss": 0.0246, "step": 7476 }, { "epoch": 1.52, "learning_rate": 0.00023913262141132832, "loss": 0.0095, "step": 7477 }, { "epoch": 1.52, "learning_rate": 0.00023911702893039113, "loss": 0.0163, "step": 7478 }, { "epoch": 1.52, "learning_rate": 0.00023910143496103136, "loss": 0.0175, "step": 7479 }, { "epoch": 1.52, "learning_rate": 0.00023908583950350937, "loss": 0.005, "step": 7480 }, { "epoch": 1.52, "learning_rate": 0.0002390702425580857, "loss": 0.0254, "step": 7481 }, { "epoch": 1.52, "learning_rate": 0.00023905464412502092, "loss": 0.023, "step": 7482 }, { "epoch": 1.52, "learning_rate": 0.00023903904420457544, "loss": 0.0058, "step": 7483 }, { "epoch": 1.52, "learning_rate": 0.00023902344279700985, "loss": 0.0477, "step": 7484 }, { "epoch": 1.52, "learning_rate": 0.0002390078399025847, "loss": 0.015, "step": 7485 }, { "epoch": 1.52, "learning_rate": 0.00023899223552156063, "loss": 0.0036, "step": 7486 }, { "epoch": 1.52, "learning_rate": 0.00023897662965419826, "loss": 0.0078, "step": 7487 }, { "epoch": 1.52, "learning_rate": 0.0002389610223007582, "loss": 0.018, "step": 7488 }, { "epoch": 1.52, "learning_rate": 0.00023894541346150116, "loss": 0.0398, "step": 7489 }, { "epoch": 1.53, "learning_rate": 0.0002389298031366878, "loss": 0.009, "step": 7490 }, { "epoch": 1.53, "learning_rate": 0.00023891419132657886, "loss": 0.007, "step": 7491 }, { "epoch": 1.53, "learning_rate": 0.00023889857803143508, "loss": 0.0052, "step": 7492 }, { "epoch": 1.53, "learning_rate": 0.00023888296325151728, "loss": 0.0183, "step": 7493 }, { "epoch": 1.53, "learning_rate": 0.00023886734698708617, "loss": 0.0036, "step": 7494 }, { "epoch": 1.53, "learning_rate": 0.0002388517292384026, "loss": 0.0061, "step": 7495 }, { "epoch": 1.53, "learning_rate": 0.00023883611000572748, "loss": 0.017, "step": 7496 }, { "epoch": 1.53, "learning_rate": 0.00023882048928932162, "loss": 0.0215, "step": 7497 }, { "epoch": 1.53, "learning_rate": 0.00023880486708944594, "loss": 0.0085, "step": 7498 }, { "epoch": 1.53, "learning_rate": 0.00023878924340636133, "loss": 0.0071, "step": 7499 }, { "epoch": 1.53, "learning_rate": 0.00023877361824032874, "loss": 0.0214, "step": 7500 }, { "epoch": 1.53, "learning_rate": 0.00023875799159160917, "loss": 0.0147, "step": 7501 }, { "epoch": 1.53, "learning_rate": 0.00023874236346046362, "loss": 0.0094, "step": 7502 }, { "epoch": 1.53, "learning_rate": 0.00023872673384715305, "loss": 0.0106, "step": 7503 }, { "epoch": 1.53, "learning_rate": 0.00023871110275193856, "loss": 0.0031, "step": 7504 }, { "epoch": 1.53, "learning_rate": 0.00023869547017508116, "loss": 0.0237, "step": 7505 }, { "epoch": 1.53, "learning_rate": 0.00023867983611684202, "loss": 0.0299, "step": 7506 }, { "epoch": 1.53, "learning_rate": 0.00023866420057748225, "loss": 0.0232, "step": 7507 }, { "epoch": 1.53, "learning_rate": 0.00023864856355726294, "loss": 0.0157, "step": 7508 }, { "epoch": 1.53, "learning_rate": 0.00023863292505644528, "loss": 0.0322, "step": 7509 }, { "epoch": 1.53, "learning_rate": 0.00023861728507529044, "loss": 0.0047, "step": 7510 }, { "epoch": 1.53, "learning_rate": 0.00023860164361405974, "loss": 0.0073, "step": 7511 }, { "epoch": 1.53, "learning_rate": 0.00023858600067301427, "loss": 0.0057, "step": 7512 }, { "epoch": 1.53, "learning_rate": 0.00023857035625241539, "loss": 0.0222, "step": 7513 }, { "epoch": 1.53, "learning_rate": 0.00023855471035252437, "loss": 0.0054, "step": 7514 }, { "epoch": 1.53, "learning_rate": 0.00023853906297360256, "loss": 0.0052, "step": 7515 }, { "epoch": 1.53, "learning_rate": 0.0002385234141159112, "loss": 0.0195, "step": 7516 }, { "epoch": 1.53, "learning_rate": 0.00023850776377971178, "loss": 0.0117, "step": 7517 }, { "epoch": 1.53, "learning_rate": 0.00023849211196526562, "loss": 0.0071, "step": 7518 }, { "epoch": 1.53, "learning_rate": 0.00023847645867283411, "loss": 0.0173, "step": 7519 }, { "epoch": 1.53, "learning_rate": 0.0002384608039026788, "loss": 0.0063, "step": 7520 }, { "epoch": 1.53, "learning_rate": 0.00023844514765506105, "loss": 0.0085, "step": 7521 }, { "epoch": 1.53, "learning_rate": 0.0002384294899302424, "loss": 0.0045, "step": 7522 }, { "epoch": 1.53, "learning_rate": 0.00023841383072848433, "loss": 0.0296, "step": 7523 }, { "epoch": 1.53, "learning_rate": 0.00023839817005004836, "loss": 0.0564, "step": 7524 }, { "epoch": 1.53, "learning_rate": 0.00023838250789519615, "loss": 0.0073, "step": 7525 }, { "epoch": 1.53, "learning_rate": 0.00023836684426418916, "loss": 0.0383, "step": 7526 }, { "epoch": 1.53, "learning_rate": 0.0002383511791572891, "loss": 0.0427, "step": 7527 }, { "epoch": 1.53, "learning_rate": 0.00023833551257475757, "loss": 0.017, "step": 7528 }, { "epoch": 1.53, "learning_rate": 0.00023831984451685626, "loss": 0.0088, "step": 7529 }, { "epoch": 1.53, "learning_rate": 0.00023830417498384683, "loss": 0.006, "step": 7530 }, { "epoch": 1.53, "learning_rate": 0.00023828850397599098, "loss": 0.0028, "step": 7531 }, { "epoch": 1.53, "learning_rate": 0.0002382728314935504, "loss": 0.0322, "step": 7532 }, { "epoch": 1.53, "learning_rate": 0.000238257157536787, "loss": 0.0119, "step": 7533 }, { "epoch": 1.53, "learning_rate": 0.00023824148210596242, "loss": 0.0084, "step": 7534 }, { "epoch": 1.53, "learning_rate": 0.00023822580520133852, "loss": 0.0036, "step": 7535 }, { "epoch": 1.53, "learning_rate": 0.00023821012682317716, "loss": 0.0135, "step": 7536 }, { "epoch": 1.53, "learning_rate": 0.00023819444697174014, "loss": 0.051, "step": 7537 }, { "epoch": 1.53, "learning_rate": 0.0002381787656472894, "loss": 0.0152, "step": 7538 }, { "epoch": 1.54, "learning_rate": 0.00023816308285008685, "loss": 0.014, "step": 7539 }, { "epoch": 1.54, "learning_rate": 0.00023814739858039432, "loss": 0.0175, "step": 7540 }, { "epoch": 1.54, "learning_rate": 0.00023813171283847392, "loss": 0.0204, "step": 7541 }, { "epoch": 1.54, "learning_rate": 0.0002381160256245875, "loss": 0.0167, "step": 7542 }, { "epoch": 1.54, "learning_rate": 0.00023810033693899717, "loss": 0.011, "step": 7543 }, { "epoch": 1.54, "learning_rate": 0.00023808464678196488, "loss": 0.0267, "step": 7544 }, { "epoch": 1.54, "learning_rate": 0.00023806895515375275, "loss": 0.0114, "step": 7545 }, { "epoch": 1.54, "learning_rate": 0.00023805326205462277, "loss": 0.0273, "step": 7546 }, { "epoch": 1.54, "learning_rate": 0.00023803756748483711, "loss": 0.0115, "step": 7547 }, { "epoch": 1.54, "learning_rate": 0.00023802187144465796, "loss": 0.0318, "step": 7548 }, { "epoch": 1.54, "learning_rate": 0.00023800617393434736, "loss": 0.0134, "step": 7549 }, { "epoch": 1.54, "learning_rate": 0.00023799047495416754, "loss": 0.0231, "step": 7550 }, { "epoch": 1.54, "learning_rate": 0.00023797477450438067, "loss": 0.0082, "step": 7551 }, { "epoch": 1.54, "learning_rate": 0.000237959072585249, "loss": 0.0149, "step": 7552 }, { "epoch": 1.54, "learning_rate": 0.00023794336919703482, "loss": 0.0143, "step": 7553 }, { "epoch": 1.54, "learning_rate": 0.00023792766434000036, "loss": 0.0073, "step": 7554 }, { "epoch": 1.54, "learning_rate": 0.0002379119580144079, "loss": 0.0155, "step": 7555 }, { "epoch": 1.54, "learning_rate": 0.00023789625022051984, "loss": 0.0038, "step": 7556 }, { "epoch": 1.54, "learning_rate": 0.0002378805409585984, "loss": 0.017, "step": 7557 }, { "epoch": 1.54, "learning_rate": 0.00023786483022890614, "loss": 0.0187, "step": 7558 }, { "epoch": 1.54, "learning_rate": 0.0002378491180317053, "loss": 0.0223, "step": 7559 }, { "epoch": 1.54, "learning_rate": 0.00023783340436725838, "loss": 0.0096, "step": 7560 }, { "epoch": 1.54, "learning_rate": 0.0002378176892358278, "loss": 0.0038, "step": 7561 }, { "epoch": 1.54, "learning_rate": 0.0002378019726376761, "loss": 0.0306, "step": 7562 }, { "epoch": 1.54, "learning_rate": 0.00023778625457306565, "loss": 0.0236, "step": 7563 }, { "epoch": 1.54, "learning_rate": 0.00023777053504225908, "loss": 0.0219, "step": 7564 }, { "epoch": 1.54, "learning_rate": 0.00023775481404551886, "loss": 0.0169, "step": 7565 }, { "epoch": 1.54, "learning_rate": 0.0002377390915831076, "loss": 0.0175, "step": 7566 }, { "epoch": 1.54, "learning_rate": 0.00023772336765528796, "loss": 0.0105, "step": 7567 }, { "epoch": 1.54, "learning_rate": 0.0002377076422623224, "loss": 0.0121, "step": 7568 }, { "epoch": 1.54, "learning_rate": 0.00023769191540447368, "loss": 0.0139, "step": 7569 }, { "epoch": 1.54, "learning_rate": 0.00023767618708200444, "loss": 0.0079, "step": 7570 }, { "epoch": 1.54, "learning_rate": 0.00023766045729517742, "loss": 0.0128, "step": 7571 }, { "epoch": 1.54, "learning_rate": 0.00023764472604425525, "loss": 0.0054, "step": 7572 }, { "epoch": 1.54, "learning_rate": 0.00023762899332950072, "loss": 0.012, "step": 7573 }, { "epoch": 1.54, "learning_rate": 0.00023761325915117658, "loss": 0.0109, "step": 7574 }, { "epoch": 1.54, "learning_rate": 0.00023759752350954565, "loss": 0.0192, "step": 7575 }, { "epoch": 1.54, "learning_rate": 0.00023758178640487075, "loss": 0.01, "step": 7576 }, { "epoch": 1.54, "learning_rate": 0.00023756604783741468, "loss": 0.0039, "step": 7577 }, { "epoch": 1.54, "learning_rate": 0.00023755030780744026, "loss": 0.0188, "step": 7578 }, { "epoch": 1.54, "learning_rate": 0.00023753456631521049, "loss": 0.0075, "step": 7579 }, { "epoch": 1.54, "learning_rate": 0.0002375188233609882, "loss": 0.0185, "step": 7580 }, { "epoch": 1.54, "learning_rate": 0.0002375030789450364, "loss": 0.0211, "step": 7581 }, { "epoch": 1.54, "learning_rate": 0.000237487333067618, "loss": 0.0174, "step": 7582 }, { "epoch": 1.54, "learning_rate": 0.00023747158572899596, "loss": 0.0111, "step": 7583 }, { "epoch": 1.54, "learning_rate": 0.00023745583692943333, "loss": 0.0268, "step": 7584 }, { "epoch": 1.54, "learning_rate": 0.00023744008666919317, "loss": 0.0202, "step": 7585 }, { "epoch": 1.54, "learning_rate": 0.00023742433494853846, "loss": 0.0198, "step": 7586 }, { "epoch": 1.54, "learning_rate": 0.0002374085817677324, "loss": 0.0118, "step": 7587 }, { "epoch": 1.55, "learning_rate": 0.00023739282712703796, "loss": 0.0041, "step": 7588 }, { "epoch": 1.55, "learning_rate": 0.00023737707102671838, "loss": 0.0251, "step": 7589 }, { "epoch": 1.55, "learning_rate": 0.00023736131346703679, "loss": 0.0051, "step": 7590 }, { "epoch": 1.55, "learning_rate": 0.00023734555444825632, "loss": 0.0183, "step": 7591 }, { "epoch": 1.55, "learning_rate": 0.00023732979397064026, "loss": 0.0189, "step": 7592 }, { "epoch": 1.55, "learning_rate": 0.00023731403203445175, "loss": 0.0102, "step": 7593 }, { "epoch": 1.55, "learning_rate": 0.0002372982686399541, "loss": 0.0054, "step": 7594 }, { "epoch": 1.55, "learning_rate": 0.00023728250378741056, "loss": 0.0045, "step": 7595 }, { "epoch": 1.55, "learning_rate": 0.00023726673747708447, "loss": 0.0196, "step": 7596 }, { "epoch": 1.55, "learning_rate": 0.00023725096970923914, "loss": 0.0049, "step": 7597 }, { "epoch": 1.55, "learning_rate": 0.0002372352004841379, "loss": 0.0667, "step": 7598 }, { "epoch": 1.55, "learning_rate": 0.00023721942980204418, "loss": 0.0034, "step": 7599 }, { "epoch": 1.55, "learning_rate": 0.00023720365766322134, "loss": 0.0274, "step": 7600 }, { "epoch": 1.55, "learning_rate": 0.00023718788406793274, "loss": 0.0335, "step": 7601 }, { "epoch": 1.55, "learning_rate": 0.000237172109016442, "loss": 0.0041, "step": 7602 }, { "epoch": 1.55, "learning_rate": 0.0002371563325090124, "loss": 0.0161, "step": 7603 }, { "epoch": 1.55, "learning_rate": 0.00023714055454590756, "loss": 0.0028, "step": 7604 }, { "epoch": 1.55, "learning_rate": 0.000237124775127391, "loss": 0.0083, "step": 7605 }, { "epoch": 1.55, "learning_rate": 0.00023710899425372618, "loss": 0.0127, "step": 7606 }, { "epoch": 1.55, "learning_rate": 0.00023709321192517678, "loss": 0.0188, "step": 7607 }, { "epoch": 1.55, "learning_rate": 0.0002370774281420063, "loss": 0.0092, "step": 7608 }, { "epoch": 1.55, "learning_rate": 0.00023706164290447843, "loss": 0.0075, "step": 7609 }, { "epoch": 1.55, "learning_rate": 0.00023704585621285676, "loss": 0.0185, "step": 7610 }, { "epoch": 1.55, "learning_rate": 0.000237030068067405, "loss": 0.0018, "step": 7611 }, { "epoch": 1.55, "learning_rate": 0.00023701427846838682, "loss": 0.0078, "step": 7612 }, { "epoch": 1.55, "learning_rate": 0.00023699848741606596, "loss": 0.0255, "step": 7613 }, { "epoch": 1.55, "learning_rate": 0.00023698269491070607, "loss": 0.0493, "step": 7614 }, { "epoch": 1.55, "learning_rate": 0.00023696690095257106, "loss": 0.0298, "step": 7615 }, { "epoch": 1.55, "learning_rate": 0.00023695110554192457, "loss": 0.0219, "step": 7616 }, { "epoch": 1.55, "learning_rate": 0.0002369353086790305, "loss": 0.0052, "step": 7617 }, { "epoch": 1.55, "learning_rate": 0.00023691951036415273, "loss": 0.0207, "step": 7618 }, { "epoch": 1.55, "learning_rate": 0.000236903710597555, "loss": 0.0061, "step": 7619 }, { "epoch": 1.55, "learning_rate": 0.0002368879093795013, "loss": 0.0085, "step": 7620 }, { "epoch": 1.55, "learning_rate": 0.00023687210671025552, "loss": 0.0069, "step": 7621 }, { "epoch": 1.55, "learning_rate": 0.00023685630259008157, "loss": 0.0179, "step": 7622 }, { "epoch": 1.55, "learning_rate": 0.00023684049701924338, "loss": 0.0039, "step": 7623 }, { "epoch": 1.55, "learning_rate": 0.00023682468999800498, "loss": 0.003, "step": 7624 }, { "epoch": 1.55, "learning_rate": 0.0002368088815266303, "loss": 0.0066, "step": 7625 }, { "epoch": 1.55, "learning_rate": 0.00023679307160538352, "loss": 0.0065, "step": 7626 }, { "epoch": 1.55, "learning_rate": 0.0002367772602345286, "loss": 0.0426, "step": 7627 }, { "epoch": 1.55, "learning_rate": 0.00023676144741432962, "loss": 0.0256, "step": 7628 }, { "epoch": 1.55, "learning_rate": 0.00023674563314505067, "loss": 0.0238, "step": 7629 }, { "epoch": 1.55, "learning_rate": 0.00023672981742695593, "loss": 0.0141, "step": 7630 }, { "epoch": 1.55, "learning_rate": 0.00023671400026030953, "loss": 0.024, "step": 7631 }, { "epoch": 1.55, "learning_rate": 0.0002366981816453756, "loss": 0.0275, "step": 7632 }, { "epoch": 1.55, "learning_rate": 0.00023668236158241843, "loss": 0.0078, "step": 7633 }, { "epoch": 1.55, "learning_rate": 0.0002366665400717022, "loss": 0.0094, "step": 7634 }, { "epoch": 1.55, "learning_rate": 0.00023665071711349113, "loss": 0.031, "step": 7635 }, { "epoch": 1.55, "learning_rate": 0.00023663489270804954, "loss": 0.038, "step": 7636 }, { "epoch": 1.56, "learning_rate": 0.0002366190668556417, "loss": 0.0086, "step": 7637 }, { "epoch": 1.56, "learning_rate": 0.0002366032395565319, "loss": 0.0085, "step": 7638 }, { "epoch": 1.56, "learning_rate": 0.00023658741081098459, "loss": 0.0291, "step": 7639 }, { "epoch": 1.56, "learning_rate": 0.00023657158061926397, "loss": 0.0271, "step": 7640 }, { "epoch": 1.56, "learning_rate": 0.00023655574898163466, "loss": 0.0126, "step": 7641 }, { "epoch": 1.56, "learning_rate": 0.0002365399158983609, "loss": 0.0167, "step": 7642 }, { "epoch": 1.56, "learning_rate": 0.00023652408136970717, "loss": 0.0371, "step": 7643 }, { "epoch": 1.56, "learning_rate": 0.000236508245395938, "loss": 0.0144, "step": 7644 }, { "epoch": 1.56, "learning_rate": 0.0002364924079773178, "loss": 0.0412, "step": 7645 }, { "epoch": 1.56, "learning_rate": 0.00023647656911411112, "loss": 0.0192, "step": 7646 }, { "epoch": 1.56, "learning_rate": 0.00023646072880658254, "loss": 0.0194, "step": 7647 }, { "epoch": 1.56, "learning_rate": 0.00023644488705499653, "loss": 0.0084, "step": 7648 }, { "epoch": 1.56, "learning_rate": 0.00023642904385961778, "loss": 0.0045, "step": 7649 }, { "epoch": 1.56, "learning_rate": 0.0002364131992207108, "loss": 0.0045, "step": 7650 }, { "epoch": 1.56, "learning_rate": 0.0002363973531385403, "loss": 0.0029, "step": 7651 }, { "epoch": 1.56, "learning_rate": 0.00023638150561337094, "loss": 0.0186, "step": 7652 }, { "epoch": 1.56, "learning_rate": 0.00023636565664546735, "loss": 0.0176, "step": 7653 }, { "epoch": 1.56, "learning_rate": 0.00023634980623509427, "loss": 0.0068, "step": 7654 }, { "epoch": 1.56, "learning_rate": 0.00023633395438251643, "loss": 0.027, "step": 7655 }, { "epoch": 1.56, "learning_rate": 0.00023631810108799863, "loss": 0.0077, "step": 7656 }, { "epoch": 1.56, "learning_rate": 0.00023630224635180557, "loss": 0.0089, "step": 7657 }, { "epoch": 1.56, "learning_rate": 0.00023628639017420205, "loss": 0.0194, "step": 7658 }, { "epoch": 1.56, "learning_rate": 0.000236270532555453, "loss": 0.0137, "step": 7659 }, { "epoch": 1.56, "learning_rate": 0.0002362546734958232, "loss": 0.0147, "step": 7660 }, { "epoch": 1.56, "learning_rate": 0.00023623881299557749, "loss": 0.0159, "step": 7661 }, { "epoch": 1.56, "learning_rate": 0.00023622295105498082, "loss": 0.0073, "step": 7662 }, { "epoch": 1.56, "learning_rate": 0.00023620708767429816, "loss": 0.012, "step": 7663 }, { "epoch": 1.56, "learning_rate": 0.00023619122285379438, "loss": 0.0129, "step": 7664 }, { "epoch": 1.56, "learning_rate": 0.00023617535659373445, "loss": 0.0097, "step": 7665 }, { "epoch": 1.56, "learning_rate": 0.00023615948889438345, "loss": 0.0348, "step": 7666 }, { "epoch": 1.56, "learning_rate": 0.00023614361975600633, "loss": 0.0072, "step": 7667 }, { "epoch": 1.56, "learning_rate": 0.00023612774917886815, "loss": 0.0341, "step": 7668 }, { "epoch": 1.56, "learning_rate": 0.000236111877163234, "loss": 0.0381, "step": 7669 }, { "epoch": 1.56, "learning_rate": 0.00023609600370936895, "loss": 0.0134, "step": 7670 }, { "epoch": 1.56, "learning_rate": 0.00023608012881753807, "loss": 0.0136, "step": 7671 }, { "epoch": 1.56, "learning_rate": 0.00023606425248800654, "loss": 0.0058, "step": 7672 }, { "epoch": 1.56, "learning_rate": 0.0002360483747210396, "loss": 0.0147, "step": 7673 }, { "epoch": 1.56, "learning_rate": 0.0002360324955169024, "loss": 0.0199, "step": 7674 }, { "epoch": 1.56, "learning_rate": 0.00023601661487586008, "loss": 0.0181, "step": 7675 }, { "epoch": 1.56, "learning_rate": 0.0002360007327981779, "loss": 0.0185, "step": 7676 }, { "epoch": 1.56, "learning_rate": 0.00023598484928412115, "loss": 0.011, "step": 7677 }, { "epoch": 1.56, "learning_rate": 0.0002359689643339552, "loss": 0.0102, "step": 7678 }, { "epoch": 1.56, "learning_rate": 0.00023595307794794515, "loss": 0.015, "step": 7679 }, { "epoch": 1.56, "learning_rate": 0.00023593719012635647, "loss": 0.0265, "step": 7680 }, { "epoch": 1.56, "learning_rate": 0.00023592130086945453, "loss": 0.0101, "step": 7681 }, { "epoch": 1.56, "learning_rate": 0.00023590541017750469, "loss": 0.007, "step": 7682 }, { "epoch": 1.56, "learning_rate": 0.00023588951805077231, "loss": 0.0154, "step": 7683 }, { "epoch": 1.56, "learning_rate": 0.0002358736244895229, "loss": 0.0148, "step": 7684 }, { "epoch": 1.56, "learning_rate": 0.00023585772949402182, "loss": 0.0184, "step": 7685 }, { "epoch": 1.57, "learning_rate": 0.00023584183306453457, "loss": 0.0085, "step": 7686 }, { "epoch": 1.57, "learning_rate": 0.00023582593520132673, "loss": 0.0092, "step": 7687 }, { "epoch": 1.57, "learning_rate": 0.00023581003590466372, "loss": 0.0109, "step": 7688 }, { "epoch": 1.57, "learning_rate": 0.00023579413517481115, "loss": 0.0184, "step": 7689 }, { "epoch": 1.57, "learning_rate": 0.00023577823301203457, "loss": 0.02, "step": 7690 }, { "epoch": 1.57, "learning_rate": 0.00023576232941659956, "loss": 0.0136, "step": 7691 }, { "epoch": 1.57, "learning_rate": 0.0002357464243887718, "loss": 0.0062, "step": 7692 }, { "epoch": 1.57, "learning_rate": 0.00023573051792881685, "loss": 0.0029, "step": 7693 }, { "epoch": 1.57, "learning_rate": 0.00023571461003700047, "loss": 0.0014, "step": 7694 }, { "epoch": 1.57, "learning_rate": 0.00023569870071358826, "loss": 0.0181, "step": 7695 }, { "epoch": 1.57, "learning_rate": 0.00023568278995884603, "loss": 0.0038, "step": 7696 }, { "epoch": 1.57, "learning_rate": 0.00023566687777303944, "loss": 0.0101, "step": 7697 }, { "epoch": 1.57, "learning_rate": 0.0002356509641564343, "loss": 0.0061, "step": 7698 }, { "epoch": 1.57, "learning_rate": 0.00023563504910929634, "loss": 0.0178, "step": 7699 }, { "epoch": 1.57, "learning_rate": 0.00023561913263189143, "loss": 0.0122, "step": 7700 }, { "epoch": 1.57, "learning_rate": 0.00023560321472448543, "loss": 0.0235, "step": 7701 }, { "epoch": 1.57, "learning_rate": 0.0002355872953873441, "loss": 0.0286, "step": 7702 }, { "epoch": 1.57, "learning_rate": 0.0002355713746207334, "loss": 0.0147, "step": 7703 }, { "epoch": 1.57, "learning_rate": 0.00023555545242491926, "loss": 0.0117, "step": 7704 }, { "epoch": 1.57, "learning_rate": 0.00023553952880016747, "loss": 0.0167, "step": 7705 }, { "epoch": 1.57, "learning_rate": 0.00023552360374674418, "loss": 0.0083, "step": 7706 }, { "epoch": 1.57, "learning_rate": 0.00023550767726491522, "loss": 0.0178, "step": 7707 }, { "epoch": 1.57, "learning_rate": 0.00023549174935494666, "loss": 0.0069, "step": 7708 }, { "epoch": 1.57, "learning_rate": 0.00023547582001710448, "loss": 0.0239, "step": 7709 }, { "epoch": 1.57, "learning_rate": 0.0002354598892516548, "loss": 0.0268, "step": 7710 }, { "epoch": 1.57, "learning_rate": 0.0002354439570588636, "loss": 0.0183, "step": 7711 }, { "epoch": 1.57, "learning_rate": 0.00023542802343899706, "loss": 0.0036, "step": 7712 }, { "epoch": 1.57, "learning_rate": 0.00023541208839232127, "loss": 0.0073, "step": 7713 }, { "epoch": 1.57, "learning_rate": 0.00023539615191910237, "loss": 0.011, "step": 7714 }, { "epoch": 1.57, "learning_rate": 0.0002353802140196066, "loss": 0.0089, "step": 7715 }, { "epoch": 1.57, "learning_rate": 0.0002353642746941, "loss": 0.0155, "step": 7716 }, { "epoch": 1.57, "learning_rate": 0.00023534833394284893, "loss": 0.0187, "step": 7717 }, { "epoch": 1.57, "learning_rate": 0.00023533239176611953, "loss": 0.0193, "step": 7718 }, { "epoch": 1.57, "learning_rate": 0.0002353164481641781, "loss": 0.0066, "step": 7719 }, { "epoch": 1.57, "learning_rate": 0.00023530050313729105, "loss": 0.0103, "step": 7720 }, { "epoch": 1.57, "learning_rate": 0.00023528455668572453, "loss": 0.0145, "step": 7721 }, { "epoch": 1.57, "learning_rate": 0.00023526860880974484, "loss": 0.011, "step": 7722 }, { "epoch": 1.57, "learning_rate": 0.00023525265950961852, "loss": 0.0058, "step": 7723 }, { "epoch": 1.57, "learning_rate": 0.00023523670878561185, "loss": 0.0148, "step": 7724 }, { "epoch": 1.57, "learning_rate": 0.00023522075663799124, "loss": 0.0129, "step": 7725 }, { "epoch": 1.57, "learning_rate": 0.0002352048030670231, "loss": 0.0231, "step": 7726 }, { "epoch": 1.57, "learning_rate": 0.00023518884807297396, "loss": 0.0055, "step": 7727 }, { "epoch": 1.57, "learning_rate": 0.0002351728916561102, "loss": 0.0169, "step": 7728 }, { "epoch": 1.57, "learning_rate": 0.0002351569338166984, "loss": 0.0111, "step": 7729 }, { "epoch": 1.57, "learning_rate": 0.00023514097455500508, "loss": 0.0166, "step": 7730 }, { "epoch": 1.57, "learning_rate": 0.00023512501387129675, "loss": 0.0026, "step": 7731 }, { "epoch": 1.57, "learning_rate": 0.00023510905176584002, "loss": 0.0069, "step": 7732 }, { "epoch": 1.57, "learning_rate": 0.00023509308823890145, "loss": 0.0073, "step": 7733 }, { "epoch": 1.57, "learning_rate": 0.00023507712329074766, "loss": 0.0135, "step": 7734 }, { "epoch": 1.57, "learning_rate": 0.00023506115692164536, "loss": 0.0209, "step": 7735 }, { "epoch": 1.58, "learning_rate": 0.00023504518913186116, "loss": 0.0036, "step": 7736 }, { "epoch": 1.58, "learning_rate": 0.00023502921992166176, "loss": 0.0243, "step": 7737 }, { "epoch": 1.58, "learning_rate": 0.0002350132492913139, "loss": 0.0168, "step": 7738 }, { "epoch": 1.58, "learning_rate": 0.00023499727724108428, "loss": 0.0218, "step": 7739 }, { "epoch": 1.58, "learning_rate": 0.0002349813037712397, "loss": 0.0543, "step": 7740 }, { "epoch": 1.58, "learning_rate": 0.0002349653288820469, "loss": 0.0105, "step": 7741 }, { "epoch": 1.58, "learning_rate": 0.00023494935257377278, "loss": 0.0264, "step": 7742 }, { "epoch": 1.58, "learning_rate": 0.0002349333748466841, "loss": 0.0183, "step": 7743 }, { "epoch": 1.58, "learning_rate": 0.00023491739570104773, "loss": 0.0153, "step": 7744 }, { "epoch": 1.58, "learning_rate": 0.00023490141513713057, "loss": 0.005, "step": 7745 }, { "epoch": 1.58, "learning_rate": 0.0002348854331551995, "loss": 0.0091, "step": 7746 }, { "epoch": 1.58, "learning_rate": 0.00023486944975552147, "loss": 0.0088, "step": 7747 }, { "epoch": 1.58, "learning_rate": 0.00023485346493836343, "loss": 0.0127, "step": 7748 }, { "epoch": 1.58, "learning_rate": 0.00023483747870399233, "loss": 0.0115, "step": 7749 }, { "epoch": 1.58, "learning_rate": 0.00023482149105267521, "loss": 0.0264, "step": 7750 }, { "epoch": 1.58, "learning_rate": 0.0002348055019846791, "loss": 0.0269, "step": 7751 }, { "epoch": 1.58, "learning_rate": 0.00023478951150027104, "loss": 0.0427, "step": 7752 }, { "epoch": 1.58, "learning_rate": 0.00023477351959971804, "loss": 0.0111, "step": 7753 }, { "epoch": 1.58, "learning_rate": 0.00023475752628328723, "loss": 0.0125, "step": 7754 }, { "epoch": 1.58, "learning_rate": 0.00023474153155124574, "loss": 0.019, "step": 7755 }, { "epoch": 1.58, "learning_rate": 0.00023472553540386073, "loss": 0.0122, "step": 7756 }, { "epoch": 1.58, "learning_rate": 0.0002347095378413994, "loss": 0.0028, "step": 7757 }, { "epoch": 1.58, "learning_rate": 0.0002346935388641288, "loss": 0.0023, "step": 7758 }, { "epoch": 1.58, "learning_rate": 0.0002346775384723163, "loss": 0.014, "step": 7759 }, { "epoch": 1.58, "learning_rate": 0.000234661536666229, "loss": 0.0042, "step": 7760 }, { "epoch": 1.58, "learning_rate": 0.00023464553344613428, "loss": 0.0185, "step": 7761 }, { "epoch": 1.58, "learning_rate": 0.0002346295288122994, "loss": 0.0357, "step": 7762 }, { "epoch": 1.58, "learning_rate": 0.00023461352276499156, "loss": 0.0086, "step": 7763 }, { "epoch": 1.58, "learning_rate": 0.0002345975153044782, "loss": 0.0082, "step": 7764 }, { "epoch": 1.58, "learning_rate": 0.00023458150643102665, "loss": 0.035, "step": 7765 }, { "epoch": 1.58, "learning_rate": 0.00023456549614490432, "loss": 0.0098, "step": 7766 }, { "epoch": 1.58, "learning_rate": 0.00023454948444637854, "loss": 0.0182, "step": 7767 }, { "epoch": 1.58, "learning_rate": 0.00023453347133571673, "loss": 0.014, "step": 7768 }, { "epoch": 1.58, "learning_rate": 0.00023451745681318646, "loss": 0.0045, "step": 7769 }, { "epoch": 1.58, "learning_rate": 0.00023450144087905508, "loss": 0.007, "step": 7770 }, { "epoch": 1.58, "learning_rate": 0.00023448542353359013, "loss": 0.0047, "step": 7771 }, { "epoch": 1.58, "learning_rate": 0.00023446940477705913, "loss": 0.0244, "step": 7772 }, { "epoch": 1.58, "learning_rate": 0.00023445338460972962, "loss": 0.018, "step": 7773 }, { "epoch": 1.58, "learning_rate": 0.00023443736303186918, "loss": 0.0157, "step": 7774 }, { "epoch": 1.58, "learning_rate": 0.0002344213400437454, "loss": 0.0157, "step": 7775 }, { "epoch": 1.58, "learning_rate": 0.00023440531564562588, "loss": 0.0153, "step": 7776 }, { "epoch": 1.58, "learning_rate": 0.00023438928983777826, "loss": 0.0106, "step": 7777 }, { "epoch": 1.58, "learning_rate": 0.0002343732626204702, "loss": 0.0111, "step": 7778 }, { "epoch": 1.58, "learning_rate": 0.0002343572339939694, "loss": 0.054, "step": 7779 }, { "epoch": 1.58, "learning_rate": 0.00023434120395854355, "loss": 0.0081, "step": 7780 }, { "epoch": 1.58, "learning_rate": 0.00023432517251446036, "loss": 0.032, "step": 7781 }, { "epoch": 1.58, "learning_rate": 0.00023430913966198766, "loss": 0.0216, "step": 7782 }, { "epoch": 1.58, "learning_rate": 0.00023429310540139313, "loss": 0.0135, "step": 7783 }, { "epoch": 1.58, "learning_rate": 0.0002342770697329447, "loss": 0.0226, "step": 7784 }, { "epoch": 1.59, "learning_rate": 0.00023426103265691004, "loss": 0.0079, "step": 7785 }, { "epoch": 1.59, "learning_rate": 0.00023424499417355713, "loss": 0.0276, "step": 7786 }, { "epoch": 1.59, "learning_rate": 0.00023422895428315378, "loss": 0.0029, "step": 7787 }, { "epoch": 1.59, "learning_rate": 0.00023421291298596786, "loss": 0.0099, "step": 7788 }, { "epoch": 1.59, "learning_rate": 0.0002341968702822674, "loss": 0.0185, "step": 7789 }, { "epoch": 1.59, "learning_rate": 0.00023418082617232026, "loss": 0.0197, "step": 7790 }, { "epoch": 1.59, "learning_rate": 0.0002341647806563944, "loss": 0.0158, "step": 7791 }, { "epoch": 1.59, "learning_rate": 0.00023414873373475784, "loss": 0.0135, "step": 7792 }, { "epoch": 1.59, "learning_rate": 0.00023413268540767857, "loss": 0.0086, "step": 7793 }, { "epoch": 1.59, "learning_rate": 0.00023411663567542466, "loss": 0.0237, "step": 7794 }, { "epoch": 1.59, "learning_rate": 0.00023410058453826414, "loss": 0.0112, "step": 7795 }, { "epoch": 1.59, "learning_rate": 0.00023408453199646507, "loss": 0.0076, "step": 7796 }, { "epoch": 1.59, "learning_rate": 0.00023406847805029565, "loss": 0.017, "step": 7797 }, { "epoch": 1.59, "learning_rate": 0.000234052422700024, "loss": 0.0178, "step": 7798 }, { "epoch": 1.59, "learning_rate": 0.00023403636594591815, "loss": 0.0131, "step": 7799 }, { "epoch": 1.59, "learning_rate": 0.0002340203077882464, "loss": 0.0056, "step": 7800 }, { "epoch": 1.59, "learning_rate": 0.00023400424822727687, "loss": 0.0083, "step": 7801 }, { "epoch": 1.59, "learning_rate": 0.00023398818726327785, "loss": 0.0095, "step": 7802 }, { "epoch": 1.59, "learning_rate": 0.0002339721248965176, "loss": 0.0064, "step": 7803 }, { "epoch": 1.59, "learning_rate": 0.00023395606112726428, "loss": 0.0077, "step": 7804 }, { "epoch": 1.59, "learning_rate": 0.0002339399959557863, "loss": 0.0065, "step": 7805 }, { "epoch": 1.59, "learning_rate": 0.00023392392938235195, "loss": 0.0065, "step": 7806 }, { "epoch": 1.59, "learning_rate": 0.00023390786140722953, "loss": 0.0266, "step": 7807 }, { "epoch": 1.59, "learning_rate": 0.00023389179203068747, "loss": 0.0176, "step": 7808 }, { "epoch": 1.59, "learning_rate": 0.00023387572125299413, "loss": 0.01, "step": 7809 }, { "epoch": 1.59, "learning_rate": 0.00023385964907441788, "loss": 0.0124, "step": 7810 }, { "epoch": 1.59, "learning_rate": 0.00023384357549522723, "loss": 0.0121, "step": 7811 }, { "epoch": 1.59, "learning_rate": 0.00023382750051569062, "loss": 0.0464, "step": 7812 }, { "epoch": 1.59, "learning_rate": 0.00023381142413607647, "loss": 0.007, "step": 7813 }, { "epoch": 1.59, "learning_rate": 0.00023379534635665334, "loss": 0.0217, "step": 7814 }, { "epoch": 1.59, "learning_rate": 0.00023377926717768973, "loss": 0.005, "step": 7815 }, { "epoch": 1.59, "learning_rate": 0.00023376318659945426, "loss": 0.0385, "step": 7816 }, { "epoch": 1.59, "learning_rate": 0.00023374710462221543, "loss": 0.0035, "step": 7817 }, { "epoch": 1.59, "learning_rate": 0.0002337310212462419, "loss": 0.0051, "step": 7818 }, { "epoch": 1.59, "learning_rate": 0.00023371493647180222, "loss": 0.0137, "step": 7819 }, { "epoch": 1.59, "learning_rate": 0.00023369885029916507, "loss": 0.0108, "step": 7820 }, { "epoch": 1.59, "learning_rate": 0.0002336827627285992, "loss": 0.0134, "step": 7821 }, { "epoch": 1.59, "learning_rate": 0.0002336666737603732, "loss": 0.0525, "step": 7822 }, { "epoch": 1.59, "learning_rate": 0.0002336505833947558, "loss": 0.0034, "step": 7823 }, { "epoch": 1.59, "learning_rate": 0.00023363449163201576, "loss": 0.0202, "step": 7824 }, { "epoch": 1.59, "learning_rate": 0.0002336183984724218, "loss": 0.0158, "step": 7825 }, { "epoch": 1.59, "learning_rate": 0.00023360230391624283, "loss": 0.0042, "step": 7826 }, { "epoch": 1.59, "learning_rate": 0.0002335862079637475, "loss": 0.0105, "step": 7827 }, { "epoch": 1.59, "learning_rate": 0.00023357011061520474, "loss": 0.0055, "step": 7828 }, { "epoch": 1.59, "learning_rate": 0.00023355401187088337, "loss": 0.0142, "step": 7829 }, { "epoch": 1.59, "learning_rate": 0.0002335379117310523, "loss": 0.0131, "step": 7830 }, { "epoch": 1.59, "learning_rate": 0.00023352181019598042, "loss": 0.0129, "step": 7831 }, { "epoch": 1.59, "learning_rate": 0.00023350570726593663, "loss": 0.0206, "step": 7832 }, { "epoch": 1.59, "learning_rate": 0.00023348960294118995, "loss": 0.0428, "step": 7833 }, { "epoch": 1.6, "learning_rate": 0.00023347349722200924, "loss": 0.0075, "step": 7834 }, { "epoch": 1.6, "learning_rate": 0.0002334573901086636, "loss": 0.008, "step": 7835 }, { "epoch": 1.6, "learning_rate": 0.000233441281601422, "loss": 0.0085, "step": 7836 }, { "epoch": 1.6, "learning_rate": 0.00023342517170055346, "loss": 0.0222, "step": 7837 }, { "epoch": 1.6, "learning_rate": 0.00023340906040632712, "loss": 0.008, "step": 7838 }, { "epoch": 1.6, "learning_rate": 0.000233392947719012, "loss": 0.0231, "step": 7839 }, { "epoch": 1.6, "learning_rate": 0.00023337683363887729, "loss": 0.0097, "step": 7840 }, { "epoch": 1.6, "learning_rate": 0.00023336071816619202, "loss": 0.0075, "step": 7841 }, { "epoch": 1.6, "learning_rate": 0.00023334460130122536, "loss": 0.0084, "step": 7842 }, { "epoch": 1.6, "learning_rate": 0.0002333284830442466, "loss": 0.0287, "step": 7843 }, { "epoch": 1.6, "learning_rate": 0.00023331236339552489, "loss": 0.0101, "step": 7844 }, { "epoch": 1.6, "learning_rate": 0.0002332962423553294, "loss": 0.0091, "step": 7845 }, { "epoch": 1.6, "learning_rate": 0.00023328011992392945, "loss": 0.0118, "step": 7846 }, { "epoch": 1.6, "learning_rate": 0.0002332639961015943, "loss": 0.0109, "step": 7847 }, { "epoch": 1.6, "learning_rate": 0.0002332478708885932, "loss": 0.0192, "step": 7848 }, { "epoch": 1.6, "learning_rate": 0.00023323174428519563, "loss": 0.0058, "step": 7849 }, { "epoch": 1.6, "learning_rate": 0.00023321561629167074, "loss": 0.0134, "step": 7850 }, { "epoch": 1.6, "learning_rate": 0.00023319948690828795, "loss": 0.0118, "step": 7851 }, { "epoch": 1.6, "learning_rate": 0.00023318335613531675, "loss": 0.0038, "step": 7852 }, { "epoch": 1.6, "learning_rate": 0.00023316722397302638, "loss": 0.0164, "step": 7853 }, { "epoch": 1.6, "learning_rate": 0.0002331510904216865, "loss": 0.0108, "step": 7854 }, { "epoch": 1.6, "learning_rate": 0.00023313495548156637, "loss": 0.0028, "step": 7855 }, { "epoch": 1.6, "learning_rate": 0.00023311881915293555, "loss": 0.0049, "step": 7856 }, { "epoch": 1.6, "learning_rate": 0.00023310268143606361, "loss": 0.0087, "step": 7857 }, { "epoch": 1.6, "learning_rate": 0.00023308654233122, "loss": 0.0099, "step": 7858 }, { "epoch": 1.6, "learning_rate": 0.0002330704018386743, "loss": 0.0188, "step": 7859 }, { "epoch": 1.6, "learning_rate": 0.00023305425995869604, "loss": 0.026, "step": 7860 }, { "epoch": 1.6, "learning_rate": 0.0002330381166915549, "loss": 0.002, "step": 7861 }, { "epoch": 1.6, "learning_rate": 0.00023302197203752047, "loss": 0.0063, "step": 7862 }, { "epoch": 1.6, "learning_rate": 0.00023300582599686238, "loss": 0.0163, "step": 7863 }, { "epoch": 1.6, "learning_rate": 0.00023298967856985034, "loss": 0.0146, "step": 7864 }, { "epoch": 1.6, "learning_rate": 0.000232973529756754, "loss": 0.0197, "step": 7865 }, { "epoch": 1.6, "learning_rate": 0.00023295737955784303, "loss": 0.0118, "step": 7866 }, { "epoch": 1.6, "learning_rate": 0.00023294122797338728, "loss": 0.0229, "step": 7867 }, { "epoch": 1.6, "learning_rate": 0.00023292507500365648, "loss": 0.0083, "step": 7868 }, { "epoch": 1.6, "learning_rate": 0.00023290892064892037, "loss": 0.0027, "step": 7869 }, { "epoch": 1.6, "learning_rate": 0.00023289276490944877, "loss": 0.0182, "step": 7870 }, { "epoch": 1.6, "learning_rate": 0.00023287660778551153, "loss": 0.0201, "step": 7871 }, { "epoch": 1.6, "learning_rate": 0.00023286044927737855, "loss": 0.0062, "step": 7872 }, { "epoch": 1.6, "learning_rate": 0.0002328442893853196, "loss": 0.002, "step": 7873 }, { "epoch": 1.6, "learning_rate": 0.00023282812810960463, "loss": 0.0491, "step": 7874 }, { "epoch": 1.6, "learning_rate": 0.0002328119654505036, "loss": 0.0031, "step": 7875 }, { "epoch": 1.6, "learning_rate": 0.0002327958014082864, "loss": 0.0033, "step": 7876 }, { "epoch": 1.6, "learning_rate": 0.0002327796359832231, "loss": 0.0042, "step": 7877 }, { "epoch": 1.6, "learning_rate": 0.00023276346917558356, "loss": 0.0162, "step": 7878 }, { "epoch": 1.6, "learning_rate": 0.00023274730098563786, "loss": 0.0054, "step": 7879 }, { "epoch": 1.6, "learning_rate": 0.00023273113141365604, "loss": 0.0122, "step": 7880 }, { "epoch": 1.6, "learning_rate": 0.00023271496045990816, "loss": 0.0117, "step": 7881 }, { "epoch": 1.6, "learning_rate": 0.00023269878812466434, "loss": 0.0181, "step": 7882 }, { "epoch": 1.61, "learning_rate": 0.00023268261440819463, "loss": 0.0037, "step": 7883 }, { "epoch": 1.61, "learning_rate": 0.00023266643931076916, "loss": 0.0128, "step": 7884 }, { "epoch": 1.61, "learning_rate": 0.00023265026283265813, "loss": 0.014, "step": 7885 }, { "epoch": 1.61, "learning_rate": 0.00023263408497413172, "loss": 0.0088, "step": 7886 }, { "epoch": 1.61, "learning_rate": 0.0002326179057354601, "loss": 0.0164, "step": 7887 }, { "epoch": 1.61, "learning_rate": 0.00023260172511691346, "loss": 0.0132, "step": 7888 }, { "epoch": 1.61, "learning_rate": 0.00023258554311876215, "loss": 0.0111, "step": 7889 }, { "epoch": 1.61, "learning_rate": 0.0002325693597412763, "loss": 0.0173, "step": 7890 }, { "epoch": 1.61, "learning_rate": 0.00023255317498472634, "loss": 0.0153, "step": 7891 }, { "epoch": 1.61, "learning_rate": 0.0002325369888493825, "loss": 0.0089, "step": 7892 }, { "epoch": 1.61, "learning_rate": 0.00023252080133551517, "loss": 0.0472, "step": 7893 }, { "epoch": 1.61, "learning_rate": 0.00023250461244339469, "loss": 0.0299, "step": 7894 }, { "epoch": 1.61, "learning_rate": 0.00023248842217329143, "loss": 0.0202, "step": 7895 }, { "epoch": 1.61, "learning_rate": 0.0002324722305254758, "loss": 0.0311, "step": 7896 }, { "epoch": 1.61, "learning_rate": 0.00023245603750021826, "loss": 0.0078, "step": 7897 }, { "epoch": 1.61, "learning_rate": 0.00023243984309778926, "loss": 0.0204, "step": 7898 }, { "epoch": 1.61, "learning_rate": 0.00023242364731845922, "loss": 0.0107, "step": 7899 }, { "epoch": 1.61, "learning_rate": 0.00023240745016249876, "loss": 0.0095, "step": 7900 }, { "epoch": 1.61, "learning_rate": 0.00023239125163017826, "loss": 0.0118, "step": 7901 }, { "epoch": 1.61, "learning_rate": 0.00023237505172176833, "loss": 0.0324, "step": 7902 }, { "epoch": 1.61, "learning_rate": 0.0002323588504375396, "loss": 0.021, "step": 7903 }, { "epoch": 1.61, "learning_rate": 0.00023234264777776255, "loss": 0.0066, "step": 7904 }, { "epoch": 1.61, "learning_rate": 0.00023232644374270785, "loss": 0.0084, "step": 7905 }, { "epoch": 1.61, "learning_rate": 0.00023231023833264618, "loss": 0.0193, "step": 7906 }, { "epoch": 1.61, "learning_rate": 0.00023229403154784812, "loss": 0.0165, "step": 7907 }, { "epoch": 1.61, "learning_rate": 0.00023227782338858442, "loss": 0.0215, "step": 7908 }, { "epoch": 1.61, "learning_rate": 0.00023226161385512574, "loss": 0.01, "step": 7909 }, { "epoch": 1.61, "learning_rate": 0.00023224540294774286, "loss": 0.0126, "step": 7910 }, { "epoch": 1.61, "learning_rate": 0.00023222919066670647, "loss": 0.016, "step": 7911 }, { "epoch": 1.61, "learning_rate": 0.00023221297701228735, "loss": 0.0185, "step": 7912 }, { "epoch": 1.61, "learning_rate": 0.00023219676198475638, "loss": 0.0094, "step": 7913 }, { "epoch": 1.61, "learning_rate": 0.00023218054558438433, "loss": 0.0088, "step": 7914 }, { "epoch": 1.61, "learning_rate": 0.000232164327811442, "loss": 0.0089, "step": 7915 }, { "epoch": 1.61, "learning_rate": 0.00023214810866620028, "loss": 0.0157, "step": 7916 }, { "epoch": 1.61, "learning_rate": 0.00023213188814893014, "loss": 0.0053, "step": 7917 }, { "epoch": 1.61, "learning_rate": 0.00023211566625990242, "loss": 0.0128, "step": 7918 }, { "epoch": 1.61, "learning_rate": 0.00023209944299938806, "loss": 0.0131, "step": 7919 }, { "epoch": 1.61, "learning_rate": 0.00023208321836765803, "loss": 0.0416, "step": 7920 }, { "epoch": 1.61, "learning_rate": 0.0002320669923649833, "loss": 0.0127, "step": 7921 }, { "epoch": 1.61, "learning_rate": 0.0002320507649916349, "loss": 0.0077, "step": 7922 }, { "epoch": 1.61, "learning_rate": 0.00023203453624788387, "loss": 0.0069, "step": 7923 }, { "epoch": 1.61, "learning_rate": 0.00023201830613400117, "loss": 0.0184, "step": 7924 }, { "epoch": 1.61, "learning_rate": 0.00023200207465025796, "loss": 0.0398, "step": 7925 }, { "epoch": 1.61, "learning_rate": 0.0002319858417969253, "loss": 0.0598, "step": 7926 }, { "epoch": 1.61, "learning_rate": 0.00023196960757427437, "loss": 0.0092, "step": 7927 }, { "epoch": 1.61, "learning_rate": 0.00023195337198257625, "loss": 0.027, "step": 7928 }, { "epoch": 1.61, "learning_rate": 0.0002319371350221021, "loss": 0.0121, "step": 7929 }, { "epoch": 1.61, "learning_rate": 0.00023192089669312312, "loss": 0.0207, "step": 7930 }, { "epoch": 1.61, "learning_rate": 0.00023190465699591056, "loss": 0.0129, "step": 7931 }, { "epoch": 1.62, "learning_rate": 0.0002318884159307356, "loss": 0.0121, "step": 7932 }, { "epoch": 1.62, "learning_rate": 0.00023187217349786952, "loss": 0.0387, "step": 7933 }, { "epoch": 1.62, "learning_rate": 0.00023185592969758362, "loss": 0.0134, "step": 7934 }, { "epoch": 1.62, "learning_rate": 0.00023183968453014916, "loss": 0.0054, "step": 7935 }, { "epoch": 1.62, "learning_rate": 0.00023182343799583744, "loss": 0.019, "step": 7936 }, { "epoch": 1.62, "learning_rate": 0.00023180719009491995, "loss": 0.0216, "step": 7937 }, { "epoch": 1.62, "learning_rate": 0.00023179094082766792, "loss": 0.0347, "step": 7938 }, { "epoch": 1.62, "learning_rate": 0.00023177469019435275, "loss": 0.0085, "step": 7939 }, { "epoch": 1.62, "learning_rate": 0.00023175843819524592, "loss": 0.0202, "step": 7940 }, { "epoch": 1.62, "learning_rate": 0.00023174218483061886, "loss": 0.0288, "step": 7941 }, { "epoch": 1.62, "learning_rate": 0.00023172593010074304, "loss": 0.0339, "step": 7942 }, { "epoch": 1.62, "learning_rate": 0.00023170967400588984, "loss": 0.0086, "step": 7943 }, { "epoch": 1.62, "learning_rate": 0.0002316934165463309, "loss": 0.0032, "step": 7944 }, { "epoch": 1.62, "learning_rate": 0.00023167715772233767, "loss": 0.0228, "step": 7945 }, { "epoch": 1.62, "learning_rate": 0.00023166089753418176, "loss": 0.0035, "step": 7946 }, { "epoch": 1.62, "learning_rate": 0.0002316446359821347, "loss": 0.0048, "step": 7947 }, { "epoch": 1.62, "learning_rate": 0.0002316283730664681, "loss": 0.0136, "step": 7948 }, { "epoch": 1.62, "learning_rate": 0.00023161210878745356, "loss": 0.0104, "step": 7949 }, { "epoch": 1.62, "learning_rate": 0.00023159584314536274, "loss": 0.0156, "step": 7950 }, { "epoch": 1.62, "learning_rate": 0.00023157957614046738, "loss": 0.0034, "step": 7951 }, { "epoch": 1.62, "learning_rate": 0.00023156330777303907, "loss": 0.0193, "step": 7952 }, { "epoch": 1.62, "learning_rate": 0.00023154703804334958, "loss": 0.033, "step": 7953 }, { "epoch": 1.62, "learning_rate": 0.0002315307669516706, "loss": 0.0091, "step": 7954 }, { "epoch": 1.62, "learning_rate": 0.00023151449449827392, "loss": 0.0139, "step": 7955 }, { "epoch": 1.62, "learning_rate": 0.0002314982206834313, "loss": 0.0067, "step": 7956 }, { "epoch": 1.62, "learning_rate": 0.00023148194550741457, "loss": 0.0132, "step": 7957 }, { "epoch": 1.62, "learning_rate": 0.00023146566897049557, "loss": 0.0098, "step": 7958 }, { "epoch": 1.62, "learning_rate": 0.00023144939107294608, "loss": 0.0295, "step": 7959 }, { "epoch": 1.62, "learning_rate": 0.00023143311181503804, "loss": 0.0222, "step": 7960 }, { "epoch": 1.62, "learning_rate": 0.00023141683119704332, "loss": 0.0161, "step": 7961 }, { "epoch": 1.62, "learning_rate": 0.00023140054921923377, "loss": 0.0091, "step": 7962 }, { "epoch": 1.62, "learning_rate": 0.00023138426588188146, "loss": 0.0156, "step": 7963 }, { "epoch": 1.62, "learning_rate": 0.00023136798118525824, "loss": 0.022, "step": 7964 }, { "epoch": 1.62, "learning_rate": 0.0002313516951296362, "loss": 0.014, "step": 7965 }, { "epoch": 1.62, "learning_rate": 0.00023133540771528725, "loss": 0.0059, "step": 7966 }, { "epoch": 1.62, "learning_rate": 0.00023131911894248348, "loss": 0.0171, "step": 7967 }, { "epoch": 1.62, "learning_rate": 0.00023130282881149685, "loss": 0.0139, "step": 7968 }, { "epoch": 1.62, "learning_rate": 0.00023128653732259962, "loss": 0.0184, "step": 7969 }, { "epoch": 1.62, "learning_rate": 0.00023127024447606371, "loss": 0.0158, "step": 7970 }, { "epoch": 1.62, "learning_rate": 0.00023125395027216134, "loss": 0.0508, "step": 7971 }, { "epoch": 1.62, "learning_rate": 0.0002312376547111646, "loss": 0.0203, "step": 7972 }, { "epoch": 1.62, "learning_rate": 0.00023122135779334564, "loss": 0.0104, "step": 7973 }, { "epoch": 1.62, "learning_rate": 0.00023120505951897678, "loss": 0.0307, "step": 7974 }, { "epoch": 1.62, "learning_rate": 0.00023118875988833009, "loss": 0.0129, "step": 7975 }, { "epoch": 1.62, "learning_rate": 0.00023117245890167784, "loss": 0.0105, "step": 7976 }, { "epoch": 1.62, "learning_rate": 0.00023115615655929233, "loss": 0.0077, "step": 7977 }, { "epoch": 1.62, "learning_rate": 0.00023113985286144582, "loss": 0.0067, "step": 7978 }, { "epoch": 1.62, "learning_rate": 0.0002311235478084106, "loss": 0.0012, "step": 7979 }, { "epoch": 1.62, "learning_rate": 0.00023110724140045898, "loss": 0.019, "step": 7980 }, { "epoch": 1.63, "learning_rate": 0.00023109093363786332, "loss": 0.0125, "step": 7981 }, { "epoch": 1.63, "learning_rate": 0.000231074624520896, "loss": 0.015, "step": 7982 }, { "epoch": 1.63, "learning_rate": 0.00023105831404982943, "loss": 0.0073, "step": 7983 }, { "epoch": 1.63, "learning_rate": 0.00023104200222493602, "loss": 0.0041, "step": 7984 }, { "epoch": 1.63, "learning_rate": 0.00023102568904648818, "loss": 0.008, "step": 7985 }, { "epoch": 1.63, "learning_rate": 0.00023100937451475838, "loss": 0.0044, "step": 7986 }, { "epoch": 1.63, "learning_rate": 0.0002309930586300191, "loss": 0.0298, "step": 7987 }, { "epoch": 1.63, "learning_rate": 0.00023097674139254293, "loss": 0.0042, "step": 7988 }, { "epoch": 1.63, "learning_rate": 0.00023096042280260225, "loss": 0.0173, "step": 7989 }, { "epoch": 1.63, "learning_rate": 0.0002309441028604697, "loss": 0.0251, "step": 7990 }, { "epoch": 1.63, "learning_rate": 0.00023092778156641783, "loss": 0.0273, "step": 7991 }, { "epoch": 1.63, "learning_rate": 0.00023091145892071923, "loss": 0.0126, "step": 7992 }, { "epoch": 1.63, "learning_rate": 0.0002308951349236466, "loss": 0.0063, "step": 7993 }, { "epoch": 1.63, "learning_rate": 0.00023087880957547245, "loss": 0.008, "step": 7994 }, { "epoch": 1.63, "learning_rate": 0.00023086248287646955, "loss": 0.0273, "step": 7995 }, { "epoch": 1.63, "learning_rate": 0.00023084615482691053, "loss": 0.0028, "step": 7996 }, { "epoch": 1.63, "learning_rate": 0.00023082982542706816, "loss": 0.0201, "step": 7997 }, { "epoch": 1.63, "learning_rate": 0.00023081349467721508, "loss": 0.0315, "step": 7998 }, { "epoch": 1.63, "learning_rate": 0.00023079716257762409, "loss": 0.0136, "step": 7999 }, { "epoch": 1.63, "learning_rate": 0.00023078082912856798, "loss": 0.0214, "step": 8000 }, { "epoch": 1.63, "learning_rate": 0.00023076449433031952, "loss": 0.0248, "step": 8001 }, { "epoch": 1.63, "learning_rate": 0.00023074815818315158, "loss": 0.0035, "step": 8002 }, { "epoch": 1.63, "learning_rate": 0.000230731820687337, "loss": 0.0081, "step": 8003 }, { "epoch": 1.63, "learning_rate": 0.00023071548184314857, "loss": 0.0163, "step": 8004 }, { "epoch": 1.63, "learning_rate": 0.0002306991416508592, "loss": 0.0082, "step": 8005 }, { "epoch": 1.63, "learning_rate": 0.00023068280011074197, "loss": 0.0172, "step": 8006 }, { "epoch": 1.63, "learning_rate": 0.00023066645722306952, "loss": 0.0306, "step": 8007 }, { "epoch": 1.63, "learning_rate": 0.0002306501129881151, "loss": 0.0225, "step": 8008 }, { "epoch": 1.63, "learning_rate": 0.00023063376740615148, "loss": 0.0049, "step": 8009 }, { "epoch": 1.63, "learning_rate": 0.00023061742047745173, "loss": 0.0388, "step": 8010 }, { "epoch": 1.63, "learning_rate": 0.00023060107220228892, "loss": 0.0119, "step": 8011 }, { "epoch": 1.63, "learning_rate": 0.00023058472258093602, "loss": 0.011, "step": 8012 }, { "epoch": 1.63, "learning_rate": 0.00023056837161366617, "loss": 0.0131, "step": 8013 }, { "epoch": 1.63, "learning_rate": 0.0002305520193007524, "loss": 0.0093, "step": 8014 }, { "epoch": 1.63, "learning_rate": 0.00023053566564246788, "loss": 0.0144, "step": 8015 }, { "epoch": 1.63, "learning_rate": 0.00023051931063908576, "loss": 0.0345, "step": 8016 }, { "epoch": 1.63, "learning_rate": 0.00023050295429087912, "loss": 0.016, "step": 8017 }, { "epoch": 1.63, "learning_rate": 0.00023048659659812118, "loss": 0.0205, "step": 8018 }, { "epoch": 1.63, "learning_rate": 0.00023047023756108512, "loss": 0.0053, "step": 8019 }, { "epoch": 1.63, "learning_rate": 0.00023045387718004427, "loss": 0.0167, "step": 8020 }, { "epoch": 1.63, "learning_rate": 0.00023043751545527173, "loss": 0.014, "step": 8021 }, { "epoch": 1.63, "learning_rate": 0.00023042115238704083, "loss": 0.0163, "step": 8022 }, { "epoch": 1.63, "learning_rate": 0.00023040478797562496, "loss": 0.004, "step": 8023 }, { "epoch": 1.63, "learning_rate": 0.0002303884222212973, "loss": 0.0336, "step": 8024 }, { "epoch": 1.63, "learning_rate": 0.0002303720551243313, "loss": 0.0117, "step": 8025 }, { "epoch": 1.63, "learning_rate": 0.00023035568668500022, "loss": 0.0123, "step": 8026 }, { "epoch": 1.63, "learning_rate": 0.0002303393169035775, "loss": 0.01, "step": 8027 }, { "epoch": 1.63, "learning_rate": 0.00023032294578033652, "loss": 0.0117, "step": 8028 }, { "epoch": 1.63, "learning_rate": 0.00023030657331555074, "loss": 0.0544, "step": 8029 }, { "epoch": 1.64, "learning_rate": 0.00023029019950949366, "loss": 0.0078, "step": 8030 }, { "epoch": 1.64, "learning_rate": 0.0002302738243624386, "loss": 0.0138, "step": 8031 }, { "epoch": 1.64, "learning_rate": 0.00023025744787465917, "loss": 0.0068, "step": 8032 }, { "epoch": 1.64, "learning_rate": 0.00023024107004642887, "loss": 0.0163, "step": 8033 }, { "epoch": 1.64, "learning_rate": 0.00023022469087802123, "loss": 0.0055, "step": 8034 }, { "epoch": 1.64, "learning_rate": 0.00023020831036970983, "loss": 0.0114, "step": 8035 }, { "epoch": 1.64, "learning_rate": 0.00023019192852176821, "loss": 0.0285, "step": 8036 }, { "epoch": 1.64, "learning_rate": 0.00023017554533447002, "loss": 0.0026, "step": 8037 }, { "epoch": 1.64, "learning_rate": 0.00023015916080808892, "loss": 0.0226, "step": 8038 }, { "epoch": 1.64, "learning_rate": 0.0002301427749428985, "loss": 0.0069, "step": 8039 }, { "epoch": 1.64, "learning_rate": 0.0002301263877391725, "loss": 0.0091, "step": 8040 }, { "epoch": 1.64, "learning_rate": 0.0002301099991971845, "loss": 0.0085, "step": 8041 }, { "epoch": 1.64, "learning_rate": 0.00023009360931720832, "loss": 0.0226, "step": 8042 }, { "epoch": 1.64, "learning_rate": 0.00023007721809951767, "loss": 0.0382, "step": 8043 }, { "epoch": 1.64, "learning_rate": 0.00023006082554438633, "loss": 0.0383, "step": 8044 }, { "epoch": 1.64, "learning_rate": 0.0002300444316520881, "loss": 0.0113, "step": 8045 }, { "epoch": 1.64, "learning_rate": 0.00023002803642289675, "loss": 0.0111, "step": 8046 }, { "epoch": 1.64, "learning_rate": 0.00023001163985708612, "loss": 0.019, "step": 8047 }, { "epoch": 1.64, "learning_rate": 0.00022999524195493009, "loss": 0.0432, "step": 8048 }, { "epoch": 1.64, "learning_rate": 0.0002299788427167025, "loss": 0.0034, "step": 8049 }, { "epoch": 1.64, "learning_rate": 0.0002299624421426773, "loss": 0.0287, "step": 8050 }, { "epoch": 1.64, "learning_rate": 0.00022994604023312835, "loss": 0.0132, "step": 8051 }, { "epoch": 1.64, "learning_rate": 0.00022992963698832957, "loss": 0.0131, "step": 8052 }, { "epoch": 1.64, "learning_rate": 0.00022991323240855507, "loss": 0.0108, "step": 8053 }, { "epoch": 1.64, "learning_rate": 0.00022989682649407866, "loss": 0.0093, "step": 8054 }, { "epoch": 1.64, "learning_rate": 0.00022988041924517448, "loss": 0.0108, "step": 8055 }, { "epoch": 1.64, "learning_rate": 0.0002298640106621165, "loss": 0.0068, "step": 8056 }, { "epoch": 1.64, "learning_rate": 0.0002298476007451788, "loss": 0.0141, "step": 8057 }, { "epoch": 1.64, "learning_rate": 0.00022983118949463543, "loss": 0.0285, "step": 8058 }, { "epoch": 1.64, "learning_rate": 0.0002298147769107605, "loss": 0.0078, "step": 8059 }, { "epoch": 1.64, "learning_rate": 0.00022979836299382814, "loss": 0.0167, "step": 8060 }, { "epoch": 1.64, "learning_rate": 0.0002297819477441125, "loss": 0.0022, "step": 8061 }, { "epoch": 1.64, "learning_rate": 0.00022976553116188774, "loss": 0.0142, "step": 8062 }, { "epoch": 1.64, "learning_rate": 0.000229749113247428, "loss": 0.0092, "step": 8063 }, { "epoch": 1.64, "learning_rate": 0.00022973269400100753, "loss": 0.0181, "step": 8064 }, { "epoch": 1.64, "learning_rate": 0.0002297162734229006, "loss": 0.0366, "step": 8065 }, { "epoch": 1.64, "learning_rate": 0.00022969985151338138, "loss": 0.004, "step": 8066 }, { "epoch": 1.64, "learning_rate": 0.0002296834282727243, "loss": 0.0075, "step": 8067 }, { "epoch": 1.64, "learning_rate": 0.00022966700370120346, "loss": 0.0073, "step": 8068 }, { "epoch": 1.64, "learning_rate": 0.0002296505777990933, "loss": 0.0151, "step": 8069 }, { "epoch": 1.64, "learning_rate": 0.00022963415056666817, "loss": 0.0132, "step": 8070 }, { "epoch": 1.64, "learning_rate": 0.0002296177220042024, "loss": 0.0183, "step": 8071 }, { "epoch": 1.64, "learning_rate": 0.00022960129211197037, "loss": 0.0245, "step": 8072 }, { "epoch": 1.64, "learning_rate": 0.00022958486089024645, "loss": 0.0145, "step": 8073 }, { "epoch": 1.64, "learning_rate": 0.00022956842833930514, "loss": 0.0134, "step": 8074 }, { "epoch": 1.64, "learning_rate": 0.00022955199445942094, "loss": 0.0115, "step": 8075 }, { "epoch": 1.64, "learning_rate": 0.00022953555925086828, "loss": 0.0076, "step": 8076 }, { "epoch": 1.64, "learning_rate": 0.00022951912271392157, "loss": 0.0107, "step": 8077 }, { "epoch": 1.64, "learning_rate": 0.00022950268484885547, "loss": 0.0095, "step": 8078 }, { "epoch": 1.65, "learning_rate": 0.00022948624565594444, "loss": 0.0128, "step": 8079 }, { "epoch": 1.65, "learning_rate": 0.00022946980513546304, "loss": 0.006, "step": 8080 }, { "epoch": 1.65, "learning_rate": 0.00022945336328768592, "loss": 0.0083, "step": 8081 }, { "epoch": 1.65, "learning_rate": 0.00022943692011288765, "loss": 0.0042, "step": 8082 }, { "epoch": 1.65, "learning_rate": 0.00022942047561134288, "loss": 0.0137, "step": 8083 }, { "epoch": 1.65, "learning_rate": 0.0002294040297833262, "loss": 0.0042, "step": 8084 }, { "epoch": 1.65, "learning_rate": 0.00022938758262911236, "loss": 0.0353, "step": 8085 }, { "epoch": 1.65, "learning_rate": 0.00022937113414897602, "loss": 0.0097, "step": 8086 }, { "epoch": 1.65, "learning_rate": 0.00022935468434319198, "loss": 0.0028, "step": 8087 }, { "epoch": 1.65, "learning_rate": 0.00022933823321203483, "loss": 0.0088, "step": 8088 }, { "epoch": 1.65, "learning_rate": 0.00022932178075577947, "loss": 0.0079, "step": 8089 }, { "epoch": 1.65, "learning_rate": 0.00022930532697470067, "loss": 0.0024, "step": 8090 }, { "epoch": 1.65, "learning_rate": 0.00022928887186907316, "loss": 0.0143, "step": 8091 }, { "epoch": 1.65, "learning_rate": 0.00022927241543917184, "loss": 0.0164, "step": 8092 }, { "epoch": 1.65, "learning_rate": 0.00022925595768527157, "loss": 0.0057, "step": 8093 }, { "epoch": 1.65, "learning_rate": 0.00022923949860764717, "loss": 0.0048, "step": 8094 }, { "epoch": 1.65, "learning_rate": 0.00022922303820657356, "loss": 0.0494, "step": 8095 }, { "epoch": 1.65, "learning_rate": 0.0002292065764823257, "loss": 0.0104, "step": 8096 }, { "epoch": 1.65, "learning_rate": 0.00022919011343517848, "loss": 0.0109, "step": 8097 }, { "epoch": 1.65, "learning_rate": 0.00022917364906540689, "loss": 0.0308, "step": 8098 }, { "epoch": 1.65, "learning_rate": 0.00022915718337328592, "loss": 0.0038, "step": 8099 }, { "epoch": 1.65, "learning_rate": 0.00022914071635909058, "loss": 0.0083, "step": 8100 }, { "epoch": 1.65, "learning_rate": 0.0002291242480230958, "loss": 0.0407, "step": 8101 }, { "epoch": 1.65, "learning_rate": 0.00022910777836557679, "loss": 0.005, "step": 8102 }, { "epoch": 1.65, "learning_rate": 0.00022909130738680853, "loss": 0.0321, "step": 8103 }, { "epoch": 1.65, "learning_rate": 0.00022907483508706618, "loss": 0.0125, "step": 8104 }, { "epoch": 1.65, "learning_rate": 0.0002290583614666248, "loss": 0.0301, "step": 8105 }, { "epoch": 1.65, "learning_rate": 0.00022904188652575955, "loss": 0.0838, "step": 8106 }, { "epoch": 1.65, "learning_rate": 0.00022902541026474557, "loss": 0.0174, "step": 8107 }, { "epoch": 1.65, "learning_rate": 0.00022900893268385812, "loss": 0.0675, "step": 8108 }, { "epoch": 1.65, "learning_rate": 0.00022899245378337233, "loss": 0.0101, "step": 8109 }, { "epoch": 1.65, "learning_rate": 0.00022897597356356345, "loss": 0.0063, "step": 8110 }, { "epoch": 1.65, "learning_rate": 0.00022895949202470672, "loss": 0.0089, "step": 8111 }, { "epoch": 1.65, "learning_rate": 0.00022894300916707742, "loss": 0.0093, "step": 8112 }, { "epoch": 1.65, "learning_rate": 0.0002289265249909509, "loss": 0.0123, "step": 8113 }, { "epoch": 1.65, "learning_rate": 0.00022891003949660242, "loss": 0.0034, "step": 8114 }, { "epoch": 1.65, "learning_rate": 0.0002288935526843073, "loss": 0.029, "step": 8115 }, { "epoch": 1.65, "learning_rate": 0.00022887706455434087, "loss": 0.0369, "step": 8116 }, { "epoch": 1.65, "learning_rate": 0.00022886057510697867, "loss": 0.0051, "step": 8117 }, { "epoch": 1.65, "learning_rate": 0.00022884408434249598, "loss": 0.0061, "step": 8118 }, { "epoch": 1.65, "learning_rate": 0.00022882759226116825, "loss": 0.0141, "step": 8119 }, { "epoch": 1.65, "learning_rate": 0.00022881109886327086, "loss": 0.017, "step": 8120 }, { "epoch": 1.65, "learning_rate": 0.00022879460414907944, "loss": 0.0066, "step": 8121 }, { "epoch": 1.65, "learning_rate": 0.00022877810811886942, "loss": 0.0101, "step": 8122 }, { "epoch": 1.65, "learning_rate": 0.00022876161077291623, "loss": 0.0064, "step": 8123 }, { "epoch": 1.65, "learning_rate": 0.00022874511211149547, "loss": 0.0103, "step": 8124 }, { "epoch": 1.65, "learning_rate": 0.00022872861213488267, "loss": 0.0236, "step": 8125 }, { "epoch": 1.65, "learning_rate": 0.00022871211084335349, "loss": 0.0044, "step": 8126 }, { "epoch": 1.65, "learning_rate": 0.00022869560823718347, "loss": 0.018, "step": 8127 }, { "epoch": 1.66, "learning_rate": 0.00022867910431664823, "loss": 0.0327, "step": 8128 }, { "epoch": 1.66, "learning_rate": 0.0002286625990820234, "loss": 0.0209, "step": 8129 }, { "epoch": 1.66, "learning_rate": 0.00022864609253358474, "loss": 0.0093, "step": 8130 }, { "epoch": 1.66, "learning_rate": 0.00022862958467160786, "loss": 0.008, "step": 8131 }, { "epoch": 1.66, "learning_rate": 0.0002286130754963685, "loss": 0.0066, "step": 8132 }, { "epoch": 1.66, "learning_rate": 0.00022859656500814237, "loss": 0.0259, "step": 8133 }, { "epoch": 1.66, "learning_rate": 0.00022858005320720523, "loss": 0.0049, "step": 8134 }, { "epoch": 1.66, "learning_rate": 0.00022856354009383287, "loss": 0.0053, "step": 8135 }, { "epoch": 1.66, "learning_rate": 0.00022854702566830112, "loss": 0.0146, "step": 8136 }, { "epoch": 1.66, "learning_rate": 0.00022853050993088575, "loss": 0.0144, "step": 8137 }, { "epoch": 1.66, "learning_rate": 0.00022851399288186265, "loss": 0.0065, "step": 8138 }, { "epoch": 1.66, "learning_rate": 0.00022849747452150762, "loss": 0.0171, "step": 8139 }, { "epoch": 1.66, "learning_rate": 0.00022848095485009665, "loss": 0.0052, "step": 8140 }, { "epoch": 1.66, "learning_rate": 0.00022846443386790555, "loss": 0.0127, "step": 8141 }, { "epoch": 1.66, "learning_rate": 0.00022844791157521028, "loss": 0.0096, "step": 8142 }, { "epoch": 1.66, "learning_rate": 0.00022843138797228686, "loss": 0.0025, "step": 8143 }, { "epoch": 1.66, "learning_rate": 0.00022841486305941118, "loss": 0.0173, "step": 8144 }, { "epoch": 1.66, "learning_rate": 0.00022839833683685929, "loss": 0.0093, "step": 8145 }, { "epoch": 1.66, "learning_rate": 0.00022838180930490713, "loss": 0.0103, "step": 8146 }, { "epoch": 1.66, "learning_rate": 0.00022836528046383086, "loss": 0.0252, "step": 8147 }, { "epoch": 1.66, "learning_rate": 0.00022834875031390643, "loss": 0.0087, "step": 8148 }, { "epoch": 1.66, "learning_rate": 0.00022833221885541, "loss": 0.0153, "step": 8149 }, { "epoch": 1.66, "learning_rate": 0.0002283156860886177, "loss": 0.0157, "step": 8150 }, { "epoch": 1.66, "learning_rate": 0.00022829915201380555, "loss": 0.0171, "step": 8151 }, { "epoch": 1.66, "learning_rate": 0.00022828261663124976, "loss": 0.0116, "step": 8152 }, { "epoch": 1.66, "learning_rate": 0.00022826607994122654, "loss": 0.0169, "step": 8153 }, { "epoch": 1.66, "learning_rate": 0.00022824954194401205, "loss": 0.024, "step": 8154 }, { "epoch": 1.66, "learning_rate": 0.0002282330026398825, "loss": 0.0114, "step": 8155 }, { "epoch": 1.66, "learning_rate": 0.0002282164620291141, "loss": 0.0097, "step": 8156 }, { "epoch": 1.66, "learning_rate": 0.00022819992011198308, "loss": 0.0458, "step": 8157 }, { "epoch": 1.66, "learning_rate": 0.00022818337688876588, "loss": 0.0196, "step": 8158 }, { "epoch": 1.66, "learning_rate": 0.0002281668323597387, "loss": 0.0105, "step": 8159 }, { "epoch": 1.66, "learning_rate": 0.00022815028652517784, "loss": 0.021, "step": 8160 }, { "epoch": 1.66, "learning_rate": 0.00022813373938535968, "loss": 0.0071, "step": 8161 }, { "epoch": 1.66, "learning_rate": 0.00022811719094056057, "loss": 0.0207, "step": 8162 }, { "epoch": 1.66, "learning_rate": 0.00022810064119105694, "loss": 0.0228, "step": 8163 }, { "epoch": 1.66, "learning_rate": 0.0002280840901371252, "loss": 0.0063, "step": 8164 }, { "epoch": 1.66, "learning_rate": 0.0002280675377790417, "loss": 0.0145, "step": 8165 }, { "epoch": 1.66, "learning_rate": 0.000228050984117083, "loss": 0.005, "step": 8166 }, { "epoch": 1.66, "learning_rate": 0.00022803442915152552, "loss": 0.022, "step": 8167 }, { "epoch": 1.66, "learning_rate": 0.00022801787288264578, "loss": 0.0059, "step": 8168 }, { "epoch": 1.66, "learning_rate": 0.00022800131531072024, "loss": 0.0036, "step": 8169 }, { "epoch": 1.66, "learning_rate": 0.00022798475643602556, "loss": 0.0159, "step": 8170 }, { "epoch": 1.66, "learning_rate": 0.00022796819625883822, "loss": 0.0319, "step": 8171 }, { "epoch": 1.66, "learning_rate": 0.00022795163477943485, "loss": 0.0055, "step": 8172 }, { "epoch": 1.66, "learning_rate": 0.00022793507199809205, "loss": 0.013, "step": 8173 }, { "epoch": 1.66, "learning_rate": 0.00022791850791508637, "loss": 0.0028, "step": 8174 }, { "epoch": 1.66, "learning_rate": 0.00022790194253069455, "loss": 0.0243, "step": 8175 }, { "epoch": 1.66, "learning_rate": 0.00022788537584519326, "loss": 0.0305, "step": 8176 }, { "epoch": 1.66, "learning_rate": 0.00022786880785885915, "loss": 0.0143, "step": 8177 }, { "epoch": 1.67, "learning_rate": 0.000227852238571969, "loss": 0.0071, "step": 8178 }, { "epoch": 1.67, "learning_rate": 0.00022783566798479944, "loss": 0.0074, "step": 8179 }, { "epoch": 1.67, "learning_rate": 0.00022781909609762731, "loss": 0.0092, "step": 8180 }, { "epoch": 1.67, "learning_rate": 0.00022780252291072943, "loss": 0.0154, "step": 8181 }, { "epoch": 1.67, "learning_rate": 0.00022778594842438256, "loss": 0.0028, "step": 8182 }, { "epoch": 1.67, "learning_rate": 0.0002277693726388635, "loss": 0.0182, "step": 8183 }, { "epoch": 1.67, "learning_rate": 0.0002277527955544491, "loss": 0.0232, "step": 8184 }, { "epoch": 1.67, "learning_rate": 0.00022773621717141627, "loss": 0.0048, "step": 8185 }, { "epoch": 1.67, "learning_rate": 0.00022771963749004185, "loss": 0.037, "step": 8186 }, { "epoch": 1.67, "learning_rate": 0.0002277030565106028, "loss": 0.0038, "step": 8187 }, { "epoch": 1.67, "learning_rate": 0.000227686474233376, "loss": 0.0063, "step": 8188 }, { "epoch": 1.67, "learning_rate": 0.00022766989065863845, "loss": 0.0088, "step": 8189 }, { "epoch": 1.67, "learning_rate": 0.00022765330578666717, "loss": 0.02, "step": 8190 }, { "epoch": 1.67, "learning_rate": 0.00022763671961773907, "loss": 0.0122, "step": 8191 }, { "epoch": 1.67, "learning_rate": 0.00022762013215213116, "loss": 0.0127, "step": 8192 }, { "epoch": 1.67, "learning_rate": 0.00022760354339012055, "loss": 0.0149, "step": 8193 }, { "epoch": 1.67, "learning_rate": 0.0002275869533319843, "loss": 0.0057, "step": 8194 }, { "epoch": 1.67, "learning_rate": 0.00022757036197799943, "loss": 0.0157, "step": 8195 }, { "epoch": 1.67, "learning_rate": 0.00022755376932844315, "loss": 0.0063, "step": 8196 }, { "epoch": 1.67, "learning_rate": 0.00022753717538359246, "loss": 0.0182, "step": 8197 }, { "epoch": 1.67, "learning_rate": 0.00022752058014372464, "loss": 0.0128, "step": 8198 }, { "epoch": 1.67, "learning_rate": 0.00022750398360911676, "loss": 0.0391, "step": 8199 }, { "epoch": 1.67, "learning_rate": 0.00022748738578004605, "loss": 0.0099, "step": 8200 }, { "epoch": 1.67, "learning_rate": 0.00022747078665678975, "loss": 0.0185, "step": 8201 }, { "epoch": 1.67, "learning_rate": 0.0002274541862396251, "loss": 0.0289, "step": 8202 }, { "epoch": 1.67, "learning_rate": 0.0002274375845288293, "loss": 0.0052, "step": 8203 }, { "epoch": 1.67, "learning_rate": 0.00022742098152467964, "loss": 0.0106, "step": 8204 }, { "epoch": 1.67, "learning_rate": 0.00022740437722745355, "loss": 0.0106, "step": 8205 }, { "epoch": 1.67, "learning_rate": 0.00022738777163742815, "loss": 0.0068, "step": 8206 }, { "epoch": 1.67, "learning_rate": 0.00022737116475488094, "loss": 0.0064, "step": 8207 }, { "epoch": 1.67, "learning_rate": 0.00022735455658008915, "loss": 0.0185, "step": 8208 }, { "epoch": 1.67, "learning_rate": 0.00022733794711333034, "loss": 0.0047, "step": 8209 }, { "epoch": 1.67, "learning_rate": 0.00022732133635488177, "loss": 0.0181, "step": 8210 }, { "epoch": 1.67, "learning_rate": 0.00022730472430502094, "loss": 0.0039, "step": 8211 }, { "epoch": 1.67, "learning_rate": 0.0002272881109640253, "loss": 0.0184, "step": 8212 }, { "epoch": 1.67, "learning_rate": 0.0002272714963321723, "loss": 0.0145, "step": 8213 }, { "epoch": 1.67, "learning_rate": 0.00022725488040973947, "loss": 0.0109, "step": 8214 }, { "epoch": 1.67, "learning_rate": 0.0002272382631970043, "loss": 0.0084, "step": 8215 }, { "epoch": 1.67, "learning_rate": 0.00022722164469424436, "loss": 0.0069, "step": 8216 }, { "epoch": 1.67, "learning_rate": 0.00022720502490173718, "loss": 0.0104, "step": 8217 }, { "epoch": 1.67, "learning_rate": 0.0002271884038197603, "loss": 0.0197, "step": 8218 }, { "epoch": 1.67, "learning_rate": 0.00022717178144859146, "loss": 0.0264, "step": 8219 }, { "epoch": 1.67, "learning_rate": 0.0002271551577885081, "loss": 0.0068, "step": 8220 }, { "epoch": 1.67, "learning_rate": 0.00022713853283978802, "loss": 0.0103, "step": 8221 }, { "epoch": 1.67, "learning_rate": 0.00022712190660270884, "loss": 0.0238, "step": 8222 }, { "epoch": 1.67, "learning_rate": 0.00022710527907754822, "loss": 0.0206, "step": 8223 }, { "epoch": 1.67, "learning_rate": 0.00022708865026458392, "loss": 0.0028, "step": 8224 }, { "epoch": 1.67, "learning_rate": 0.00022707202016409363, "loss": 0.0137, "step": 8225 }, { "epoch": 1.67, "learning_rate": 0.0002270553887763551, "loss": 0.0058, "step": 8226 }, { "epoch": 1.68, "learning_rate": 0.00022703875610164613, "loss": 0.0056, "step": 8227 }, { "epoch": 1.68, "learning_rate": 0.00022702212214024454, "loss": 0.0145, "step": 8228 }, { "epoch": 1.68, "learning_rate": 0.0002270054868924281, "loss": 0.0252, "step": 8229 }, { "epoch": 1.68, "learning_rate": 0.00022698885035847465, "loss": 0.0125, "step": 8230 }, { "epoch": 1.68, "learning_rate": 0.0002269722125386621, "loss": 0.021, "step": 8231 }, { "epoch": 1.68, "learning_rate": 0.00022695557343326827, "loss": 0.0096, "step": 8232 }, { "epoch": 1.68, "learning_rate": 0.00022693893304257117, "loss": 0.0101, "step": 8233 }, { "epoch": 1.68, "learning_rate": 0.00022692229136684862, "loss": 0.0131, "step": 8234 }, { "epoch": 1.68, "learning_rate": 0.0002269056484063786, "loss": 0.0119, "step": 8235 }, { "epoch": 1.68, "learning_rate": 0.00022688900416143905, "loss": 0.0064, "step": 8236 }, { "epoch": 1.68, "learning_rate": 0.00022687235863230805, "loss": 0.0207, "step": 8237 }, { "epoch": 1.68, "learning_rate": 0.00022685571181926354, "loss": 0.009, "step": 8238 }, { "epoch": 1.68, "learning_rate": 0.00022683906372258355, "loss": 0.0107, "step": 8239 }, { "epoch": 1.68, "learning_rate": 0.00022682241434254614, "loss": 0.0059, "step": 8240 }, { "epoch": 1.68, "learning_rate": 0.00022680576367942938, "loss": 0.0199, "step": 8241 }, { "epoch": 1.68, "learning_rate": 0.00022678911173351144, "loss": 0.0161, "step": 8242 }, { "epoch": 1.68, "learning_rate": 0.00022677245850507037, "loss": 0.015, "step": 8243 }, { "epoch": 1.68, "learning_rate": 0.0002267558039943843, "loss": 0.006, "step": 8244 }, { "epoch": 1.68, "learning_rate": 0.00022673914820173146, "loss": 0.0104, "step": 8245 }, { "epoch": 1.68, "learning_rate": 0.00022672249112738995, "loss": 0.0157, "step": 8246 }, { "epoch": 1.68, "learning_rate": 0.00022670583277163809, "loss": 0.0203, "step": 8247 }, { "epoch": 1.68, "learning_rate": 0.00022668917313475393, "loss": 0.0045, "step": 8248 }, { "epoch": 1.68, "learning_rate": 0.00022667251221701587, "loss": 0.0168, "step": 8249 }, { "epoch": 1.68, "learning_rate": 0.00022665585001870208, "loss": 0.0109, "step": 8250 }, { "epoch": 1.68, "learning_rate": 0.00022663918654009093, "loss": 0.0335, "step": 8251 }, { "epoch": 1.68, "learning_rate": 0.00022662252178146073, "loss": 0.0207, "step": 8252 }, { "epoch": 1.68, "learning_rate": 0.0002266058557430897, "loss": 0.0037, "step": 8253 }, { "epoch": 1.68, "learning_rate": 0.00022658918842525632, "loss": 0.0157, "step": 8254 }, { "epoch": 1.68, "learning_rate": 0.00022657251982823894, "loss": 0.0106, "step": 8255 }, { "epoch": 1.68, "learning_rate": 0.00022655584995231594, "loss": 0.0211, "step": 8256 }, { "epoch": 1.68, "learning_rate": 0.00022653917879776573, "loss": 0.0169, "step": 8257 }, { "epoch": 1.68, "learning_rate": 0.00022652250636486673, "loss": 0.0161, "step": 8258 }, { "epoch": 1.68, "learning_rate": 0.00022650583265389744, "loss": 0.0298, "step": 8259 }, { "epoch": 1.68, "learning_rate": 0.0002264891576651363, "loss": 0.0256, "step": 8260 }, { "epoch": 1.68, "learning_rate": 0.0002264724813988619, "loss": 0.0041, "step": 8261 }, { "epoch": 1.68, "learning_rate": 0.00022645580385535267, "loss": 0.0252, "step": 8262 }, { "epoch": 1.68, "learning_rate": 0.00022643912503488722, "loss": 0.011, "step": 8263 }, { "epoch": 1.68, "learning_rate": 0.0002264224449377441, "loss": 0.0125, "step": 8264 }, { "epoch": 1.68, "learning_rate": 0.00022640576356420186, "loss": 0.005, "step": 8265 }, { "epoch": 1.68, "learning_rate": 0.00022638908091453917, "loss": 0.0269, "step": 8266 }, { "epoch": 1.68, "learning_rate": 0.00022637239698903463, "loss": 0.0046, "step": 8267 }, { "epoch": 1.68, "learning_rate": 0.00022635571178796686, "loss": 0.0194, "step": 8268 }, { "epoch": 1.68, "learning_rate": 0.0002263390253116146, "loss": 0.0083, "step": 8269 }, { "epoch": 1.68, "learning_rate": 0.00022632233756025654, "loss": 0.0104, "step": 8270 }, { "epoch": 1.68, "learning_rate": 0.0002263056485341713, "loss": 0.0052, "step": 8271 }, { "epoch": 1.68, "learning_rate": 0.00022628895823363775, "loss": 0.0122, "step": 8272 }, { "epoch": 1.68, "learning_rate": 0.0002262722666589346, "loss": 0.0132, "step": 8273 }, { "epoch": 1.68, "learning_rate": 0.00022625557381034057, "loss": 0.009, "step": 8274 }, { "epoch": 1.68, "learning_rate": 0.0002262388796881346, "loss": 0.0067, "step": 8275 }, { "epoch": 1.69, "learning_rate": 0.0002262221842925954, "loss": 0.0229, "step": 8276 }, { "epoch": 1.69, "learning_rate": 0.0002262054876240018, "loss": 0.0068, "step": 8277 }, { "epoch": 1.69, "learning_rate": 0.00022618878968263273, "loss": 0.0214, "step": 8278 }, { "epoch": 1.69, "learning_rate": 0.00022617209046876707, "loss": 0.0099, "step": 8279 }, { "epoch": 1.69, "learning_rate": 0.0002261553899826837, "loss": 0.046, "step": 8280 }, { "epoch": 1.69, "learning_rate": 0.00022613868822466155, "loss": 0.0289, "step": 8281 }, { "epoch": 1.69, "learning_rate": 0.0002261219851949796, "loss": 0.0208, "step": 8282 }, { "epoch": 1.69, "learning_rate": 0.0002261052808939168, "loss": 0.0125, "step": 8283 }, { "epoch": 1.69, "learning_rate": 0.00022608857532175215, "loss": 0.0163, "step": 8284 }, { "epoch": 1.69, "learning_rate": 0.0002260718684787647, "loss": 0.0057, "step": 8285 }, { "epoch": 1.69, "learning_rate": 0.0002260551603652334, "loss": 0.0104, "step": 8286 }, { "epoch": 1.69, "learning_rate": 0.00022603845098143738, "loss": 0.0114, "step": 8287 }, { "epoch": 1.69, "learning_rate": 0.00022602174032765573, "loss": 0.0083, "step": 8288 }, { "epoch": 1.69, "learning_rate": 0.00022600502840416746, "loss": 0.0187, "step": 8289 }, { "epoch": 1.69, "learning_rate": 0.00022598831521125176, "loss": 0.0403, "step": 8290 }, { "epoch": 1.69, "learning_rate": 0.00022597160074918778, "loss": 0.0094, "step": 8291 }, { "epoch": 1.69, "learning_rate": 0.00022595488501825464, "loss": 0.0045, "step": 8292 }, { "epoch": 1.69, "learning_rate": 0.00022593816801873151, "loss": 0.0071, "step": 8293 }, { "epoch": 1.69, "learning_rate": 0.0002259214497508977, "loss": 0.0234, "step": 8294 }, { "epoch": 1.69, "learning_rate": 0.00022590473021503235, "loss": 0.0278, "step": 8295 }, { "epoch": 1.69, "learning_rate": 0.00022588800941141473, "loss": 0.0289, "step": 8296 }, { "epoch": 1.69, "learning_rate": 0.00022587128734032405, "loss": 0.02, "step": 8297 }, { "epoch": 1.69, "learning_rate": 0.00022585456400203973, "loss": 0.0069, "step": 8298 }, { "epoch": 1.69, "learning_rate": 0.00022583783939684096, "loss": 0.0089, "step": 8299 }, { "epoch": 1.69, "learning_rate": 0.00022582111352500712, "loss": 0.0362, "step": 8300 }, { "epoch": 1.69, "learning_rate": 0.00022580438638681756, "loss": 0.0104, "step": 8301 }, { "epoch": 1.69, "learning_rate": 0.00022578765798255166, "loss": 0.0053, "step": 8302 }, { "epoch": 1.69, "learning_rate": 0.00022577092831248884, "loss": 0.0114, "step": 8303 }, { "epoch": 1.69, "learning_rate": 0.00022575419737690843, "loss": 0.0121, "step": 8304 }, { "epoch": 1.69, "learning_rate": 0.00022573746517609, "loss": 0.004, "step": 8305 }, { "epoch": 1.69, "learning_rate": 0.00022572073171031286, "loss": 0.0148, "step": 8306 }, { "epoch": 1.69, "learning_rate": 0.00022570399697985667, "loss": 0.0025, "step": 8307 }, { "epoch": 1.69, "learning_rate": 0.00022568726098500072, "loss": 0.0265, "step": 8308 }, { "epoch": 1.69, "learning_rate": 0.00022567052372602473, "loss": 0.0129, "step": 8309 }, { "epoch": 1.69, "learning_rate": 0.0002256537852032081, "loss": 0.0258, "step": 8310 }, { "epoch": 1.69, "learning_rate": 0.00022563704541683045, "loss": 0.0033, "step": 8311 }, { "epoch": 1.69, "learning_rate": 0.00022562030436717138, "loss": 0.012, "step": 8312 }, { "epoch": 1.69, "learning_rate": 0.00022560356205451047, "loss": 0.0081, "step": 8313 }, { "epoch": 1.69, "learning_rate": 0.00022558681847912736, "loss": 0.0106, "step": 8314 }, { "epoch": 1.69, "learning_rate": 0.0002255700736413017, "loss": 0.0076, "step": 8315 }, { "epoch": 1.69, "learning_rate": 0.00022555332754131322, "loss": 0.0086, "step": 8316 }, { "epoch": 1.69, "learning_rate": 0.00022553658017944152, "loss": 0.0089, "step": 8317 }, { "epoch": 1.69, "learning_rate": 0.00022551983155596634, "loss": 0.0205, "step": 8318 }, { "epoch": 1.69, "learning_rate": 0.00022550308167116741, "loss": 0.0064, "step": 8319 }, { "epoch": 1.69, "learning_rate": 0.00022548633052532448, "loss": 0.019, "step": 8320 }, { "epoch": 1.69, "learning_rate": 0.00022546957811871743, "loss": 0.0148, "step": 8321 }, { "epoch": 1.69, "learning_rate": 0.00022545282445162585, "loss": 0.0173, "step": 8322 }, { "epoch": 1.69, "learning_rate": 0.00022543606952432974, "loss": 0.0027, "step": 8323 }, { "epoch": 1.69, "learning_rate": 0.00022541931333710881, "loss": 0.0072, "step": 8324 }, { "epoch": 1.7, "learning_rate": 0.00022540255589024305, "loss": 0.0131, "step": 8325 }, { "epoch": 1.7, "learning_rate": 0.00022538579718401223, "loss": 0.0084, "step": 8326 }, { "epoch": 1.7, "learning_rate": 0.00022536903721869634, "loss": 0.0124, "step": 8327 }, { "epoch": 1.7, "learning_rate": 0.0002253522759945752, "loss": 0.0367, "step": 8328 }, { "epoch": 1.7, "learning_rate": 0.0002253355135119289, "loss": 0.0203, "step": 8329 }, { "epoch": 1.7, "learning_rate": 0.00022531874977103726, "loss": 0.0061, "step": 8330 }, { "epoch": 1.7, "learning_rate": 0.00022530198477218035, "loss": 0.002, "step": 8331 }, { "epoch": 1.7, "learning_rate": 0.00022528521851563813, "loss": 0.0173, "step": 8332 }, { "epoch": 1.7, "learning_rate": 0.00022526845100169068, "loss": 0.0185, "step": 8333 }, { "epoch": 1.7, "learning_rate": 0.00022525168223061796, "loss": 0.0075, "step": 8334 }, { "epoch": 1.7, "learning_rate": 0.00022523491220270017, "loss": 0.0035, "step": 8335 }, { "epoch": 1.7, "learning_rate": 0.00022521814091821724, "loss": 0.0143, "step": 8336 }, { "epoch": 1.7, "learning_rate": 0.00022520136837744944, "loss": 0.0161, "step": 8337 }, { "epoch": 1.7, "learning_rate": 0.0002251845945806768, "loss": 0.0445, "step": 8338 }, { "epoch": 1.7, "learning_rate": 0.0002251678195281796, "loss": 0.0112, "step": 8339 }, { "epoch": 1.7, "learning_rate": 0.0002251510432202378, "loss": 0.0218, "step": 8340 }, { "epoch": 1.7, "learning_rate": 0.0002251342656571318, "loss": 0.0075, "step": 8341 }, { "epoch": 1.7, "learning_rate": 0.00022511748683914172, "loss": 0.0142, "step": 8342 }, { "epoch": 1.7, "learning_rate": 0.0002251007067665478, "loss": 0.0111, "step": 8343 }, { "epoch": 1.7, "learning_rate": 0.0002250839254396303, "loss": 0.0219, "step": 8344 }, { "epoch": 1.7, "learning_rate": 0.00022506714285866955, "loss": 0.0025, "step": 8345 }, { "epoch": 1.7, "learning_rate": 0.00022505035902394582, "loss": 0.0031, "step": 8346 }, { "epoch": 1.7, "learning_rate": 0.0002250335739357394, "loss": 0.0057, "step": 8347 }, { "epoch": 1.7, "learning_rate": 0.00022501678759433063, "loss": 0.0176, "step": 8348 }, { "epoch": 1.7, "learning_rate": 0.000225, "loss": 0.03, "step": 8349 }, { "epoch": 1.7, "learning_rate": 0.00022498321115302773, "loss": 0.0104, "step": 8350 }, { "epoch": 1.7, "learning_rate": 0.0002249664210536943, "loss": 0.0102, "step": 8351 }, { "epoch": 1.7, "learning_rate": 0.00022494962970228012, "loss": 0.0022, "step": 8352 }, { "epoch": 1.7, "learning_rate": 0.0002249328370990657, "loss": 0.0086, "step": 8353 }, { "epoch": 1.7, "learning_rate": 0.00022491604324433137, "loss": 0.0095, "step": 8354 }, { "epoch": 1.7, "learning_rate": 0.00022489924813835774, "loss": 0.0099, "step": 8355 }, { "epoch": 1.7, "learning_rate": 0.00022488245178142526, "loss": 0.026, "step": 8356 }, { "epoch": 1.7, "learning_rate": 0.00022486565417381455, "loss": 0.015, "step": 8357 }, { "epoch": 1.7, "learning_rate": 0.0002248488553158061, "loss": 0.0176, "step": 8358 }, { "epoch": 1.7, "learning_rate": 0.00022483205520768045, "loss": 0.0043, "step": 8359 }, { "epoch": 1.7, "learning_rate": 0.0002248152538497182, "loss": 0.0161, "step": 8360 }, { "epoch": 1.7, "learning_rate": 0.0002247984512422, "loss": 0.0089, "step": 8361 }, { "epoch": 1.7, "learning_rate": 0.00022478164738540642, "loss": 0.0067, "step": 8362 }, { "epoch": 1.7, "learning_rate": 0.00022476484227961828, "loss": 0.0145, "step": 8363 }, { "epoch": 1.7, "learning_rate": 0.00022474803592511608, "loss": 0.0053, "step": 8364 }, { "epoch": 1.7, "learning_rate": 0.00022473122832218054, "loss": 0.0168, "step": 8365 }, { "epoch": 1.7, "learning_rate": 0.0002247144194710925, "loss": 0.0334, "step": 8366 }, { "epoch": 1.7, "learning_rate": 0.0002246976093721326, "loss": 0.0181, "step": 8367 }, { "epoch": 1.7, "learning_rate": 0.0002246807980255816, "loss": 0.0065, "step": 8368 }, { "epoch": 1.7, "learning_rate": 0.00022466398543172033, "loss": 0.0039, "step": 8369 }, { "epoch": 1.7, "learning_rate": 0.00022464717159082954, "loss": 0.0108, "step": 8370 }, { "epoch": 1.7, "learning_rate": 0.00022463035650319008, "loss": 0.0113, "step": 8371 }, { "epoch": 1.7, "learning_rate": 0.00022461354016908283, "loss": 0.018, "step": 8372 }, { "epoch": 1.7, "learning_rate": 0.0002245967225887886, "loss": 0.0333, "step": 8373 }, { "epoch": 1.71, "learning_rate": 0.00022457990376258826, "loss": 0.0082, "step": 8374 }, { "epoch": 1.71, "learning_rate": 0.00022456308369076276, "loss": 0.0172, "step": 8375 }, { "epoch": 1.71, "learning_rate": 0.00022454626237359301, "loss": 0.0074, "step": 8376 }, { "epoch": 1.71, "learning_rate": 0.00022452943981136, "loss": 0.005, "step": 8377 }, { "epoch": 1.71, "learning_rate": 0.0002245126160043446, "loss": 0.0009, "step": 8378 }, { "epoch": 1.71, "learning_rate": 0.0002244957909528279, "loss": 0.0113, "step": 8379 }, { "epoch": 1.71, "learning_rate": 0.00022447896465709088, "loss": 0.0329, "step": 8380 }, { "epoch": 1.71, "learning_rate": 0.00022446213711741454, "loss": 0.0134, "step": 8381 }, { "epoch": 1.71, "learning_rate": 0.00022444530833407999, "loss": 0.0106, "step": 8382 }, { "epoch": 1.71, "learning_rate": 0.0002244284783073682, "loss": 0.0613, "step": 8383 }, { "epoch": 1.71, "learning_rate": 0.00022441164703756037, "loss": 0.0171, "step": 8384 }, { "epoch": 1.71, "learning_rate": 0.00022439481452493756, "loss": 0.023, "step": 8385 }, { "epoch": 1.71, "learning_rate": 0.00022437798076978092, "loss": 0.0126, "step": 8386 }, { "epoch": 1.71, "learning_rate": 0.0002243611457723716, "loss": 0.0038, "step": 8387 }, { "epoch": 1.71, "learning_rate": 0.00022434430953299078, "loss": 0.015, "step": 8388 }, { "epoch": 1.71, "learning_rate": 0.00022432747205191966, "loss": 0.0063, "step": 8389 }, { "epoch": 1.71, "learning_rate": 0.00022431063332943948, "loss": 0.0127, "step": 8390 }, { "epoch": 1.71, "learning_rate": 0.00022429379336583145, "loss": 0.0088, "step": 8391 }, { "epoch": 1.71, "learning_rate": 0.00022427695216137677, "loss": 0.0353, "step": 8392 }, { "epoch": 1.71, "learning_rate": 0.00022426010971635682, "loss": 0.0013, "step": 8393 }, { "epoch": 1.71, "learning_rate": 0.00022424326603105287, "loss": 0.0088, "step": 8394 }, { "epoch": 1.71, "learning_rate": 0.00022422642110574622, "loss": 0.0133, "step": 8395 }, { "epoch": 1.71, "learning_rate": 0.00022420957494071822, "loss": 0.0349, "step": 8396 }, { "epoch": 1.71, "learning_rate": 0.00022419272753625025, "loss": 0.0106, "step": 8397 }, { "epoch": 1.71, "learning_rate": 0.00022417587889262368, "loss": 0.0126, "step": 8398 }, { "epoch": 1.71, "learning_rate": 0.00022415902901011991, "loss": 0.0138, "step": 8399 }, { "epoch": 1.71, "learning_rate": 0.0002241421778890204, "loss": 0.013, "step": 8400 }, { "epoch": 1.71, "learning_rate": 0.0002241253255296065, "loss": 0.0298, "step": 8401 }, { "epoch": 1.71, "learning_rate": 0.00022410847193215982, "loss": 0.0049, "step": 8402 }, { "epoch": 1.71, "learning_rate": 0.0002240916170969617, "loss": 0.0124, "step": 8403 }, { "epoch": 1.71, "learning_rate": 0.0002240747610242938, "loss": 0.0105, "step": 8404 }, { "epoch": 1.71, "learning_rate": 0.0002240579037144375, "loss": 0.0182, "step": 8405 }, { "epoch": 1.71, "learning_rate": 0.00022404104516767442, "loss": 0.0057, "step": 8406 }, { "epoch": 1.71, "learning_rate": 0.0002240241853842861, "loss": 0.0083, "step": 8407 }, { "epoch": 1.71, "learning_rate": 0.00022400732436455418, "loss": 0.0175, "step": 8408 }, { "epoch": 1.71, "learning_rate": 0.00022399046210876028, "loss": 0.0481, "step": 8409 }, { "epoch": 1.71, "learning_rate": 0.00022397359861718596, "loss": 0.0072, "step": 8410 }, { "epoch": 1.71, "learning_rate": 0.00022395673389011291, "loss": 0.016, "step": 8411 }, { "epoch": 1.71, "learning_rate": 0.0002239398679278228, "loss": 0.0064, "step": 8412 }, { "epoch": 1.71, "learning_rate": 0.00022392300073059736, "loss": 0.0194, "step": 8413 }, { "epoch": 1.71, "learning_rate": 0.0002239061322987182, "loss": 0.0078, "step": 8414 }, { "epoch": 1.71, "learning_rate": 0.00022388926263246716, "loss": 0.0222, "step": 8415 }, { "epoch": 1.71, "learning_rate": 0.000223872391732126, "loss": 0.0012, "step": 8416 }, { "epoch": 1.71, "learning_rate": 0.0002238555195979764, "loss": 0.0263, "step": 8417 }, { "epoch": 1.71, "learning_rate": 0.0002238386462303002, "loss": 0.0226, "step": 8418 }, { "epoch": 1.71, "learning_rate": 0.00022382177162937923, "loss": 0.018, "step": 8419 }, { "epoch": 1.71, "learning_rate": 0.00022380489579549534, "loss": 0.0215, "step": 8420 }, { "epoch": 1.71, "learning_rate": 0.00022378801872893037, "loss": 0.0161, "step": 8421 }, { "epoch": 1.71, "learning_rate": 0.00022377114042996624, "loss": 0.0082, "step": 8422 }, { "epoch": 1.72, "learning_rate": 0.0002237542608988848, "loss": 0.0075, "step": 8423 }, { "epoch": 1.72, "learning_rate": 0.00022373738013596793, "loss": 0.0038, "step": 8424 }, { "epoch": 1.72, "learning_rate": 0.00022372049814149768, "loss": 0.005, "step": 8425 }, { "epoch": 1.72, "learning_rate": 0.00022370361491575594, "loss": 0.0193, "step": 8426 }, { "epoch": 1.72, "learning_rate": 0.0002236867304590247, "loss": 0.0076, "step": 8427 }, { "epoch": 1.72, "learning_rate": 0.00022366984477158592, "loss": 0.017, "step": 8428 }, { "epoch": 1.72, "learning_rate": 0.00022365295785372176, "loss": 0.0123, "step": 8429 }, { "epoch": 1.72, "learning_rate": 0.0002236360697057141, "loss": 0.0112, "step": 8430 }, { "epoch": 1.72, "learning_rate": 0.00022361918032784512, "loss": 0.0663, "step": 8431 }, { "epoch": 1.72, "learning_rate": 0.00022360228972039686, "loss": 0.0047, "step": 8432 }, { "epoch": 1.72, "learning_rate": 0.0002235853978836514, "loss": 0.0124, "step": 8433 }, { "epoch": 1.72, "learning_rate": 0.0002235685048178909, "loss": 0.0046, "step": 8434 }, { "epoch": 1.72, "learning_rate": 0.00022355161052339752, "loss": 0.0066, "step": 8435 }, { "epoch": 1.72, "learning_rate": 0.00022353471500045338, "loss": 0.0104, "step": 8436 }, { "epoch": 1.72, "learning_rate": 0.00022351781824934072, "loss": 0.0382, "step": 8437 }, { "epoch": 1.72, "learning_rate": 0.00022350092027034169, "loss": 0.0212, "step": 8438 }, { "epoch": 1.72, "learning_rate": 0.00022348402106373857, "loss": 0.0029, "step": 8439 }, { "epoch": 1.72, "learning_rate": 0.00022346712062981357, "loss": 0.0269, "step": 8440 }, { "epoch": 1.72, "learning_rate": 0.00022345021896884903, "loss": 0.0222, "step": 8441 }, { "epoch": 1.72, "learning_rate": 0.00022343331608112713, "loss": 0.0019, "step": 8442 }, { "epoch": 1.72, "learning_rate": 0.00022341641196693026, "loss": 0.0152, "step": 8443 }, { "epoch": 1.72, "learning_rate": 0.0002233995066265407, "loss": 0.0105, "step": 8444 }, { "epoch": 1.72, "learning_rate": 0.00022338260006024086, "loss": 0.0084, "step": 8445 }, { "epoch": 1.72, "learning_rate": 0.0002233656922683131, "loss": 0.0285, "step": 8446 }, { "epoch": 1.72, "learning_rate": 0.00022334878325103974, "loss": 0.0074, "step": 8447 }, { "epoch": 1.72, "learning_rate": 0.00022333187300870323, "loss": 0.012, "step": 8448 }, { "epoch": 1.72, "learning_rate": 0.00022331496154158606, "loss": 0.0339, "step": 8449 }, { "epoch": 1.72, "learning_rate": 0.00022329804884997065, "loss": 0.0167, "step": 8450 }, { "epoch": 1.72, "learning_rate": 0.00022328113493413944, "loss": 0.0094, "step": 8451 }, { "epoch": 1.72, "learning_rate": 0.00022326421979437496, "loss": 0.011, "step": 8452 }, { "epoch": 1.72, "learning_rate": 0.00022324730343095968, "loss": 0.0042, "step": 8453 }, { "epoch": 1.72, "learning_rate": 0.00022323038584417618, "loss": 0.0216, "step": 8454 }, { "epoch": 1.72, "learning_rate": 0.00022321346703430705, "loss": 0.0051, "step": 8455 }, { "epoch": 1.72, "learning_rate": 0.00022319654700163482, "loss": 0.0216, "step": 8456 }, { "epoch": 1.72, "learning_rate": 0.00022317962574644205, "loss": 0.029, "step": 8457 }, { "epoch": 1.72, "learning_rate": 0.0002231627032690114, "loss": 0.0085, "step": 8458 }, { "epoch": 1.72, "learning_rate": 0.00022314577956962547, "loss": 0.0109, "step": 8459 }, { "epoch": 1.72, "learning_rate": 0.000223128854648567, "loss": 0.0133, "step": 8460 }, { "epoch": 1.72, "learning_rate": 0.00022311192850611858, "loss": 0.0061, "step": 8461 }, { "epoch": 1.72, "learning_rate": 0.00022309500114256296, "loss": 0.0192, "step": 8462 }, { "epoch": 1.72, "learning_rate": 0.00022307807255818283, "loss": 0.0115, "step": 8463 }, { "epoch": 1.72, "learning_rate": 0.00022306114275326102, "loss": 0.0231, "step": 8464 }, { "epoch": 1.72, "learning_rate": 0.00022304421172808012, "loss": 0.0064, "step": 8465 }, { "epoch": 1.72, "learning_rate": 0.00022302727948292304, "loss": 0.0189, "step": 8466 }, { "epoch": 1.72, "learning_rate": 0.00022301034601807253, "loss": 0.0329, "step": 8467 }, { "epoch": 1.72, "learning_rate": 0.00022299341133381144, "loss": 0.0139, "step": 8468 }, { "epoch": 1.72, "learning_rate": 0.0002229764754304226, "loss": 0.0056, "step": 8469 }, { "epoch": 1.72, "learning_rate": 0.00022295953830818885, "loss": 0.0099, "step": 8470 }, { "epoch": 1.72, "learning_rate": 0.00022294259996739308, "loss": 0.0153, "step": 8471 }, { "epoch": 1.73, "learning_rate": 0.0002229256604083182, "loss": 0.0105, "step": 8472 }, { "epoch": 1.73, "learning_rate": 0.00022290871963124719, "loss": 0.0077, "step": 8473 }, { "epoch": 1.73, "learning_rate": 0.00022289177763646292, "loss": 0.0077, "step": 8474 }, { "epoch": 1.73, "learning_rate": 0.00022287483442424833, "loss": 0.0134, "step": 8475 }, { "epoch": 1.73, "learning_rate": 0.0002228578899948865, "loss": 0.0183, "step": 8476 }, { "epoch": 1.73, "learning_rate": 0.00022284094434866033, "loss": 0.0051, "step": 8477 }, { "epoch": 1.73, "learning_rate": 0.00022282399748585293, "loss": 0.0225, "step": 8478 }, { "epoch": 1.73, "learning_rate": 0.00022280704940674722, "loss": 0.0356, "step": 8479 }, { "epoch": 1.73, "learning_rate": 0.0002227901001116264, "loss": 0.0026, "step": 8480 }, { "epoch": 1.73, "learning_rate": 0.00022277314960077356, "loss": 0.0105, "step": 8481 }, { "epoch": 1.73, "learning_rate": 0.0002227561978744717, "loss": 0.0085, "step": 8482 }, { "epoch": 1.73, "learning_rate": 0.00022273924493300404, "loss": 0.0011, "step": 8483 }, { "epoch": 1.73, "learning_rate": 0.00022272229077665366, "loss": 0.0041, "step": 8484 }, { "epoch": 1.73, "learning_rate": 0.00022270533540570374, "loss": 0.0053, "step": 8485 }, { "epoch": 1.73, "learning_rate": 0.00022268837882043747, "loss": 0.0127, "step": 8486 }, { "epoch": 1.73, "learning_rate": 0.0002226714210211381, "loss": 0.0219, "step": 8487 }, { "epoch": 1.73, "learning_rate": 0.00022265446200808882, "loss": 0.0171, "step": 8488 }, { "epoch": 1.73, "learning_rate": 0.00022263750178157284, "loss": 0.0221, "step": 8489 }, { "epoch": 1.73, "learning_rate": 0.0002226205403418735, "loss": 0.0125, "step": 8490 }, { "epoch": 1.73, "learning_rate": 0.000222603577689274, "loss": 0.0192, "step": 8491 }, { "epoch": 1.73, "learning_rate": 0.0002225866138240578, "loss": 0.0257, "step": 8492 }, { "epoch": 1.73, "learning_rate": 0.00022256964874650808, "loss": 0.0165, "step": 8493 }, { "epoch": 1.73, "learning_rate": 0.00022255268245690825, "loss": 0.0083, "step": 8494 }, { "epoch": 1.73, "learning_rate": 0.00022253571495554165, "loss": 0.0323, "step": 8495 }, { "epoch": 1.73, "learning_rate": 0.0002225187462426917, "loss": 0.0129, "step": 8496 }, { "epoch": 1.73, "learning_rate": 0.0002225017763186418, "loss": 0.0185, "step": 8497 }, { "epoch": 1.73, "learning_rate": 0.00022248480518367538, "loss": 0.0119, "step": 8498 }, { "epoch": 1.73, "learning_rate": 0.00022246783283807588, "loss": 0.0122, "step": 8499 }, { "epoch": 1.73, "learning_rate": 0.00022245085928212678, "loss": 0.0138, "step": 8500 }, { "epoch": 1.73, "learning_rate": 0.00022243388451611158, "loss": 0.0046, "step": 8501 }, { "epoch": 1.73, "learning_rate": 0.00022241690854031378, "loss": 0.0018, "step": 8502 }, { "epoch": 1.73, "learning_rate": 0.0002223999313550169, "loss": 0.0338, "step": 8503 }, { "epoch": 1.73, "learning_rate": 0.00022238295296050453, "loss": 0.0098, "step": 8504 }, { "epoch": 1.73, "learning_rate": 0.00022236597335706016, "loss": 0.016, "step": 8505 }, { "epoch": 1.73, "learning_rate": 0.0002223489925449675, "loss": 0.0226, "step": 8506 }, { "epoch": 1.73, "learning_rate": 0.00022233201052451005, "loss": 0.0096, "step": 8507 }, { "epoch": 1.73, "learning_rate": 0.0002223150272959715, "loss": 0.0051, "step": 8508 }, { "epoch": 1.73, "learning_rate": 0.0002222980428596355, "loss": 0.0101, "step": 8509 }, { "epoch": 1.73, "learning_rate": 0.0002222810572157857, "loss": 0.0088, "step": 8510 }, { "epoch": 1.73, "learning_rate": 0.00022226407036470577, "loss": 0.0206, "step": 8511 }, { "epoch": 1.73, "learning_rate": 0.0002222470823066795, "loss": 0.0246, "step": 8512 }, { "epoch": 1.73, "learning_rate": 0.0002222300930419906, "loss": 0.0072, "step": 8513 }, { "epoch": 1.73, "learning_rate": 0.00022221310257092272, "loss": 0.0281, "step": 8514 }, { "epoch": 1.73, "learning_rate": 0.00022219611089375983, "loss": 0.008, "step": 8515 }, { "epoch": 1.73, "learning_rate": 0.00022217911801078553, "loss": 0.0142, "step": 8516 }, { "epoch": 1.73, "learning_rate": 0.00022216212392228374, "loss": 0.0068, "step": 8517 }, { "epoch": 1.73, "learning_rate": 0.00022214512862853825, "loss": 0.0096, "step": 8518 }, { "epoch": 1.73, "learning_rate": 0.00022212813212983294, "loss": 0.0068, "step": 8519 }, { "epoch": 1.73, "learning_rate": 0.00022211113442645165, "loss": 0.0169, "step": 8520 }, { "epoch": 1.74, "learning_rate": 0.0002220941355186783, "loss": 0.0378, "step": 8521 }, { "epoch": 1.74, "learning_rate": 0.0002220771354067968, "loss": 0.0223, "step": 8522 }, { "epoch": 1.74, "learning_rate": 0.0002220601340910911, "loss": 0.0061, "step": 8523 }, { "epoch": 1.74, "learning_rate": 0.00022204313157184514, "loss": 0.0245, "step": 8524 }, { "epoch": 1.74, "learning_rate": 0.0002220261278493429, "loss": 0.0127, "step": 8525 }, { "epoch": 1.74, "learning_rate": 0.00022200912292386833, "loss": 0.0102, "step": 8526 }, { "epoch": 1.74, "learning_rate": 0.0002219921167957055, "loss": 0.0311, "step": 8527 }, { "epoch": 1.74, "learning_rate": 0.00022197510946513844, "loss": 0.0227, "step": 8528 }, { "epoch": 1.74, "learning_rate": 0.00022195810093245116, "loss": 0.0015, "step": 8529 }, { "epoch": 1.74, "learning_rate": 0.0002219410911979278, "loss": 0.0165, "step": 8530 }, { "epoch": 1.74, "learning_rate": 0.00022192408026185237, "loss": 0.0238, "step": 8531 }, { "epoch": 1.74, "learning_rate": 0.00022190706812450905, "loss": 0.0276, "step": 8532 }, { "epoch": 1.74, "learning_rate": 0.00022189005478618197, "loss": 0.0325, "step": 8533 }, { "epoch": 1.74, "learning_rate": 0.00022187304024715528, "loss": 0.0064, "step": 8534 }, { "epoch": 1.74, "learning_rate": 0.00022185602450771317, "loss": 0.0133, "step": 8535 }, { "epoch": 1.74, "learning_rate": 0.00022183900756813973, "loss": 0.0067, "step": 8536 }, { "epoch": 1.74, "learning_rate": 0.00022182198942871932, "loss": 0.0512, "step": 8537 }, { "epoch": 1.74, "learning_rate": 0.00022180497008973614, "loss": 0.0142, "step": 8538 }, { "epoch": 1.74, "learning_rate": 0.00022178794955147435, "loss": 0.0129, "step": 8539 }, { "epoch": 1.74, "learning_rate": 0.00022177092781421832, "loss": 0.0183, "step": 8540 }, { "epoch": 1.74, "learning_rate": 0.00022175390487825231, "loss": 0.0053, "step": 8541 }, { "epoch": 1.74, "learning_rate": 0.0002217368807438607, "loss": 0.0049, "step": 8542 }, { "epoch": 1.74, "learning_rate": 0.0002217198554113277, "loss": 0.043, "step": 8543 }, { "epoch": 1.74, "learning_rate": 0.00022170282888093774, "loss": 0.0143, "step": 8544 }, { "epoch": 1.74, "learning_rate": 0.0002216858011529752, "loss": 0.0053, "step": 8545 }, { "epoch": 1.74, "learning_rate": 0.00022166877222772448, "loss": 0.0085, "step": 8546 }, { "epoch": 1.74, "learning_rate": 0.00022165174210546997, "loss": 0.0208, "step": 8547 }, { "epoch": 1.74, "learning_rate": 0.00022163471078649613, "loss": 0.006, "step": 8548 }, { "epoch": 1.74, "learning_rate": 0.00022161767827108737, "loss": 0.0145, "step": 8549 }, { "epoch": 1.74, "learning_rate": 0.0002216006445595282, "loss": 0.0146, "step": 8550 }, { "epoch": 1.74, "learning_rate": 0.0002215836096521031, "loss": 0.0348, "step": 8551 }, { "epoch": 1.74, "learning_rate": 0.00022156657354909664, "loss": 0.0168, "step": 8552 }, { "epoch": 1.74, "learning_rate": 0.00022154953625079328, "loss": 0.0155, "step": 8553 }, { "epoch": 1.74, "learning_rate": 0.0002215324977574776, "loss": 0.0191, "step": 8554 }, { "epoch": 1.74, "learning_rate": 0.00022151545806943417, "loss": 0.0058, "step": 8555 }, { "epoch": 1.74, "learning_rate": 0.00022149841718694765, "loss": 0.0305, "step": 8556 }, { "epoch": 1.74, "learning_rate": 0.0002214813751103026, "loss": 0.0165, "step": 8557 }, { "epoch": 1.74, "learning_rate": 0.0002214643318397836, "loss": 0.0152, "step": 8558 }, { "epoch": 1.74, "learning_rate": 0.00022144728737567536, "loss": 0.0242, "step": 8559 }, { "epoch": 1.74, "learning_rate": 0.0002214302417182626, "loss": 0.0179, "step": 8560 }, { "epoch": 1.74, "learning_rate": 0.00022141319486782994, "loss": 0.0052, "step": 8561 }, { "epoch": 1.74, "learning_rate": 0.0002213961468246621, "loss": 0.0106, "step": 8562 }, { "epoch": 1.74, "learning_rate": 0.00022137909758904384, "loss": 0.0043, "step": 8563 }, { "epoch": 1.74, "learning_rate": 0.00022136204716125996, "loss": 0.0192, "step": 8564 }, { "epoch": 1.74, "learning_rate": 0.00022134499554159518, "loss": 0.0206, "step": 8565 }, { "epoch": 1.74, "learning_rate": 0.00022132794273033428, "loss": 0.0361, "step": 8566 }, { "epoch": 1.74, "learning_rate": 0.0002213108887277621, "loss": 0.0365, "step": 8567 }, { "epoch": 1.74, "learning_rate": 0.00022129383353416347, "loss": 0.014, "step": 8568 }, { "epoch": 1.74, "learning_rate": 0.00022127677714982327, "loss": 0.0202, "step": 8569 }, { "epoch": 1.75, "learning_rate": 0.0002212597195750263, "loss": 0.0079, "step": 8570 }, { "epoch": 1.75, "learning_rate": 0.00022124266081005755, "loss": 0.0108, "step": 8571 }, { "epoch": 1.75, "learning_rate": 0.00022122560085520185, "loss": 0.0265, "step": 8572 }, { "epoch": 1.75, "learning_rate": 0.00022120853971074414, "loss": 0.0176, "step": 8573 }, { "epoch": 1.75, "learning_rate": 0.00022119147737696942, "loss": 0.0079, "step": 8574 }, { "epoch": 1.75, "learning_rate": 0.0002211744138541627, "loss": 0.0051, "step": 8575 }, { "epoch": 1.75, "learning_rate": 0.00022115734914260888, "loss": 0.0114, "step": 8576 }, { "epoch": 1.75, "learning_rate": 0.000221140283242593, "loss": 0.0024, "step": 8577 }, { "epoch": 1.75, "learning_rate": 0.00022112321615440011, "loss": 0.0422, "step": 8578 }, { "epoch": 1.75, "learning_rate": 0.00022110614787831525, "loss": 0.0249, "step": 8579 }, { "epoch": 1.75, "learning_rate": 0.00022108907841462353, "loss": 0.0329, "step": 8580 }, { "epoch": 1.75, "learning_rate": 0.00022107200776360999, "loss": 0.0032, "step": 8581 }, { "epoch": 1.75, "learning_rate": 0.00022105493592555975, "loss": 0.009, "step": 8582 }, { "epoch": 1.75, "learning_rate": 0.00022103786290075795, "loss": 0.0086, "step": 8583 }, { "epoch": 1.75, "learning_rate": 0.00022102078868948977, "loss": 0.01, "step": 8584 }, { "epoch": 1.75, "learning_rate": 0.00022100371329204034, "loss": 0.0127, "step": 8585 }, { "epoch": 1.75, "learning_rate": 0.00022098663670869486, "loss": 0.0088, "step": 8586 }, { "epoch": 1.75, "learning_rate": 0.00022096955893973857, "loss": 0.0024, "step": 8587 }, { "epoch": 1.75, "learning_rate": 0.0002209524799854567, "loss": 0.0108, "step": 8588 }, { "epoch": 1.75, "learning_rate": 0.00022093539984613446, "loss": 0.019, "step": 8589 }, { "epoch": 1.75, "learning_rate": 0.00022091831852205716, "loss": 0.0175, "step": 8590 }, { "epoch": 1.75, "learning_rate": 0.00022090123601351, "loss": 0.0059, "step": 8591 }, { "epoch": 1.75, "learning_rate": 0.00022088415232077846, "loss": 0.0087, "step": 8592 }, { "epoch": 1.75, "learning_rate": 0.00022086706744414768, "loss": 0.006, "step": 8593 }, { "epoch": 1.75, "learning_rate": 0.00022084998138390316, "loss": 0.0177, "step": 8594 }, { "epoch": 1.75, "learning_rate": 0.0002208328941403302, "loss": 0.0128, "step": 8595 }, { "epoch": 1.75, "learning_rate": 0.00022081580571371422, "loss": 0.0149, "step": 8596 }, { "epoch": 1.75, "learning_rate": 0.0002207987161043406, "loss": 0.0304, "step": 8597 }, { "epoch": 1.75, "learning_rate": 0.00022078162531249476, "loss": 0.0204, "step": 8598 }, { "epoch": 1.75, "learning_rate": 0.0002207645333384622, "loss": 0.0365, "step": 8599 }, { "epoch": 1.75, "learning_rate": 0.00022074744018252832, "loss": 0.0099, "step": 8600 }, { "epoch": 1.75, "learning_rate": 0.00022073034584497867, "loss": 0.012, "step": 8601 }, { "epoch": 1.75, "learning_rate": 0.00022071325032609873, "loss": 0.0138, "step": 8602 }, { "epoch": 1.75, "learning_rate": 0.000220696153626174, "loss": 0.0118, "step": 8603 }, { "epoch": 1.75, "learning_rate": 0.00022067905574549008, "loss": 0.0141, "step": 8604 }, { "epoch": 1.75, "learning_rate": 0.0002206619566843325, "loss": 0.0098, "step": 8605 }, { "epoch": 1.75, "learning_rate": 0.00022064485644298688, "loss": 0.0107, "step": 8606 }, { "epoch": 1.75, "learning_rate": 0.00022062775502173877, "loss": 0.0129, "step": 8607 }, { "epoch": 1.75, "learning_rate": 0.00022061065242087393, "loss": 0.0087, "step": 8608 }, { "epoch": 1.75, "learning_rate": 0.0002205935486406778, "loss": 0.0047, "step": 8609 }, { "epoch": 1.75, "learning_rate": 0.0002205764436814362, "loss": 0.0096, "step": 8610 }, { "epoch": 1.75, "learning_rate": 0.00022055933754343475, "loss": 0.0061, "step": 8611 }, { "epoch": 1.75, "learning_rate": 0.0002205422302269592, "loss": 0.0235, "step": 8612 }, { "epoch": 1.75, "learning_rate": 0.00022052512173229523, "loss": 0.012, "step": 8613 }, { "epoch": 1.75, "learning_rate": 0.00022050801205972858, "loss": 0.0147, "step": 8614 }, { "epoch": 1.75, "learning_rate": 0.00022049090120954503, "loss": 0.0076, "step": 8615 }, { "epoch": 1.75, "learning_rate": 0.00022047378918203038, "loss": 0.0315, "step": 8616 }, { "epoch": 1.75, "learning_rate": 0.00022045667597747046, "loss": 0.0158, "step": 8617 }, { "epoch": 1.75, "learning_rate": 0.00022043956159615102, "loss": 0.0133, "step": 8618 }, { "epoch": 1.75, "learning_rate": 0.00022042244603835795, "loss": 0.0256, "step": 8619 }, { "epoch": 1.76, "learning_rate": 0.00022040532930437708, "loss": 0.0133, "step": 8620 }, { "epoch": 1.76, "learning_rate": 0.00022038821139449432, "loss": 0.0184, "step": 8621 }, { "epoch": 1.76, "learning_rate": 0.00022037109230899562, "loss": 0.0138, "step": 8622 }, { "epoch": 1.76, "learning_rate": 0.00022035397204816677, "loss": 0.0201, "step": 8623 }, { "epoch": 1.76, "learning_rate": 0.0002203368506122938, "loss": 0.0172, "step": 8624 }, { "epoch": 1.76, "learning_rate": 0.00022031972800166269, "loss": 0.0119, "step": 8625 }, { "epoch": 1.76, "learning_rate": 0.00022030260421655932, "loss": 0.0073, "step": 8626 }, { "epoch": 1.76, "learning_rate": 0.0002202854792572698, "loss": 0.017, "step": 8627 }, { "epoch": 1.76, "learning_rate": 0.0002202683531240801, "loss": 0.0075, "step": 8628 }, { "epoch": 1.76, "learning_rate": 0.00022025122581727626, "loss": 0.0161, "step": 8629 }, { "epoch": 1.76, "learning_rate": 0.00022023409733714432, "loss": 0.0092, "step": 8630 }, { "epoch": 1.76, "learning_rate": 0.0002202169676839704, "loss": 0.0166, "step": 8631 }, { "epoch": 1.76, "learning_rate": 0.00022019983685804057, "loss": 0.0048, "step": 8632 }, { "epoch": 1.76, "learning_rate": 0.00022018270485964095, "loss": 0.0119, "step": 8633 }, { "epoch": 1.76, "learning_rate": 0.0002201655716890577, "loss": 0.0115, "step": 8634 }, { "epoch": 1.76, "learning_rate": 0.00022014843734657693, "loss": 0.0094, "step": 8635 }, { "epoch": 1.76, "learning_rate": 0.00022013130183248482, "loss": 0.0082, "step": 8636 }, { "epoch": 1.76, "learning_rate": 0.00022011416514706764, "loss": 0.0188, "step": 8637 }, { "epoch": 1.76, "learning_rate": 0.0002200970272906115, "loss": 0.0078, "step": 8638 }, { "epoch": 1.76, "learning_rate": 0.00022007988826340272, "loss": 0.0023, "step": 8639 }, { "epoch": 1.76, "learning_rate": 0.00022006274806572756, "loss": 0.0102, "step": 8640 }, { "epoch": 1.76, "learning_rate": 0.0002200456066978722, "loss": 0.0292, "step": 8641 }, { "epoch": 1.76, "learning_rate": 0.00022002846416012298, "loss": 0.0513, "step": 8642 }, { "epoch": 1.76, "learning_rate": 0.00022001132045276626, "loss": 0.0072, "step": 8643 }, { "epoch": 1.76, "learning_rate": 0.0002199941755760883, "loss": 0.0053, "step": 8644 }, { "epoch": 1.76, "learning_rate": 0.00021997702953037548, "loss": 0.0129, "step": 8645 }, { "epoch": 1.76, "learning_rate": 0.0002199598823159142, "loss": 0.0102, "step": 8646 }, { "epoch": 1.76, "learning_rate": 0.0002199427339329908, "loss": 0.0251, "step": 8647 }, { "epoch": 1.76, "learning_rate": 0.00021992558438189175, "loss": 0.0172, "step": 8648 }, { "epoch": 1.76, "learning_rate": 0.00021990843366290346, "loss": 0.0081, "step": 8649 }, { "epoch": 1.76, "learning_rate": 0.00021989128177631232, "loss": 0.0185, "step": 8650 }, { "epoch": 1.76, "learning_rate": 0.00021987412872240486, "loss": 0.0222, "step": 8651 }, { "epoch": 1.76, "learning_rate": 0.00021985697450146758, "loss": 0.0366, "step": 8652 }, { "epoch": 1.76, "learning_rate": 0.0002198398191137869, "loss": 0.0109, "step": 8653 }, { "epoch": 1.76, "learning_rate": 0.0002198226625596495, "loss": 0.0185, "step": 8654 }, { "epoch": 1.76, "learning_rate": 0.00021980550483934177, "loss": 0.0176, "step": 8655 }, { "epoch": 1.76, "learning_rate": 0.00021978834595315033, "loss": 0.0179, "step": 8656 }, { "epoch": 1.76, "learning_rate": 0.0002197711859013618, "loss": 0.0156, "step": 8657 }, { "epoch": 1.76, "learning_rate": 0.00021975402468426276, "loss": 0.0057, "step": 8658 }, { "epoch": 1.76, "learning_rate": 0.00021973686230213985, "loss": 0.014, "step": 8659 }, { "epoch": 1.76, "learning_rate": 0.00021971969875527974, "loss": 0.0267, "step": 8660 }, { "epoch": 1.76, "learning_rate": 0.00021970253404396896, "loss": 0.0142, "step": 8661 }, { "epoch": 1.76, "learning_rate": 0.00021968536816849437, "loss": 0.0179, "step": 8662 }, { "epoch": 1.76, "learning_rate": 0.00021966820112914257, "loss": 0.0198, "step": 8663 }, { "epoch": 1.76, "learning_rate": 0.00021965103292620027, "loss": 0.0153, "step": 8664 }, { "epoch": 1.76, "learning_rate": 0.00021963386355995426, "loss": 0.0176, "step": 8665 }, { "epoch": 1.76, "learning_rate": 0.00021961669303069133, "loss": 0.0059, "step": 8666 }, { "epoch": 1.76, "learning_rate": 0.0002195995213386982, "loss": 0.01, "step": 8667 }, { "epoch": 1.76, "learning_rate": 0.00021958234848426164, "loss": 0.0023, "step": 8668 }, { "epoch": 1.77, "learning_rate": 0.00021956517446766852, "loss": 0.0183, "step": 8669 }, { "epoch": 1.77, "learning_rate": 0.00021954799928920567, "loss": 0.0063, "step": 8670 }, { "epoch": 1.77, "learning_rate": 0.00021953082294916, "loss": 0.0278, "step": 8671 }, { "epoch": 1.77, "learning_rate": 0.0002195136454478183, "loss": 0.0174, "step": 8672 }, { "epoch": 1.77, "learning_rate": 0.00021949646678546755, "loss": 0.0176, "step": 8673 }, { "epoch": 1.77, "learning_rate": 0.00021947928696239457, "loss": 0.0198, "step": 8674 }, { "epoch": 1.77, "learning_rate": 0.00021946210597888636, "loss": 0.0337, "step": 8675 }, { "epoch": 1.77, "learning_rate": 0.00021944492383522987, "loss": 0.0124, "step": 8676 }, { "epoch": 1.77, "learning_rate": 0.00021942774053171205, "loss": 0.0437, "step": 8677 }, { "epoch": 1.77, "learning_rate": 0.0002194105560686199, "loss": 0.0228, "step": 8678 }, { "epoch": 1.77, "learning_rate": 0.00021939337044624046, "loss": 0.0055, "step": 8679 }, { "epoch": 1.77, "learning_rate": 0.00021937618366486077, "loss": 0.0052, "step": 8680 }, { "epoch": 1.77, "learning_rate": 0.00021935899572476778, "loss": 0.0108, "step": 8681 }, { "epoch": 1.77, "learning_rate": 0.00021934180662624875, "loss": 0.0038, "step": 8682 }, { "epoch": 1.77, "learning_rate": 0.0002193246163695906, "loss": 0.0148, "step": 8683 }, { "epoch": 1.77, "learning_rate": 0.00021930742495508048, "loss": 0.0433, "step": 8684 }, { "epoch": 1.77, "learning_rate": 0.00021929023238300552, "loss": 0.0132, "step": 8685 }, { "epoch": 1.77, "learning_rate": 0.00021927303865365292, "loss": 0.0046, "step": 8686 }, { "epoch": 1.77, "learning_rate": 0.0002192558437673098, "loss": 0.0083, "step": 8687 }, { "epoch": 1.77, "learning_rate": 0.00021923864772426335, "loss": 0.0091, "step": 8688 }, { "epoch": 1.77, "learning_rate": 0.00021922145052480084, "loss": 0.0223, "step": 8689 }, { "epoch": 1.77, "learning_rate": 0.00021920425216920937, "loss": 0.0042, "step": 8690 }, { "epoch": 1.77, "learning_rate": 0.0002191870526577763, "loss": 0.0292, "step": 8691 }, { "epoch": 1.77, "learning_rate": 0.00021916985199078886, "loss": 0.009, "step": 8692 }, { "epoch": 1.77, "learning_rate": 0.0002191526501685343, "loss": 0.0083, "step": 8693 }, { "epoch": 1.77, "learning_rate": 0.0002191354471912999, "loss": 0.0184, "step": 8694 }, { "epoch": 1.77, "learning_rate": 0.0002191182430593731, "loss": 0.0071, "step": 8695 }, { "epoch": 1.77, "learning_rate": 0.0002191010377730412, "loss": 0.0147, "step": 8696 }, { "epoch": 1.77, "learning_rate": 0.0002190838313325915, "loss": 0.0035, "step": 8697 }, { "epoch": 1.77, "learning_rate": 0.00021906662373831135, "loss": 0.0109, "step": 8698 }, { "epoch": 1.77, "learning_rate": 0.00021904941499048823, "loss": 0.0177, "step": 8699 }, { "epoch": 1.77, "learning_rate": 0.00021903220508940962, "loss": 0.0159, "step": 8700 }, { "epoch": 1.77, "learning_rate": 0.0002190149940353628, "loss": 0.027, "step": 8701 }, { "epoch": 1.77, "learning_rate": 0.00021899778182863532, "loss": 0.0311, "step": 8702 }, { "epoch": 1.77, "learning_rate": 0.00021898056846951465, "loss": 0.0186, "step": 8703 }, { "epoch": 1.77, "learning_rate": 0.00021896335395828827, "loss": 0.0052, "step": 8704 }, { "epoch": 1.77, "learning_rate": 0.00021894613829524375, "loss": 0.005, "step": 8705 }, { "epoch": 1.77, "learning_rate": 0.0002189289214806685, "loss": 0.0175, "step": 8706 }, { "epoch": 1.77, "learning_rate": 0.00021891170351485015, "loss": 0.016, "step": 8707 }, { "epoch": 1.77, "learning_rate": 0.00021889448439807633, "loss": 0.0184, "step": 8708 }, { "epoch": 1.77, "learning_rate": 0.00021887726413063454, "loss": 0.0217, "step": 8709 }, { "epoch": 1.77, "learning_rate": 0.0002188600427128124, "loss": 0.0192, "step": 8710 }, { "epoch": 1.77, "learning_rate": 0.0002188428201448976, "loss": 0.0398, "step": 8711 }, { "epoch": 1.77, "learning_rate": 0.00021882559642717777, "loss": 0.0035, "step": 8712 }, { "epoch": 1.77, "learning_rate": 0.00021880837155994053, "loss": 0.0108, "step": 8713 }, { "epoch": 1.77, "learning_rate": 0.00021879114554347362, "loss": 0.0364, "step": 8714 }, { "epoch": 1.77, "learning_rate": 0.00021877391837806472, "loss": 0.0135, "step": 8715 }, { "epoch": 1.77, "learning_rate": 0.00021875669006400154, "loss": 0.0073, "step": 8716 }, { "epoch": 1.77, "learning_rate": 0.00021873946060157188, "loss": 0.0123, "step": 8717 }, { "epoch": 1.78, "learning_rate": 0.0002187222299910635, "loss": 0.0113, "step": 8718 }, { "epoch": 1.78, "learning_rate": 0.0002187049982327641, "loss": 0.0171, "step": 8719 }, { "epoch": 1.78, "learning_rate": 0.00021868776532696152, "loss": 0.0042, "step": 8720 }, { "epoch": 1.78, "learning_rate": 0.00021867053127394364, "loss": 0.0191, "step": 8721 }, { "epoch": 1.78, "learning_rate": 0.00021865329607399824, "loss": 0.0074, "step": 8722 }, { "epoch": 1.78, "learning_rate": 0.00021863605972741328, "loss": 0.0158, "step": 8723 }, { "epoch": 1.78, "learning_rate": 0.0002186188222344765, "loss": 0.0127, "step": 8724 }, { "epoch": 1.78, "learning_rate": 0.00021860158359547584, "loss": 0.0248, "step": 8725 }, { "epoch": 1.78, "learning_rate": 0.0002185843438106993, "loss": 0.0337, "step": 8726 }, { "epoch": 1.78, "learning_rate": 0.00021856710288043472, "loss": 0.0278, "step": 8727 }, { "epoch": 1.78, "learning_rate": 0.00021854986080497007, "loss": 0.0097, "step": 8728 }, { "epoch": 1.78, "learning_rate": 0.00021853261758459337, "loss": 0.0085, "step": 8729 }, { "epoch": 1.78, "learning_rate": 0.0002185153732195926, "loss": 0.025, "step": 8730 }, { "epoch": 1.78, "learning_rate": 0.00021849812771025575, "loss": 0.0082, "step": 8731 }, { "epoch": 1.78, "learning_rate": 0.0002184808810568709, "loss": 0.0036, "step": 8732 }, { "epoch": 1.78, "learning_rate": 0.00021846363325972606, "loss": 0.005, "step": 8733 }, { "epoch": 1.78, "learning_rate": 0.00021844638431910927, "loss": 0.0123, "step": 8734 }, { "epoch": 1.78, "learning_rate": 0.0002184291342353087, "loss": 0.0009, "step": 8735 }, { "epoch": 1.78, "learning_rate": 0.00021841188300861242, "loss": 0.0102, "step": 8736 }, { "epoch": 1.78, "learning_rate": 0.00021839463063930858, "loss": 0.0055, "step": 8737 }, { "epoch": 1.78, "learning_rate": 0.00021837737712768524, "loss": 0.0336, "step": 8738 }, { "epoch": 1.78, "learning_rate": 0.00021836012247403066, "loss": 0.1206, "step": 8739 }, { "epoch": 1.78, "learning_rate": 0.000218342866678633, "loss": 0.0128, "step": 8740 }, { "epoch": 1.78, "learning_rate": 0.0002183256097417804, "loss": 0.0221, "step": 8741 }, { "epoch": 1.78, "learning_rate": 0.00021830835166376125, "loss": 0.0225, "step": 8742 }, { "epoch": 1.78, "learning_rate": 0.00021829109244486363, "loss": 0.0359, "step": 8743 }, { "epoch": 1.78, "learning_rate": 0.00021827383208537586, "loss": 0.0078, "step": 8744 }, { "epoch": 1.78, "learning_rate": 0.00021825657058558622, "loss": 0.0117, "step": 8745 }, { "epoch": 1.78, "learning_rate": 0.000218239307945783, "loss": 0.0043, "step": 8746 }, { "epoch": 1.78, "learning_rate": 0.00021822204416625457, "loss": 0.0081, "step": 8747 }, { "epoch": 1.78, "learning_rate": 0.00021820477924728917, "loss": 0.0046, "step": 8748 }, { "epoch": 1.78, "learning_rate": 0.00021818751318917524, "loss": 0.0121, "step": 8749 }, { "epoch": 1.78, "learning_rate": 0.00021817024599220112, "loss": 0.0159, "step": 8750 }, { "epoch": 1.78, "learning_rate": 0.00021815297765665517, "loss": 0.0025, "step": 8751 }, { "epoch": 1.78, "learning_rate": 0.0002181357081828259, "loss": 0.0265, "step": 8752 }, { "epoch": 1.78, "learning_rate": 0.0002181184375710017, "loss": 0.0129, "step": 8753 }, { "epoch": 1.78, "learning_rate": 0.00021810116582147098, "loss": 0.016, "step": 8754 }, { "epoch": 1.78, "learning_rate": 0.00021808389293452221, "loss": 0.0085, "step": 8755 }, { "epoch": 1.78, "learning_rate": 0.00021806661891044397, "loss": 0.0069, "step": 8756 }, { "epoch": 1.78, "learning_rate": 0.0002180493437495247, "loss": 0.0196, "step": 8757 }, { "epoch": 1.78, "learning_rate": 0.0002180320674520529, "loss": 0.0059, "step": 8758 }, { "epoch": 1.78, "learning_rate": 0.00021801479001831717, "loss": 0.0179, "step": 8759 }, { "epoch": 1.78, "learning_rate": 0.00021799751144860606, "loss": 0.058, "step": 8760 }, { "epoch": 1.78, "learning_rate": 0.00021798023174320817, "loss": 0.0037, "step": 8761 }, { "epoch": 1.78, "learning_rate": 0.00021796295090241205, "loss": 0.006, "step": 8762 }, { "epoch": 1.78, "learning_rate": 0.00021794566892650638, "loss": 0.0184, "step": 8763 }, { "epoch": 1.78, "learning_rate": 0.00021792838581577981, "loss": 0.0059, "step": 8764 }, { "epoch": 1.78, "learning_rate": 0.00021791110157052095, "loss": 0.0062, "step": 8765 }, { "epoch": 1.78, "learning_rate": 0.00021789381619101853, "loss": 0.0295, "step": 8766 }, { "epoch": 1.79, "learning_rate": 0.00021787652967756118, "loss": 0.0166, "step": 8767 }, { "epoch": 1.79, "learning_rate": 0.0002178592420304377, "loss": 0.0166, "step": 8768 }, { "epoch": 1.79, "learning_rate": 0.00021784195324993673, "loss": 0.0074, "step": 8769 }, { "epoch": 1.79, "learning_rate": 0.00021782466333634712, "loss": 0.009, "step": 8770 }, { "epoch": 1.79, "learning_rate": 0.00021780737228995758, "loss": 0.0167, "step": 8771 }, { "epoch": 1.79, "learning_rate": 0.00021779008011105693, "loss": 0.0097, "step": 8772 }, { "epoch": 1.79, "learning_rate": 0.000217772786799934, "loss": 0.0275, "step": 8773 }, { "epoch": 1.79, "learning_rate": 0.0002177554923568776, "loss": 0.0111, "step": 8774 }, { "epoch": 1.79, "learning_rate": 0.00021773819678217658, "loss": 0.0128, "step": 8775 }, { "epoch": 1.79, "learning_rate": 0.00021772090007611978, "loss": 0.017, "step": 8776 }, { "epoch": 1.79, "learning_rate": 0.00021770360223899614, "loss": 0.0189, "step": 8777 }, { "epoch": 1.79, "learning_rate": 0.00021768630327109452, "loss": 0.0094, "step": 8778 }, { "epoch": 1.79, "learning_rate": 0.0002176690031727039, "loss": 0.0024, "step": 8779 }, { "epoch": 1.79, "learning_rate": 0.0002176517019441132, "loss": 0.0043, "step": 8780 }, { "epoch": 1.79, "learning_rate": 0.00021763439958561131, "loss": 0.0139, "step": 8781 }, { "epoch": 1.79, "learning_rate": 0.00021761709609748734, "loss": 0.025, "step": 8782 }, { "epoch": 1.79, "learning_rate": 0.0002175997914800302, "loss": 0.0066, "step": 8783 }, { "epoch": 1.79, "learning_rate": 0.00021758248573352897, "loss": 0.0078, "step": 8784 }, { "epoch": 1.79, "learning_rate": 0.00021756517885827262, "loss": 0.0107, "step": 8785 }, { "epoch": 1.79, "learning_rate": 0.0002175478708545503, "loss": 0.0304, "step": 8786 }, { "epoch": 1.79, "learning_rate": 0.00021753056172265096, "loss": 0.0096, "step": 8787 }, { "epoch": 1.79, "learning_rate": 0.0002175132514628638, "loss": 0.0073, "step": 8788 }, { "epoch": 1.79, "learning_rate": 0.00021749594007547794, "loss": 0.0077, "step": 8789 }, { "epoch": 1.79, "learning_rate": 0.00021747862756078243, "loss": 0.0322, "step": 8790 }, { "epoch": 1.79, "learning_rate": 0.00021746131391906645, "loss": 0.0092, "step": 8791 }, { "epoch": 1.79, "learning_rate": 0.0002174439991506192, "loss": 0.0035, "step": 8792 }, { "epoch": 1.79, "learning_rate": 0.00021742668325572985, "loss": 0.0213, "step": 8793 }, { "epoch": 1.79, "learning_rate": 0.00021740936623468766, "loss": 0.0116, "step": 8794 }, { "epoch": 1.79, "learning_rate": 0.00021739204808778173, "loss": 0.0304, "step": 8795 }, { "epoch": 1.79, "learning_rate": 0.00021737472881530143, "loss": 0.0134, "step": 8796 }, { "epoch": 1.79, "learning_rate": 0.00021735740841753598, "loss": 0.0115, "step": 8797 }, { "epoch": 1.79, "learning_rate": 0.00021734008689477466, "loss": 0.0411, "step": 8798 }, { "epoch": 1.79, "learning_rate": 0.00021732276424730681, "loss": 0.0095, "step": 8799 }, { "epoch": 1.79, "learning_rate": 0.00021730544047542167, "loss": 0.0059, "step": 8800 }, { "epoch": 1.79, "learning_rate": 0.00021728811557940862, "loss": 0.0144, "step": 8801 }, { "epoch": 1.79, "learning_rate": 0.00021727078955955704, "loss": 0.0161, "step": 8802 }, { "epoch": 1.79, "learning_rate": 0.0002172534624161563, "loss": 0.0335, "step": 8803 }, { "epoch": 1.79, "learning_rate": 0.00021723613414949578, "loss": 0.0047, "step": 8804 }, { "epoch": 1.79, "learning_rate": 0.0002172188047598649, "loss": 0.0263, "step": 8805 }, { "epoch": 1.79, "learning_rate": 0.00021720147424755308, "loss": 0.0108, "step": 8806 }, { "epoch": 1.79, "learning_rate": 0.00021718414261284982, "loss": 0.0073, "step": 8807 }, { "epoch": 1.79, "learning_rate": 0.00021716680985604459, "loss": 0.0237, "step": 8808 }, { "epoch": 1.79, "learning_rate": 0.00021714947597742677, "loss": 0.0115, "step": 8809 }, { "epoch": 1.79, "learning_rate": 0.00021713214097728598, "loss": 0.029, "step": 8810 }, { "epoch": 1.79, "learning_rate": 0.00021711480485591173, "loss": 0.0033, "step": 8811 }, { "epoch": 1.79, "learning_rate": 0.00021709746761359354, "loss": 0.036, "step": 8812 }, { "epoch": 1.79, "learning_rate": 0.00021708012925062095, "loss": 0.0046, "step": 8813 }, { "epoch": 1.79, "learning_rate": 0.00021706278976728365, "loss": 0.0072, "step": 8814 }, { "epoch": 1.79, "learning_rate": 0.00021704544916387113, "loss": 0.0144, "step": 8815 }, { "epoch": 1.8, "learning_rate": 0.00021702810744067308, "loss": 0.0044, "step": 8816 }, { "epoch": 1.8, "learning_rate": 0.00021701076459797907, "loss": 0.0068, "step": 8817 }, { "epoch": 1.8, "learning_rate": 0.00021699342063607883, "loss": 0.0143, "step": 8818 }, { "epoch": 1.8, "learning_rate": 0.00021697607555526196, "loss": 0.0335, "step": 8819 }, { "epoch": 1.8, "learning_rate": 0.00021695872935581826, "loss": 0.0271, "step": 8820 }, { "epoch": 1.8, "learning_rate": 0.0002169413820380374, "loss": 0.0403, "step": 8821 }, { "epoch": 1.8, "learning_rate": 0.00021692403360220905, "loss": 0.0191, "step": 8822 }, { "epoch": 1.8, "learning_rate": 0.00021690668404862295, "loss": 0.0291, "step": 8823 }, { "epoch": 1.8, "learning_rate": 0.00021688933337756902, "loss": 0.0031, "step": 8824 }, { "epoch": 1.8, "learning_rate": 0.00021687198158933696, "loss": 0.0071, "step": 8825 }, { "epoch": 1.8, "learning_rate": 0.00021685462868421655, "loss": 0.0167, "step": 8826 }, { "epoch": 1.8, "learning_rate": 0.00021683727466249769, "loss": 0.0013, "step": 8827 }, { "epoch": 1.8, "learning_rate": 0.00021681991952447012, "loss": 0.0031, "step": 8828 }, { "epoch": 1.8, "learning_rate": 0.00021680256327042375, "loss": 0.0048, "step": 8829 }, { "epoch": 1.8, "learning_rate": 0.00021678520590064855, "loss": 0.0121, "step": 8830 }, { "epoch": 1.8, "learning_rate": 0.0002167678474154343, "loss": 0.0167, "step": 8831 }, { "epoch": 1.8, "learning_rate": 0.00021675048781507095, "loss": 0.0327, "step": 8832 }, { "epoch": 1.8, "learning_rate": 0.00021673312709984848, "loss": 0.0071, "step": 8833 }, { "epoch": 1.8, "learning_rate": 0.00021671576527005682, "loss": 0.0056, "step": 8834 }, { "epoch": 1.8, "learning_rate": 0.00021669840232598595, "loss": 0.0224, "step": 8835 }, { "epoch": 1.8, "learning_rate": 0.00021668103826792584, "loss": 0.0111, "step": 8836 }, { "epoch": 1.8, "learning_rate": 0.00021666367309616653, "loss": 0.0157, "step": 8837 }, { "epoch": 1.8, "learning_rate": 0.00021664630681099802, "loss": 0.0294, "step": 8838 }, { "epoch": 1.8, "learning_rate": 0.00021662893941271045, "loss": 0.0081, "step": 8839 }, { "epoch": 1.8, "learning_rate": 0.00021661157090159378, "loss": 0.0171, "step": 8840 }, { "epoch": 1.8, "learning_rate": 0.00021659420127793813, "loss": 0.0077, "step": 8841 }, { "epoch": 1.8, "learning_rate": 0.0002165768305420336, "loss": 0.0158, "step": 8842 }, { "epoch": 1.8, "learning_rate": 0.0002165594586941703, "loss": 0.0203, "step": 8843 }, { "epoch": 1.8, "learning_rate": 0.00021654208573463845, "loss": 0.012, "step": 8844 }, { "epoch": 1.8, "learning_rate": 0.00021652471166372817, "loss": 0.0219, "step": 8845 }, { "epoch": 1.8, "learning_rate": 0.0002165073364817296, "loss": 0.006, "step": 8846 }, { "epoch": 1.8, "learning_rate": 0.00021648996018893302, "loss": 0.0027, "step": 8847 }, { "epoch": 1.8, "learning_rate": 0.00021647258278562856, "loss": 0.0114, "step": 8848 }, { "epoch": 1.8, "learning_rate": 0.00021645520427210647, "loss": 0.0083, "step": 8849 }, { "epoch": 1.8, "learning_rate": 0.00021643782464865707, "loss": 0.0104, "step": 8850 }, { "epoch": 1.8, "learning_rate": 0.00021642044391557055, "loss": 0.007, "step": 8851 }, { "epoch": 1.8, "learning_rate": 0.00021640306207313723, "loss": 0.015, "step": 8852 }, { "epoch": 1.8, "learning_rate": 0.0002163856791216475, "loss": 0.0048, "step": 8853 }, { "epoch": 1.8, "learning_rate": 0.00021636829506139154, "loss": 0.0156, "step": 8854 }, { "epoch": 1.8, "learning_rate": 0.00021635090989265978, "loss": 0.0129, "step": 8855 }, { "epoch": 1.8, "learning_rate": 0.00021633352361574262, "loss": 0.0084, "step": 8856 }, { "epoch": 1.8, "learning_rate": 0.00021631613623093038, "loss": 0.035, "step": 8857 }, { "epoch": 1.8, "learning_rate": 0.0002162987477385135, "loss": 0.0161, "step": 8858 }, { "epoch": 1.8, "learning_rate": 0.00021628135813878238, "loss": 0.0358, "step": 8859 }, { "epoch": 1.8, "learning_rate": 0.00021626396743202746, "loss": 0.008, "step": 8860 }, { "epoch": 1.8, "learning_rate": 0.00021624657561853918, "loss": 0.0134, "step": 8861 }, { "epoch": 1.8, "learning_rate": 0.0002162291826986081, "loss": 0.0067, "step": 8862 }, { "epoch": 1.8, "learning_rate": 0.00021621178867252462, "loss": 0.0159, "step": 8863 }, { "epoch": 1.8, "learning_rate": 0.00021619439354057923, "loss": 0.0196, "step": 8864 }, { "epoch": 1.81, "learning_rate": 0.00021617699730306256, "loss": 0.0285, "step": 8865 }, { "epoch": 1.81, "learning_rate": 0.00021615959996026512, "loss": 0.013, "step": 8866 }, { "epoch": 1.81, "learning_rate": 0.00021614220151247747, "loss": 0.012, "step": 8867 }, { "epoch": 1.81, "learning_rate": 0.00021612480195999024, "loss": 0.0075, "step": 8868 }, { "epoch": 1.81, "learning_rate": 0.00021610740130309397, "loss": 0.0106, "step": 8869 }, { "epoch": 1.81, "learning_rate": 0.00021608999954207927, "loss": 0.0254, "step": 8870 }, { "epoch": 1.81, "learning_rate": 0.0002160725966772369, "loss": 0.0629, "step": 8871 }, { "epoch": 1.81, "learning_rate": 0.0002160551927088574, "loss": 0.0462, "step": 8872 }, { "epoch": 1.81, "learning_rate": 0.0002160377876372315, "loss": 0.0063, "step": 8873 }, { "epoch": 1.81, "learning_rate": 0.00021602038146264991, "loss": 0.0148, "step": 8874 }, { "epoch": 1.81, "learning_rate": 0.00021600297418540327, "loss": 0.0032, "step": 8875 }, { "epoch": 1.81, "learning_rate": 0.00021598556580578243, "loss": 0.0025, "step": 8876 }, { "epoch": 1.81, "learning_rate": 0.00021596815632407803, "loss": 0.0164, "step": 8877 }, { "epoch": 1.81, "learning_rate": 0.00021595074574058093, "loss": 0.0418, "step": 8878 }, { "epoch": 1.81, "learning_rate": 0.0002159333340555819, "loss": 0.0067, "step": 8879 }, { "epoch": 1.81, "learning_rate": 0.0002159159212693717, "loss": 0.0201, "step": 8880 }, { "epoch": 1.81, "learning_rate": 0.00021589850738224127, "loss": 0.0053, "step": 8881 }, { "epoch": 1.81, "learning_rate": 0.0002158810923944813, "loss": 0.014, "step": 8882 }, { "epoch": 1.81, "learning_rate": 0.0002158636763063827, "loss": 0.0136, "step": 8883 }, { "epoch": 1.81, "learning_rate": 0.00021584625911823642, "loss": 0.018, "step": 8884 }, { "epoch": 1.81, "learning_rate": 0.00021582884083033333, "loss": 0.0143, "step": 8885 }, { "epoch": 1.81, "learning_rate": 0.00021581142144296432, "loss": 0.0129, "step": 8886 }, { "epoch": 1.81, "learning_rate": 0.00021579400095642036, "loss": 0.025, "step": 8887 }, { "epoch": 1.81, "learning_rate": 0.00021577657937099236, "loss": 0.0072, "step": 8888 }, { "epoch": 1.81, "learning_rate": 0.00021575915668697136, "loss": 0.0084, "step": 8889 }, { "epoch": 1.81, "learning_rate": 0.0002157417329046483, "loss": 0.0121, "step": 8890 }, { "epoch": 1.81, "learning_rate": 0.0002157243080243142, "loss": 0.0087, "step": 8891 }, { "epoch": 1.81, "learning_rate": 0.00021570688204626008, "loss": 0.0152, "step": 8892 }, { "epoch": 1.81, "learning_rate": 0.000215689454970777, "loss": 0.007, "step": 8893 }, { "epoch": 1.81, "learning_rate": 0.00021567202679815604, "loss": 0.015, "step": 8894 }, { "epoch": 1.81, "learning_rate": 0.00021565459752868828, "loss": 0.0253, "step": 8895 }, { "epoch": 1.81, "learning_rate": 0.00021563716716266478, "loss": 0.0063, "step": 8896 }, { "epoch": 1.81, "learning_rate": 0.0002156197357003767, "loss": 0.0162, "step": 8897 }, { "epoch": 1.81, "learning_rate": 0.00021560230314211518, "loss": 0.0165, "step": 8898 }, { "epoch": 1.81, "learning_rate": 0.00021558486948817138, "loss": 0.005, "step": 8899 }, { "epoch": 1.81, "learning_rate": 0.00021556743473883643, "loss": 0.0017, "step": 8900 }, { "epoch": 1.81, "learning_rate": 0.00021554999889440154, "loss": 0.0069, "step": 8901 }, { "epoch": 1.81, "learning_rate": 0.00021553256195515794, "loss": 0.0147, "step": 8902 }, { "epoch": 1.81, "learning_rate": 0.00021551512392139688, "loss": 0.0155, "step": 8903 }, { "epoch": 1.81, "learning_rate": 0.00021549768479340957, "loss": 0.0094, "step": 8904 }, { "epoch": 1.81, "learning_rate": 0.0002154802445714873, "loss": 0.0057, "step": 8905 }, { "epoch": 1.81, "learning_rate": 0.00021546280325592128, "loss": 0.0052, "step": 8906 }, { "epoch": 1.81, "learning_rate": 0.00021544536084700295, "loss": 0.0161, "step": 8907 }, { "epoch": 1.81, "learning_rate": 0.00021542791734502356, "loss": 0.0207, "step": 8908 }, { "epoch": 1.81, "learning_rate": 0.0002154104727502744, "loss": 0.0203, "step": 8909 }, { "epoch": 1.81, "learning_rate": 0.00021539302706304687, "loss": 0.0066, "step": 8910 }, { "epoch": 1.81, "learning_rate": 0.0002153755802836324, "loss": 0.0149, "step": 8911 }, { "epoch": 1.81, "learning_rate": 0.00021535813241232226, "loss": 0.017, "step": 8912 }, { "epoch": 1.81, "learning_rate": 0.00021534068344940805, "loss": 0.0174, "step": 8913 }, { "epoch": 1.82, "learning_rate": 0.000215323233395181, "loss": 0.032, "step": 8914 }, { "epoch": 1.82, "learning_rate": 0.00021530578224993263, "loss": 0.0041, "step": 8915 }, { "epoch": 1.82, "learning_rate": 0.00021528833001395448, "loss": 0.0128, "step": 8916 }, { "epoch": 1.82, "learning_rate": 0.00021527087668753793, "loss": 0.0057, "step": 8917 }, { "epoch": 1.82, "learning_rate": 0.00021525342227097458, "loss": 0.0089, "step": 8918 }, { "epoch": 1.82, "learning_rate": 0.00021523596676455587, "loss": 0.0054, "step": 8919 }, { "epoch": 1.82, "learning_rate": 0.0002152185101685734, "loss": 0.0116, "step": 8920 }, { "epoch": 1.82, "learning_rate": 0.0002152010524833187, "loss": 0.0073, "step": 8921 }, { "epoch": 1.82, "learning_rate": 0.0002151835937090833, "loss": 0.0102, "step": 8922 }, { "epoch": 1.82, "learning_rate": 0.0002151661338461589, "loss": 0.0245, "step": 8923 }, { "epoch": 1.82, "learning_rate": 0.00021514867289483704, "loss": 0.0303, "step": 8924 }, { "epoch": 1.82, "learning_rate": 0.00021513121085540933, "loss": 0.0245, "step": 8925 }, { "epoch": 1.82, "learning_rate": 0.0002151137477281675, "loss": 0.0055, "step": 8926 }, { "epoch": 1.82, "learning_rate": 0.00021509628351340315, "loss": 0.0245, "step": 8927 }, { "epoch": 1.82, "learning_rate": 0.000215078818211408, "loss": 0.002, "step": 8928 }, { "epoch": 1.82, "learning_rate": 0.0002150613518224737, "loss": 0.0153, "step": 8929 }, { "epoch": 1.82, "learning_rate": 0.00021504388434689204, "loss": 0.0079, "step": 8930 }, { "epoch": 1.82, "learning_rate": 0.00021502641578495475, "loss": 0.0195, "step": 8931 }, { "epoch": 1.82, "learning_rate": 0.0002150089461369536, "loss": 0.0213, "step": 8932 }, { "epoch": 1.82, "learning_rate": 0.00021499147540318027, "loss": 0.0452, "step": 8933 }, { "epoch": 1.82, "learning_rate": 0.00021497400358392663, "loss": 0.0029, "step": 8934 }, { "epoch": 1.82, "learning_rate": 0.00021495653067948452, "loss": 0.0086, "step": 8935 }, { "epoch": 1.82, "learning_rate": 0.0002149390566901457, "loss": 0.0124, "step": 8936 }, { "epoch": 1.82, "learning_rate": 0.00021492158161620206, "loss": 0.0133, "step": 8937 }, { "epoch": 1.82, "learning_rate": 0.00021490410545794546, "loss": 0.0171, "step": 8938 }, { "epoch": 1.82, "learning_rate": 0.0002148866282156678, "loss": 0.0182, "step": 8939 }, { "epoch": 1.82, "learning_rate": 0.00021486914988966095, "loss": 0.0031, "step": 8940 }, { "epoch": 1.82, "learning_rate": 0.00021485167048021685, "loss": 0.0066, "step": 8941 }, { "epoch": 1.82, "learning_rate": 0.00021483418998762742, "loss": 0.0058, "step": 8942 }, { "epoch": 1.82, "learning_rate": 0.00021481670841218465, "loss": 0.0072, "step": 8943 }, { "epoch": 1.82, "learning_rate": 0.00021479922575418051, "loss": 0.0045, "step": 8944 }, { "epoch": 1.82, "learning_rate": 0.00021478174201390699, "loss": 0.0122, "step": 8945 }, { "epoch": 1.82, "learning_rate": 0.00021476425719165612, "loss": 0.0369, "step": 8946 }, { "epoch": 1.82, "learning_rate": 0.0002147467712877198, "loss": 0.0112, "step": 8947 }, { "epoch": 1.82, "learning_rate": 0.00021472928430239023, "loss": 0.0033, "step": 8948 }, { "epoch": 1.82, "learning_rate": 0.00021471179623595943, "loss": 0.0112, "step": 8949 }, { "epoch": 1.82, "learning_rate": 0.00021469430708871953, "loss": 0.0031, "step": 8950 }, { "epoch": 1.82, "learning_rate": 0.00021467681686096254, "loss": 0.0201, "step": 8951 }, { "epoch": 1.82, "learning_rate": 0.00021465932555298062, "loss": 0.0099, "step": 8952 }, { "epoch": 1.82, "learning_rate": 0.0002146418331650659, "loss": 0.0218, "step": 8953 }, { "epoch": 1.82, "learning_rate": 0.00021462433969751058, "loss": 0.0078, "step": 8954 }, { "epoch": 1.82, "learning_rate": 0.0002146068451506068, "loss": 0.0313, "step": 8955 }, { "epoch": 1.82, "learning_rate": 0.00021458934952464672, "loss": 0.0018, "step": 8956 }, { "epoch": 1.82, "learning_rate": 0.00021457185281992258, "loss": 0.0038, "step": 8957 }, { "epoch": 1.82, "learning_rate": 0.00021455435503672665, "loss": 0.0079, "step": 8958 }, { "epoch": 1.82, "learning_rate": 0.00021453685617535108, "loss": 0.048, "step": 8959 }, { "epoch": 1.82, "learning_rate": 0.00021451935623608822, "loss": 0.0088, "step": 8960 }, { "epoch": 1.82, "learning_rate": 0.0002145018552192303, "loss": 0.0098, "step": 8961 }, { "epoch": 1.82, "learning_rate": 0.0002144843531250697, "loss": 0.0097, "step": 8962 }, { "epoch": 1.83, "learning_rate": 0.00021446684995389865, "loss": 0.0022, "step": 8963 }, { "epoch": 1.83, "learning_rate": 0.00021444934570600952, "loss": 0.0127, "step": 8964 }, { "epoch": 1.83, "learning_rate": 0.00021443184038169466, "loss": 0.0327, "step": 8965 }, { "epoch": 1.83, "learning_rate": 0.0002144143339812464, "loss": 0.0028, "step": 8966 }, { "epoch": 1.83, "learning_rate": 0.0002143968265049572, "loss": 0.0036, "step": 8967 }, { "epoch": 1.83, "learning_rate": 0.00021437931795311946, "loss": 0.0079, "step": 8968 }, { "epoch": 1.83, "learning_rate": 0.00021436180832602554, "loss": 0.0707, "step": 8969 }, { "epoch": 1.83, "learning_rate": 0.000214344297623968, "loss": 0.0352, "step": 8970 }, { "epoch": 1.83, "learning_rate": 0.00021432678584723915, "loss": 0.0053, "step": 8971 }, { "epoch": 1.83, "learning_rate": 0.0002143092729961316, "loss": 0.0139, "step": 8972 }, { "epoch": 1.83, "learning_rate": 0.0002142917590709378, "loss": 0.0395, "step": 8973 }, { "epoch": 1.83, "learning_rate": 0.00021427424407195026, "loss": 0.0114, "step": 8974 }, { "epoch": 1.83, "learning_rate": 0.0002142567279994615, "loss": 0.0359, "step": 8975 }, { "epoch": 1.83, "learning_rate": 0.0002142392108537641, "loss": 0.0119, "step": 8976 }, { "epoch": 1.83, "learning_rate": 0.0002142216926351506, "loss": 0.0207, "step": 8977 }, { "epoch": 1.83, "learning_rate": 0.00021420417334391364, "loss": 0.0225, "step": 8978 }, { "epoch": 1.83, "learning_rate": 0.00021418665298034576, "loss": 0.0279, "step": 8979 }, { "epoch": 1.83, "learning_rate": 0.00021416913154473965, "loss": 0.0129, "step": 8980 }, { "epoch": 1.83, "learning_rate": 0.0002141516090373879, "loss": 0.0346, "step": 8981 }, { "epoch": 1.83, "learning_rate": 0.0002141340854585832, "loss": 0.0274, "step": 8982 }, { "epoch": 1.83, "learning_rate": 0.00021411656080861817, "loss": 0.0016, "step": 8983 }, { "epoch": 1.83, "learning_rate": 0.00021409903508778558, "loss": 0.0148, "step": 8984 }, { "epoch": 1.83, "learning_rate": 0.00021408150829637808, "loss": 0.0086, "step": 8985 }, { "epoch": 1.83, "learning_rate": 0.00021406398043468845, "loss": 0.0103, "step": 8986 }, { "epoch": 1.83, "learning_rate": 0.00021404645150300945, "loss": 0.0264, "step": 8987 }, { "epoch": 1.83, "learning_rate": 0.00021402892150163377, "loss": 0.0082, "step": 8988 }, { "epoch": 1.83, "learning_rate": 0.0002140113904308542, "loss": 0.0035, "step": 8989 }, { "epoch": 1.83, "learning_rate": 0.0002139938582909636, "loss": 0.0133, "step": 8990 }, { "epoch": 1.83, "learning_rate": 0.00021397632508225482, "loss": 0.0116, "step": 8991 }, { "epoch": 1.83, "learning_rate": 0.00021395879080502066, "loss": 0.0284, "step": 8992 }, { "epoch": 1.83, "learning_rate": 0.00021394125545955392, "loss": 0.0218, "step": 8993 }, { "epoch": 1.83, "learning_rate": 0.00021392371904614753, "loss": 0.025, "step": 8994 }, { "epoch": 1.83, "learning_rate": 0.00021390618156509435, "loss": 0.0064, "step": 8995 }, { "epoch": 1.83, "learning_rate": 0.0002138886430166873, "loss": 0.0247, "step": 8996 }, { "epoch": 1.83, "learning_rate": 0.00021387110340121934, "loss": 0.0032, "step": 8997 }, { "epoch": 1.83, "learning_rate": 0.00021385356271898338, "loss": 0.0324, "step": 8998 }, { "epoch": 1.83, "learning_rate": 0.00021383602097027238, "loss": 0.0152, "step": 8999 }, { "epoch": 1.83, "learning_rate": 0.00021381847815537928, "loss": 0.0149, "step": 9000 }, { "epoch": 1.83, "learning_rate": 0.00021380093427459724, "loss": 0.0116, "step": 9001 }, { "epoch": 1.83, "learning_rate": 0.0002137833893282191, "loss": 0.0062, "step": 9002 }, { "epoch": 1.83, "learning_rate": 0.00021376584331653795, "loss": 0.004, "step": 9003 }, { "epoch": 1.83, "learning_rate": 0.00021374829623984685, "loss": 0.0055, "step": 9004 }, { "epoch": 1.83, "learning_rate": 0.00021373074809843888, "loss": 0.0214, "step": 9005 }, { "epoch": 1.83, "learning_rate": 0.00021371319889260717, "loss": 0.019, "step": 9006 }, { "epoch": 1.83, "learning_rate": 0.0002136956486226447, "loss": 0.0015, "step": 9007 }, { "epoch": 1.83, "learning_rate": 0.0002136780972888447, "loss": 0.003, "step": 9008 }, { "epoch": 1.83, "learning_rate": 0.00021366054489150029, "loss": 0.0068, "step": 9009 }, { "epoch": 1.83, "learning_rate": 0.00021364299143090455, "loss": 0.011, "step": 9010 }, { "epoch": 1.83, "learning_rate": 0.00021362543690735077, "loss": 0.0121, "step": 9011 }, { "epoch": 1.84, "learning_rate": 0.00021360788132113206, "loss": 0.0101, "step": 9012 }, { "epoch": 1.84, "learning_rate": 0.0002135903246725417, "loss": 0.0078, "step": 9013 }, { "epoch": 1.84, "learning_rate": 0.00021357276696187284, "loss": 0.0043, "step": 9014 }, { "epoch": 1.84, "learning_rate": 0.0002135552081894188, "loss": 0.0107, "step": 9015 }, { "epoch": 1.84, "learning_rate": 0.00021353764835547282, "loss": 0.0102, "step": 9016 }, { "epoch": 1.84, "learning_rate": 0.00021352008746032815, "loss": 0.0086, "step": 9017 }, { "epoch": 1.84, "learning_rate": 0.00021350252550427816, "loss": 0.0303, "step": 9018 }, { "epoch": 1.84, "learning_rate": 0.0002134849624876161, "loss": 0.0117, "step": 9019 }, { "epoch": 1.84, "learning_rate": 0.00021346739841063527, "loss": 0.0099, "step": 9020 }, { "epoch": 1.84, "learning_rate": 0.00021344983327362916, "loss": 0.0118, "step": 9021 }, { "epoch": 1.84, "learning_rate": 0.00021343226707689104, "loss": 0.0212, "step": 9022 }, { "epoch": 1.84, "learning_rate": 0.00021341469982071433, "loss": 0.0225, "step": 9023 }, { "epoch": 1.84, "learning_rate": 0.00021339713150539245, "loss": 0.0152, "step": 9024 }, { "epoch": 1.84, "learning_rate": 0.00021337956213121878, "loss": 0.0173, "step": 9025 }, { "epoch": 1.84, "learning_rate": 0.00021336199169848678, "loss": 0.0114, "step": 9026 }, { "epoch": 1.84, "learning_rate": 0.0002133444202074899, "loss": 0.0035, "step": 9027 }, { "epoch": 1.84, "learning_rate": 0.00021332684765852165, "loss": 0.0203, "step": 9028 }, { "epoch": 1.84, "learning_rate": 0.00021330927405187553, "loss": 0.0111, "step": 9029 }, { "epoch": 1.84, "learning_rate": 0.00021329169938784498, "loss": 0.0109, "step": 9030 }, { "epoch": 1.84, "learning_rate": 0.0002132741236667236, "loss": 0.0238, "step": 9031 }, { "epoch": 1.84, "learning_rate": 0.00021325654688880488, "loss": 0.0136, "step": 9032 }, { "epoch": 1.84, "learning_rate": 0.0002132389690543825, "loss": 0.0401, "step": 9033 }, { "epoch": 1.84, "learning_rate": 0.00021322139016374992, "loss": 0.008, "step": 9034 }, { "epoch": 1.84, "learning_rate": 0.0002132038102172008, "loss": 0.0082, "step": 9035 }, { "epoch": 1.84, "learning_rate": 0.00021318622921502871, "loss": 0.0098, "step": 9036 }, { "epoch": 1.84, "learning_rate": 0.00021316864715752737, "loss": 0.0024, "step": 9037 }, { "epoch": 1.84, "learning_rate": 0.00021315106404499036, "loss": 0.0095, "step": 9038 }, { "epoch": 1.84, "learning_rate": 0.0002131334798777114, "loss": 0.0236, "step": 9039 }, { "epoch": 1.84, "learning_rate": 0.00021311589465598408, "loss": 0.0237, "step": 9040 }, { "epoch": 1.84, "learning_rate": 0.00021309830838010224, "loss": 0.0436, "step": 9041 }, { "epoch": 1.84, "learning_rate": 0.0002130807210503595, "loss": 0.0148, "step": 9042 }, { "epoch": 1.84, "learning_rate": 0.0002130631326670497, "loss": 0.0032, "step": 9043 }, { "epoch": 1.84, "learning_rate": 0.0002130455432304665, "loss": 0.0098, "step": 9044 }, { "epoch": 1.84, "learning_rate": 0.00021302795274090374, "loss": 0.0126, "step": 9045 }, { "epoch": 1.84, "learning_rate": 0.00021301036119865518, "loss": 0.0092, "step": 9046 }, { "epoch": 1.84, "learning_rate": 0.00021299276860401467, "loss": 0.0079, "step": 9047 }, { "epoch": 1.84, "learning_rate": 0.00021297517495727603, "loss": 0.02, "step": 9048 }, { "epoch": 1.84, "learning_rate": 0.00021295758025873307, "loss": 0.0076, "step": 9049 }, { "epoch": 1.84, "learning_rate": 0.00021293998450867967, "loss": 0.0159, "step": 9050 }, { "epoch": 1.84, "learning_rate": 0.00021292238770740973, "loss": 0.0145, "step": 9051 }, { "epoch": 1.84, "learning_rate": 0.00021290478985521718, "loss": 0.0074, "step": 9052 }, { "epoch": 1.84, "learning_rate": 0.00021288719095239583, "loss": 0.0164, "step": 9053 }, { "epoch": 1.84, "learning_rate": 0.00021286959099923972, "loss": 0.0227, "step": 9054 }, { "epoch": 1.84, "learning_rate": 0.00021285198999604273, "loss": 0.006, "step": 9055 }, { "epoch": 1.84, "learning_rate": 0.00021283438794309894, "loss": 0.0095, "step": 9056 }, { "epoch": 1.84, "learning_rate": 0.00021281678484070222, "loss": 0.0155, "step": 9057 }, { "epoch": 1.84, "learning_rate": 0.00021279918068914662, "loss": 0.0159, "step": 9058 }, { "epoch": 1.84, "learning_rate": 0.00021278157548872614, "loss": 0.0305, "step": 9059 }, { "epoch": 1.84, "learning_rate": 0.00021276396923973487, "loss": 0.0087, "step": 9060 }, { "epoch": 1.84, "learning_rate": 0.00021274636194246681, "loss": 0.0154, "step": 9061 }, { "epoch": 1.85, "learning_rate": 0.0002127287535972161, "loss": 0.0183, "step": 9062 }, { "epoch": 1.85, "learning_rate": 0.00021271114420427675, "loss": 0.0125, "step": 9063 }, { "epoch": 1.85, "learning_rate": 0.00021269353376394295, "loss": 0.012, "step": 9064 }, { "epoch": 1.85, "learning_rate": 0.00021267592227650878, "loss": 0.0012, "step": 9065 }, { "epoch": 1.85, "learning_rate": 0.00021265830974226844, "loss": 0.0035, "step": 9066 }, { "epoch": 1.85, "learning_rate": 0.00021264069616151602, "loss": 0.0417, "step": 9067 }, { "epoch": 1.85, "learning_rate": 0.00021262308153454572, "loss": 0.007, "step": 9068 }, { "epoch": 1.85, "learning_rate": 0.00021260546586165173, "loss": 0.0118, "step": 9069 }, { "epoch": 1.85, "learning_rate": 0.00021258784914312835, "loss": 0.0115, "step": 9070 }, { "epoch": 1.85, "learning_rate": 0.0002125702313792697, "loss": 0.0114, "step": 9071 }, { "epoch": 1.85, "learning_rate": 0.00021255261257037007, "loss": 0.0044, "step": 9072 }, { "epoch": 1.85, "learning_rate": 0.00021253499271672375, "loss": 0.0061, "step": 9073 }, { "epoch": 1.85, "learning_rate": 0.00021251737181862497, "loss": 0.0171, "step": 9074 }, { "epoch": 1.85, "learning_rate": 0.00021249974987636814, "loss": 0.0057, "step": 9075 }, { "epoch": 1.85, "learning_rate": 0.00021248212689024747, "loss": 0.0201, "step": 9076 }, { "epoch": 1.85, "learning_rate": 0.00021246450286055733, "loss": 0.0071, "step": 9077 }, { "epoch": 1.85, "learning_rate": 0.00021244687778759208, "loss": 0.012, "step": 9078 }, { "epoch": 1.85, "learning_rate": 0.00021242925167164612, "loss": 0.0208, "step": 9079 }, { "epoch": 1.85, "learning_rate": 0.00021241162451301384, "loss": 0.0097, "step": 9080 }, { "epoch": 1.85, "learning_rate": 0.00021239399631198957, "loss": 0.0013, "step": 9081 }, { "epoch": 1.85, "learning_rate": 0.0002123763670688678, "loss": 0.0116, "step": 9082 }, { "epoch": 1.85, "learning_rate": 0.00021235873678394294, "loss": 0.0018, "step": 9083 }, { "epoch": 1.85, "learning_rate": 0.0002123411054575095, "loss": 0.0112, "step": 9084 }, { "epoch": 1.85, "learning_rate": 0.00021232347308986187, "loss": 0.019, "step": 9085 }, { "epoch": 1.85, "learning_rate": 0.00021230583968129464, "loss": 0.0117, "step": 9086 }, { "epoch": 1.85, "learning_rate": 0.0002122882052321023, "loss": 0.016, "step": 9087 }, { "epoch": 1.85, "learning_rate": 0.0002122705697425793, "loss": 0.0406, "step": 9088 }, { "epoch": 1.85, "learning_rate": 0.00021225293321302025, "loss": 0.0194, "step": 9089 }, { "epoch": 1.85, "learning_rate": 0.00021223529564371973, "loss": 0.0097, "step": 9090 }, { "epoch": 1.85, "learning_rate": 0.00021221765703497228, "loss": 0.0338, "step": 9091 }, { "epoch": 1.85, "learning_rate": 0.0002122000173870725, "loss": 0.0161, "step": 9092 }, { "epoch": 1.85, "learning_rate": 0.000212182376700315, "loss": 0.0248, "step": 9093 }, { "epoch": 1.85, "learning_rate": 0.00021216473497499448, "loss": 0.0081, "step": 9094 }, { "epoch": 1.85, "learning_rate": 0.00021214709221140554, "loss": 0.0168, "step": 9095 }, { "epoch": 1.85, "learning_rate": 0.00021212944840984284, "loss": 0.0066, "step": 9096 }, { "epoch": 1.85, "learning_rate": 0.00021211180357060108, "loss": 0.0164, "step": 9097 }, { "epoch": 1.85, "learning_rate": 0.00021209415769397495, "loss": 0.0053, "step": 9098 }, { "epoch": 1.85, "learning_rate": 0.00021207651078025916, "loss": 0.0092, "step": 9099 }, { "epoch": 1.85, "learning_rate": 0.00021205886282974848, "loss": 0.0063, "step": 9100 }, { "epoch": 1.85, "learning_rate": 0.00021204121384273762, "loss": 0.0071, "step": 9101 }, { "epoch": 1.85, "learning_rate": 0.0002120235638195214, "loss": 0.0145, "step": 9102 }, { "epoch": 1.85, "learning_rate": 0.00021200591276039458, "loss": 0.0136, "step": 9103 }, { "epoch": 1.85, "learning_rate": 0.00021198826066565196, "loss": 0.0076, "step": 9104 }, { "epoch": 1.85, "learning_rate": 0.0002119706075355884, "loss": 0.037, "step": 9105 }, { "epoch": 1.85, "learning_rate": 0.0002119529533704987, "loss": 0.0168, "step": 9106 }, { "epoch": 1.85, "learning_rate": 0.00021193529817067777, "loss": 0.0275, "step": 9107 }, { "epoch": 1.85, "learning_rate": 0.0002119176419364204, "loss": 0.014, "step": 9108 }, { "epoch": 1.85, "learning_rate": 0.00021189998466802158, "loss": 0.0066, "step": 9109 }, { "epoch": 1.85, "learning_rate": 0.00021188232636577614, "loss": 0.0044, "step": 9110 }, { "epoch": 1.86, "learning_rate": 0.00021186466702997905, "loss": 0.006, "step": 9111 }, { "epoch": 1.86, "learning_rate": 0.00021184700666092526, "loss": 0.0098, "step": 9112 }, { "epoch": 1.86, "learning_rate": 0.0002118293452589097, "loss": 0.0099, "step": 9113 }, { "epoch": 1.86, "learning_rate": 0.0002118116828242273, "loss": 0.007, "step": 9114 }, { "epoch": 1.86, "learning_rate": 0.00021179401935717316, "loss": 0.0237, "step": 9115 }, { "epoch": 1.86, "learning_rate": 0.00021177635485804226, "loss": 0.0173, "step": 9116 }, { "epoch": 1.86, "learning_rate": 0.00021175868932712968, "loss": 0.0095, "step": 9117 }, { "epoch": 1.86, "learning_rate": 0.00021174102276473036, "loss": 0.0081, "step": 9118 }, { "epoch": 1.86, "learning_rate": 0.00021172335517113936, "loss": 0.0096, "step": 9119 }, { "epoch": 1.86, "learning_rate": 0.00021170568654665188, "loss": 0.017, "step": 9120 }, { "epoch": 1.86, "learning_rate": 0.000211688016891563, "loss": 0.0207, "step": 9121 }, { "epoch": 1.86, "learning_rate": 0.00021167034620616772, "loss": 0.012, "step": 9122 }, { "epoch": 1.86, "learning_rate": 0.00021165267449076128, "loss": 0.0028, "step": 9123 }, { "epoch": 1.86, "learning_rate": 0.0002116350017456388, "loss": 0.0024, "step": 9124 }, { "epoch": 1.86, "learning_rate": 0.0002116173279710954, "loss": 0.025, "step": 9125 }, { "epoch": 1.86, "learning_rate": 0.00021159965316742632, "loss": 0.008, "step": 9126 }, { "epoch": 1.86, "learning_rate": 0.0002115819773349268, "loss": 0.0104, "step": 9127 }, { "epoch": 1.86, "learning_rate": 0.000211564300473892, "loss": 0.0416, "step": 9128 }, { "epoch": 1.86, "learning_rate": 0.00021154662258461717, "loss": 0.0072, "step": 9129 }, { "epoch": 1.86, "learning_rate": 0.00021152894366739753, "loss": 0.006, "step": 9130 }, { "epoch": 1.86, "learning_rate": 0.00021151126372252846, "loss": 0.0106, "step": 9131 }, { "epoch": 1.86, "learning_rate": 0.0002114935827503051, "loss": 0.0091, "step": 9132 }, { "epoch": 1.86, "learning_rate": 0.00021147590075102287, "loss": 0.0225, "step": 9133 }, { "epoch": 1.86, "learning_rate": 0.00021145821772497705, "loss": 0.0034, "step": 9134 }, { "epoch": 1.86, "learning_rate": 0.00021144053367246296, "loss": 0.0215, "step": 9135 }, { "epoch": 1.86, "learning_rate": 0.00021142284859377601, "loss": 0.0106, "step": 9136 }, { "epoch": 1.86, "learning_rate": 0.00021140516248921153, "loss": 0.0262, "step": 9137 }, { "epoch": 1.86, "learning_rate": 0.00021138747535906494, "loss": 0.0144, "step": 9138 }, { "epoch": 1.86, "learning_rate": 0.00021136978720363161, "loss": 0.0186, "step": 9139 }, { "epoch": 1.86, "learning_rate": 0.00021135209802320706, "loss": 0.0064, "step": 9140 }, { "epoch": 1.86, "learning_rate": 0.00021133440781808657, "loss": 0.0106, "step": 9141 }, { "epoch": 1.86, "learning_rate": 0.00021131671658856574, "loss": 0.0055, "step": 9142 }, { "epoch": 1.86, "learning_rate": 0.00021129902433493999, "loss": 0.0265, "step": 9143 }, { "epoch": 1.86, "learning_rate": 0.0002112813310575048, "loss": 0.0075, "step": 9144 }, { "epoch": 1.86, "learning_rate": 0.00021126363675655574, "loss": 0.0236, "step": 9145 }, { "epoch": 1.86, "learning_rate": 0.0002112459414323883, "loss": 0.0096, "step": 9146 }, { "epoch": 1.86, "learning_rate": 0.00021122824508529802, "loss": 0.0055, "step": 9147 }, { "epoch": 1.86, "learning_rate": 0.00021121054771558047, "loss": 0.0107, "step": 9148 }, { "epoch": 1.86, "learning_rate": 0.00021119284932353123, "loss": 0.0255, "step": 9149 }, { "epoch": 1.86, "learning_rate": 0.00021117514990944588, "loss": 0.0063, "step": 9150 }, { "epoch": 1.86, "learning_rate": 0.00021115744947362006, "loss": 0.0032, "step": 9151 }, { "epoch": 1.86, "learning_rate": 0.00021113974801634944, "loss": 0.0083, "step": 9152 }, { "epoch": 1.86, "learning_rate": 0.00021112204553792955, "loss": 0.0254, "step": 9153 }, { "epoch": 1.86, "learning_rate": 0.00021110434203865618, "loss": 0.0044, "step": 9154 }, { "epoch": 1.86, "learning_rate": 0.0002110866375188249, "loss": 0.035, "step": 9155 }, { "epoch": 1.86, "learning_rate": 0.00021106893197873149, "loss": 0.0078, "step": 9156 }, { "epoch": 1.86, "learning_rate": 0.00021105122541867163, "loss": 0.0028, "step": 9157 }, { "epoch": 1.86, "learning_rate": 0.0002110335178389411, "loss": 0.0194, "step": 9158 }, { "epoch": 1.86, "learning_rate": 0.00021101580923983557, "loss": 0.0054, "step": 9159 }, { "epoch": 1.87, "learning_rate": 0.00021099809962165088, "loss": 0.0106, "step": 9160 }, { "epoch": 1.87, "learning_rate": 0.00021098038898468275, "loss": 0.0063, "step": 9161 }, { "epoch": 1.87, "learning_rate": 0.00021096267732922705, "loss": 0.0076, "step": 9162 }, { "epoch": 1.87, "learning_rate": 0.00021094496465557958, "loss": 0.0372, "step": 9163 }, { "epoch": 1.87, "learning_rate": 0.0002109272509640361, "loss": 0.0254, "step": 9164 }, { "epoch": 1.87, "learning_rate": 0.00021090953625489255, "loss": 0.0028, "step": 9165 }, { "epoch": 1.87, "learning_rate": 0.00021089182052844477, "loss": 0.0054, "step": 9166 }, { "epoch": 1.87, "learning_rate": 0.0002108741037849886, "loss": 0.008, "step": 9167 }, { "epoch": 1.87, "learning_rate": 0.00021085638602482006, "loss": 0.0097, "step": 9168 }, { "epoch": 1.87, "learning_rate": 0.000210838667248235, "loss": 0.0275, "step": 9169 }, { "epoch": 1.87, "learning_rate": 0.0002108209474555293, "loss": 0.0137, "step": 9170 }, { "epoch": 1.87, "learning_rate": 0.00021080322664699901, "loss": 0.0045, "step": 9171 }, { "epoch": 1.87, "learning_rate": 0.00021078550482294008, "loss": 0.0265, "step": 9172 }, { "epoch": 1.87, "learning_rate": 0.00021076778198364843, "loss": 0.0174, "step": 9173 }, { "epoch": 1.87, "learning_rate": 0.0002107500581294201, "loss": 0.0099, "step": 9174 }, { "epoch": 1.87, "learning_rate": 0.00021073233326055117, "loss": 0.0112, "step": 9175 }, { "epoch": 1.87, "learning_rate": 0.0002107146073773376, "loss": 0.0156, "step": 9176 }, { "epoch": 1.87, "learning_rate": 0.0002106968804800755, "loss": 0.0065, "step": 9177 }, { "epoch": 1.87, "learning_rate": 0.00021067915256906095, "loss": 0.0146, "step": 9178 }, { "epoch": 1.87, "learning_rate": 0.00021066142364458998, "loss": 0.0099, "step": 9179 }, { "epoch": 1.87, "learning_rate": 0.0002106436937069587, "loss": 0.0183, "step": 9180 }, { "epoch": 1.87, "learning_rate": 0.00021062596275646332, "loss": 0.0084, "step": 9181 }, { "epoch": 1.87, "learning_rate": 0.00021060823079339992, "loss": 0.0042, "step": 9182 }, { "epoch": 1.87, "learning_rate": 0.0002105904978180646, "loss": 0.0081, "step": 9183 }, { "epoch": 1.87, "learning_rate": 0.00021057276383075363, "loss": 0.0025, "step": 9184 }, { "epoch": 1.87, "learning_rate": 0.0002105550288317632, "loss": 0.0051, "step": 9185 }, { "epoch": 1.87, "learning_rate": 0.00021053729282138943, "loss": 0.0618, "step": 9186 }, { "epoch": 1.87, "learning_rate": 0.0002105195557999286, "loss": 0.0158, "step": 9187 }, { "epoch": 1.87, "learning_rate": 0.00021050181776767696, "loss": 0.0116, "step": 9188 }, { "epoch": 1.87, "learning_rate": 0.00021048407872493075, "loss": 0.0077, "step": 9189 }, { "epoch": 1.87, "learning_rate": 0.0002104663386719863, "loss": 0.0075, "step": 9190 }, { "epoch": 1.87, "learning_rate": 0.00021044859760913982, "loss": 0.0155, "step": 9191 }, { "epoch": 1.87, "learning_rate": 0.00021043085553668764, "loss": 0.0338, "step": 9192 }, { "epoch": 1.87, "learning_rate": 0.0002104131124549261, "loss": 0.0086, "step": 9193 }, { "epoch": 1.87, "learning_rate": 0.0002103953683641516, "loss": 0.0255, "step": 9194 }, { "epoch": 1.87, "learning_rate": 0.00021037762326466043, "loss": 0.0167, "step": 9195 }, { "epoch": 1.87, "learning_rate": 0.00021035987715674895, "loss": 0.0264, "step": 9196 }, { "epoch": 1.87, "learning_rate": 0.00021034213004071355, "loss": 0.0124, "step": 9197 }, { "epoch": 1.87, "learning_rate": 0.0002103243819168507, "loss": 0.0162, "step": 9198 }, { "epoch": 1.87, "learning_rate": 0.00021030663278545685, "loss": 0.0124, "step": 9199 }, { "epoch": 1.87, "learning_rate": 0.00021028888264682834, "loss": 0.0098, "step": 9200 }, { "epoch": 1.87, "learning_rate": 0.00021027113150126172, "loss": 0.0055, "step": 9201 }, { "epoch": 1.87, "learning_rate": 0.00021025337934905343, "loss": 0.0069, "step": 9202 }, { "epoch": 1.87, "learning_rate": 0.00021023562619049997, "loss": 0.0204, "step": 9203 }, { "epoch": 1.87, "learning_rate": 0.00021021787202589782, "loss": 0.023, "step": 9204 }, { "epoch": 1.87, "learning_rate": 0.0002102001168555436, "loss": 0.0175, "step": 9205 }, { "epoch": 1.87, "learning_rate": 0.00021018236067973375, "loss": 0.0065, "step": 9206 }, { "epoch": 1.87, "learning_rate": 0.00021016460349876487, "loss": 0.0102, "step": 9207 }, { "epoch": 1.87, "learning_rate": 0.0002101468453129335, "loss": 0.0035, "step": 9208 }, { "epoch": 1.88, "learning_rate": 0.00021012908612253638, "loss": 0.0054, "step": 9209 }, { "epoch": 1.88, "learning_rate": 0.00021011132592786995, "loss": 0.0168, "step": 9210 }, { "epoch": 1.88, "learning_rate": 0.00021009356472923092, "loss": 0.0085, "step": 9211 }, { "epoch": 1.88, "learning_rate": 0.00021007580252691596, "loss": 0.0233, "step": 9212 }, { "epoch": 1.88, "learning_rate": 0.00021005803932122163, "loss": 0.0105, "step": 9213 }, { "epoch": 1.88, "learning_rate": 0.00021004027511244475, "loss": 0.0065, "step": 9214 }, { "epoch": 1.88, "learning_rate": 0.0002100225099008819, "loss": 0.0174, "step": 9215 }, { "epoch": 1.88, "learning_rate": 0.00021000474368682985, "loss": 0.0126, "step": 9216 }, { "epoch": 1.88, "learning_rate": 0.0002099869764705853, "loss": 0.0092, "step": 9217 }, { "epoch": 1.88, "learning_rate": 0.00020996920825244497, "loss": 0.0087, "step": 9218 }, { "epoch": 1.88, "learning_rate": 0.00020995143903270575, "loss": 0.0111, "step": 9219 }, { "epoch": 1.88, "learning_rate": 0.0002099336688116643, "loss": 0.0343, "step": 9220 }, { "epoch": 1.88, "learning_rate": 0.0002099158975896174, "loss": 0.0128, "step": 9221 }, { "epoch": 1.88, "learning_rate": 0.0002098981253668619, "loss": 0.0089, "step": 9222 }, { "epoch": 1.88, "learning_rate": 0.00020988035214369475, "loss": 0.004, "step": 9223 }, { "epoch": 1.88, "learning_rate": 0.00020986257792041262, "loss": 0.0234, "step": 9224 }, { "epoch": 1.88, "learning_rate": 0.00020984480269731242, "loss": 0.0126, "step": 9225 }, { "epoch": 1.88, "learning_rate": 0.00020982702647469106, "loss": 0.0106, "step": 9226 }, { "epoch": 1.88, "learning_rate": 0.00020980924925284548, "loss": 0.0269, "step": 9227 }, { "epoch": 1.88, "learning_rate": 0.00020979147103207248, "loss": 0.0107, "step": 9228 }, { "epoch": 1.88, "learning_rate": 0.00020977369181266907, "loss": 0.0084, "step": 9229 }, { "epoch": 1.88, "learning_rate": 0.00020975591159493216, "loss": 0.0063, "step": 9230 }, { "epoch": 1.88, "learning_rate": 0.00020973813037915875, "loss": 0.0098, "step": 9231 }, { "epoch": 1.88, "learning_rate": 0.0002097203481656458, "loss": 0.0325, "step": 9232 }, { "epoch": 1.88, "learning_rate": 0.00020970256495469032, "loss": 0.0044, "step": 9233 }, { "epoch": 1.88, "learning_rate": 0.00020968478074658928, "loss": 0.0024, "step": 9234 }, { "epoch": 1.88, "learning_rate": 0.00020966699554163975, "loss": 0.0168, "step": 9235 }, { "epoch": 1.88, "learning_rate": 0.00020964920934013877, "loss": 0.0065, "step": 9236 }, { "epoch": 1.88, "learning_rate": 0.00020963142214238339, "loss": 0.0044, "step": 9237 }, { "epoch": 1.88, "learning_rate": 0.0002096136339486707, "loss": 0.0169, "step": 9238 }, { "epoch": 1.88, "learning_rate": 0.00020959584475929775, "loss": 0.0103, "step": 9239 }, { "epoch": 1.88, "learning_rate": 0.00020957805457456173, "loss": 0.007, "step": 9240 }, { "epoch": 1.88, "learning_rate": 0.00020956026339475974, "loss": 0.0472, "step": 9241 }, { "epoch": 1.88, "learning_rate": 0.00020954247122018896, "loss": 0.0277, "step": 9242 }, { "epoch": 1.88, "learning_rate": 0.00020952467805114647, "loss": 0.0048, "step": 9243 }, { "epoch": 1.88, "learning_rate": 0.00020950688388792952, "loss": 0.0111, "step": 9244 }, { "epoch": 1.88, "learning_rate": 0.00020948908873083527, "loss": 0.0193, "step": 9245 }, { "epoch": 1.88, "learning_rate": 0.00020947129258016097, "loss": 0.0113, "step": 9246 }, { "epoch": 1.88, "learning_rate": 0.00020945349543620382, "loss": 0.0274, "step": 9247 }, { "epoch": 1.88, "learning_rate": 0.00020943569729926103, "loss": 0.0209, "step": 9248 }, { "epoch": 1.88, "learning_rate": 0.00020941789816962992, "loss": 0.011, "step": 9249 }, { "epoch": 1.88, "learning_rate": 0.00020940009804760773, "loss": 0.0041, "step": 9250 }, { "epoch": 1.88, "learning_rate": 0.0002093822969334918, "loss": 0.0214, "step": 9251 }, { "epoch": 1.88, "learning_rate": 0.00020936449482757943, "loss": 0.0506, "step": 9252 }, { "epoch": 1.88, "learning_rate": 0.00020934669173016792, "loss": 0.0219, "step": 9253 }, { "epoch": 1.88, "learning_rate": 0.00020932888764155466, "loss": 0.003, "step": 9254 }, { "epoch": 1.88, "learning_rate": 0.000209311082562037, "loss": 0.0102, "step": 9255 }, { "epoch": 1.88, "learning_rate": 0.00020929327649191223, "loss": 0.0061, "step": 9256 }, { "epoch": 1.88, "learning_rate": 0.00020927546943147788, "loss": 0.0229, "step": 9257 }, { "epoch": 1.89, "learning_rate": 0.00020925766138103126, "loss": 0.0056, "step": 9258 }, { "epoch": 1.89, "learning_rate": 0.00020923985234086987, "loss": 0.0073, "step": 9259 }, { "epoch": 1.89, "learning_rate": 0.0002092220423112911, "loss": 0.0061, "step": 9260 }, { "epoch": 1.89, "learning_rate": 0.00020920423129259242, "loss": 0.0026, "step": 9261 }, { "epoch": 1.89, "learning_rate": 0.00020918641928507136, "loss": 0.01, "step": 9262 }, { "epoch": 1.89, "learning_rate": 0.00020916860628902536, "loss": 0.0077, "step": 9263 }, { "epoch": 1.89, "learning_rate": 0.00020915079230475193, "loss": 0.0041, "step": 9264 }, { "epoch": 1.89, "learning_rate": 0.00020913297733254866, "loss": 0.0034, "step": 9265 }, { "epoch": 1.89, "learning_rate": 0.00020911516137271302, "loss": 0.0249, "step": 9266 }, { "epoch": 1.89, "learning_rate": 0.0002090973444255426, "loss": 0.0148, "step": 9267 }, { "epoch": 1.89, "learning_rate": 0.00020907952649133497, "loss": 0.0169, "step": 9268 }, { "epoch": 1.89, "learning_rate": 0.0002090617075703877, "loss": 0.0236, "step": 9269 }, { "epoch": 1.89, "learning_rate": 0.00020904388766299846, "loss": 0.0217, "step": 9270 }, { "epoch": 1.89, "learning_rate": 0.00020902606676946484, "loss": 0.0181, "step": 9271 }, { "epoch": 1.89, "learning_rate": 0.00020900824489008448, "loss": 0.0289, "step": 9272 }, { "epoch": 1.89, "learning_rate": 0.00020899042202515505, "loss": 0.0054, "step": 9273 }, { "epoch": 1.89, "learning_rate": 0.0002089725981749742, "loss": 0.0193, "step": 9274 }, { "epoch": 1.89, "learning_rate": 0.00020895477333983967, "loss": 0.0115, "step": 9275 }, { "epoch": 1.89, "learning_rate": 0.00020893694752004914, "loss": 0.0223, "step": 9276 }, { "epoch": 1.89, "learning_rate": 0.0002089191207159003, "loss": 0.0239, "step": 9277 }, { "epoch": 1.89, "learning_rate": 0.00020890129292769097, "loss": 0.0017, "step": 9278 }, { "epoch": 1.89, "learning_rate": 0.00020888346415571884, "loss": 0.0015, "step": 9279 }, { "epoch": 1.89, "learning_rate": 0.0002088656344002817, "loss": 0.0157, "step": 9280 }, { "epoch": 1.89, "learning_rate": 0.00020884780366167734, "loss": 0.0055, "step": 9281 }, { "epoch": 1.89, "learning_rate": 0.00020882997194020362, "loss": 0.017, "step": 9282 }, { "epoch": 1.89, "learning_rate": 0.0002088121392361583, "loss": 0.0221, "step": 9283 }, { "epoch": 1.89, "learning_rate": 0.00020879430554983922, "loss": 0.0175, "step": 9284 }, { "epoch": 1.89, "learning_rate": 0.0002087764708815443, "loss": 0.0208, "step": 9285 }, { "epoch": 1.89, "learning_rate": 0.0002087586352315713, "loss": 0.0104, "step": 9286 }, { "epoch": 1.89, "learning_rate": 0.00020874079860021822, "loss": 0.0112, "step": 9287 }, { "epoch": 1.89, "learning_rate": 0.00020872296098778295, "loss": 0.0122, "step": 9288 }, { "epoch": 1.89, "learning_rate": 0.00020870512239456337, "loss": 0.0102, "step": 9289 }, { "epoch": 1.89, "learning_rate": 0.00020868728282085738, "loss": 0.0112, "step": 9290 }, { "epoch": 1.89, "learning_rate": 0.00020866944226696302, "loss": 0.0339, "step": 9291 }, { "epoch": 1.89, "learning_rate": 0.00020865160073317823, "loss": 0.0242, "step": 9292 }, { "epoch": 1.89, "learning_rate": 0.000208633758219801, "loss": 0.0041, "step": 9293 }, { "epoch": 1.89, "learning_rate": 0.0002086159147271293, "loss": 0.0261, "step": 9294 }, { "epoch": 1.89, "learning_rate": 0.0002085980702554612, "loss": 0.018, "step": 9295 }, { "epoch": 1.89, "learning_rate": 0.0002085802248050947, "loss": 0.0145, "step": 9296 }, { "epoch": 1.89, "learning_rate": 0.0002085623783763279, "loss": 0.0065, "step": 9297 }, { "epoch": 1.89, "learning_rate": 0.00020854453096945882, "loss": 0.0109, "step": 9298 }, { "epoch": 1.89, "learning_rate": 0.00020852668258478557, "loss": 0.0243, "step": 9299 }, { "epoch": 1.89, "learning_rate": 0.00020850883322260624, "loss": 0.0172, "step": 9300 }, { "epoch": 1.89, "learning_rate": 0.0002084909828832189, "loss": 0.0096, "step": 9301 }, { "epoch": 1.89, "learning_rate": 0.0002084731315669218, "loss": 0.0119, "step": 9302 }, { "epoch": 1.89, "learning_rate": 0.000208455279274013, "loss": 0.0187, "step": 9303 }, { "epoch": 1.89, "learning_rate": 0.0002084374260047907, "loss": 0.0091, "step": 9304 }, { "epoch": 1.89, "learning_rate": 0.0002084195717595531, "loss": 0.0141, "step": 9305 }, { "epoch": 1.89, "learning_rate": 0.00020840171653859838, "loss": 0.0262, "step": 9306 }, { "epoch": 1.9, "learning_rate": 0.00020838386034222474, "loss": 0.0277, "step": 9307 }, { "epoch": 1.9, "learning_rate": 0.0002083660031707304, "loss": 0.0048, "step": 9308 }, { "epoch": 1.9, "learning_rate": 0.00020834814502441364, "loss": 0.0253, "step": 9309 }, { "epoch": 1.9, "learning_rate": 0.00020833028590357274, "loss": 0.0189, "step": 9310 }, { "epoch": 1.9, "learning_rate": 0.00020831242580850593, "loss": 0.0334, "step": 9311 }, { "epoch": 1.9, "learning_rate": 0.00020829456473951154, "loss": 0.0206, "step": 9312 }, { "epoch": 1.9, "learning_rate": 0.00020827670269688787, "loss": 0.014, "step": 9313 }, { "epoch": 1.9, "learning_rate": 0.0002082588396809333, "loss": 0.0177, "step": 9314 }, { "epoch": 1.9, "learning_rate": 0.00020824097569194613, "loss": 0.0144, "step": 9315 }, { "epoch": 1.9, "learning_rate": 0.00020822311073022474, "loss": 0.0078, "step": 9316 }, { "epoch": 1.9, "learning_rate": 0.0002082052447960675, "loss": 0.0032, "step": 9317 }, { "epoch": 1.9, "learning_rate": 0.00020818737788977275, "loss": 0.0057, "step": 9318 }, { "epoch": 1.9, "learning_rate": 0.00020816951001163895, "loss": 0.0133, "step": 9319 }, { "epoch": 1.9, "learning_rate": 0.0002081516411619646, "loss": 0.0171, "step": 9320 }, { "epoch": 1.9, "learning_rate": 0.00020813377134104802, "loss": 0.0079, "step": 9321 }, { "epoch": 1.9, "learning_rate": 0.0002081159005491877, "loss": 0.0097, "step": 9322 }, { "epoch": 1.9, "learning_rate": 0.00020809802878668217, "loss": 0.0047, "step": 9323 }, { "epoch": 1.9, "learning_rate": 0.0002080801560538299, "loss": 0.0063, "step": 9324 }, { "epoch": 1.9, "learning_rate": 0.00020806228235092944, "loss": 0.0362, "step": 9325 }, { "epoch": 1.9, "learning_rate": 0.00020804440767827919, "loss": 0.0058, "step": 9326 }, { "epoch": 1.9, "learning_rate": 0.00020802653203617777, "loss": 0.0112, "step": 9327 }, { "epoch": 1.9, "learning_rate": 0.00020800865542492373, "loss": 0.0068, "step": 9328 }, { "epoch": 1.9, "learning_rate": 0.0002079907778448157, "loss": 0.0142, "step": 9329 }, { "epoch": 1.9, "learning_rate": 0.00020797289929615217, "loss": 0.0048, "step": 9330 }, { "epoch": 1.9, "learning_rate": 0.0002079550197792318, "loss": 0.0035, "step": 9331 }, { "epoch": 1.9, "learning_rate": 0.0002079371392943532, "loss": 0.0065, "step": 9332 }, { "epoch": 1.9, "learning_rate": 0.000207919257841815, "loss": 0.0062, "step": 9333 }, { "epoch": 1.9, "learning_rate": 0.00020790137542191589, "loss": 0.0122, "step": 9334 }, { "epoch": 1.9, "learning_rate": 0.00020788349203495446, "loss": 0.0281, "step": 9335 }, { "epoch": 1.9, "learning_rate": 0.0002078656076812295, "loss": 0.0107, "step": 9336 }, { "epoch": 1.9, "learning_rate": 0.00020784772236103963, "loss": 0.0127, "step": 9337 }, { "epoch": 1.9, "learning_rate": 0.00020782983607468367, "loss": 0.0045, "step": 9338 }, { "epoch": 1.9, "learning_rate": 0.0002078119488224602, "loss": 0.0105, "step": 9339 }, { "epoch": 1.9, "learning_rate": 0.00020779406060466812, "loss": 0.0067, "step": 9340 }, { "epoch": 1.9, "learning_rate": 0.0002077761714216061, "loss": 0.0322, "step": 9341 }, { "epoch": 1.9, "learning_rate": 0.00020775828127357298, "loss": 0.0082, "step": 9342 }, { "epoch": 1.9, "learning_rate": 0.0002077403901608675, "loss": 0.0135, "step": 9343 }, { "epoch": 1.9, "learning_rate": 0.00020772249808378854, "loss": 0.0074, "step": 9344 }, { "epoch": 1.9, "learning_rate": 0.0002077046050426349, "loss": 0.0148, "step": 9345 }, { "epoch": 1.9, "learning_rate": 0.00020768671103770542, "loss": 0.0204, "step": 9346 }, { "epoch": 1.9, "learning_rate": 0.000207668816069299, "loss": 0.0253, "step": 9347 }, { "epoch": 1.9, "learning_rate": 0.00020765092013771448, "loss": 0.0022, "step": 9348 }, { "epoch": 1.9, "learning_rate": 0.00020763302324325078, "loss": 0.0095, "step": 9349 }, { "epoch": 1.9, "learning_rate": 0.00020761512538620676, "loss": 0.0079, "step": 9350 }, { "epoch": 1.9, "learning_rate": 0.0002075972265668814, "loss": 0.0383, "step": 9351 }, { "epoch": 1.9, "learning_rate": 0.00020757932678557367, "loss": 0.0173, "step": 9352 }, { "epoch": 1.9, "learning_rate": 0.00020756142604258247, "loss": 0.0104, "step": 9353 }, { "epoch": 1.9, "learning_rate": 0.00020754352433820678, "loss": 0.0117, "step": 9354 }, { "epoch": 1.9, "learning_rate": 0.00020752562167274563, "loss": 0.0085, "step": 9355 }, { "epoch": 1.91, "learning_rate": 0.00020750771804649802, "loss": 0.032, "step": 9356 }, { "epoch": 1.91, "learning_rate": 0.000207489813459763, "loss": 0.0186, "step": 9357 }, { "epoch": 1.91, "learning_rate": 0.00020747190791283953, "loss": 0.0175, "step": 9358 }, { "epoch": 1.91, "learning_rate": 0.0002074540014060267, "loss": 0.0325, "step": 9359 }, { "epoch": 1.91, "learning_rate": 0.00020743609393962363, "loss": 0.0191, "step": 9360 }, { "epoch": 1.91, "learning_rate": 0.00020741818551392937, "loss": 0.0123, "step": 9361 }, { "epoch": 1.91, "learning_rate": 0.00020740027612924303, "loss": 0.0475, "step": 9362 }, { "epoch": 1.91, "learning_rate": 0.00020738236578586366, "loss": 0.0389, "step": 9363 }, { "epoch": 1.91, "learning_rate": 0.0002073644544840905, "loss": 0.01, "step": 9364 }, { "epoch": 1.91, "learning_rate": 0.00020734654222422268, "loss": 0.0204, "step": 9365 }, { "epoch": 1.91, "learning_rate": 0.0002073286290065594, "loss": 0.0133, "step": 9366 }, { "epoch": 1.91, "learning_rate": 0.00020731071483139977, "loss": 0.0074, "step": 9367 }, { "epoch": 1.91, "learning_rate": 0.000207292799699043, "loss": 0.0052, "step": 9368 }, { "epoch": 1.91, "learning_rate": 0.00020727488360978833, "loss": 0.0316, "step": 9369 }, { "epoch": 1.91, "learning_rate": 0.000207256966563935, "loss": 0.0246, "step": 9370 }, { "epoch": 1.91, "learning_rate": 0.00020723904856178227, "loss": 0.0372, "step": 9371 }, { "epoch": 1.91, "learning_rate": 0.00020722112960362937, "loss": 0.0028, "step": 9372 }, { "epoch": 1.91, "learning_rate": 0.00020720320968977557, "loss": 0.0037, "step": 9373 }, { "epoch": 1.91, "learning_rate": 0.0002071852888205202, "loss": 0.0069, "step": 9374 }, { "epoch": 1.91, "learning_rate": 0.0002071673669961625, "loss": 0.0113, "step": 9375 }, { "epoch": 1.91, "learning_rate": 0.000207149444217002, "loss": 0.0139, "step": 9376 }, { "epoch": 1.91, "learning_rate": 0.0002071315204833378, "loss": 0.0112, "step": 9377 }, { "epoch": 1.91, "learning_rate": 0.0002071135957954694, "loss": 0.0056, "step": 9378 }, { "epoch": 1.91, "learning_rate": 0.00020709567015369612, "loss": 0.0085, "step": 9379 }, { "epoch": 1.91, "learning_rate": 0.0002070777435583174, "loss": 0.0037, "step": 9380 }, { "epoch": 1.91, "learning_rate": 0.0002070598160096326, "loss": 0.0051, "step": 9381 }, { "epoch": 1.91, "learning_rate": 0.00020704188750794117, "loss": 0.0079, "step": 9382 }, { "epoch": 1.91, "learning_rate": 0.00020702395805354256, "loss": 0.012, "step": 9383 }, { "epoch": 1.91, "learning_rate": 0.00020700602764673617, "loss": 0.0048, "step": 9384 }, { "epoch": 1.91, "learning_rate": 0.00020698809628782154, "loss": 0.0136, "step": 9385 }, { "epoch": 1.91, "learning_rate": 0.00020697016397709813, "loss": 0.0076, "step": 9386 }, { "epoch": 1.91, "learning_rate": 0.00020695223071486542, "loss": 0.0166, "step": 9387 }, { "epoch": 1.91, "learning_rate": 0.00020693429650142298, "loss": 0.0067, "step": 9388 }, { "epoch": 1.91, "learning_rate": 0.0002069163613370703, "loss": 0.0296, "step": 9389 }, { "epoch": 1.91, "learning_rate": 0.000206898425222107, "loss": 0.0093, "step": 9390 }, { "epoch": 1.91, "learning_rate": 0.00020688048815683253, "loss": 0.02, "step": 9391 }, { "epoch": 1.91, "learning_rate": 0.0002068625501415466, "loss": 0.016, "step": 9392 }, { "epoch": 1.91, "learning_rate": 0.0002068446111765487, "loss": 0.0064, "step": 9393 }, { "epoch": 1.91, "learning_rate": 0.00020682667126213847, "loss": 0.0103, "step": 9394 }, { "epoch": 1.91, "learning_rate": 0.0002068087303986156, "loss": 0.008, "step": 9395 }, { "epoch": 1.91, "learning_rate": 0.00020679078858627965, "loss": 0.0401, "step": 9396 }, { "epoch": 1.91, "learning_rate": 0.0002067728458254304, "loss": 0.0089, "step": 9397 }, { "epoch": 1.91, "learning_rate": 0.00020675490211636744, "loss": 0.0165, "step": 9398 }, { "epoch": 1.91, "learning_rate": 0.00020673695745939048, "loss": 0.0076, "step": 9399 }, { "epoch": 1.91, "learning_rate": 0.0002067190118547992, "loss": 0.0134, "step": 9400 }, { "epoch": 1.91, "learning_rate": 0.0002067010653028934, "loss": 0.0065, "step": 9401 }, { "epoch": 1.91, "learning_rate": 0.00020668311780397273, "loss": 0.0251, "step": 9402 }, { "epoch": 1.91, "learning_rate": 0.00020666516935833706, "loss": 0.0135, "step": 9403 }, { "epoch": 1.91, "learning_rate": 0.00020664721996628606, "loss": 0.0125, "step": 9404 }, { "epoch": 1.92, "learning_rate": 0.00020662926962811953, "loss": 0.0176, "step": 9405 }, { "epoch": 1.92, "learning_rate": 0.00020661131834413734, "loss": 0.0219, "step": 9406 }, { "epoch": 1.92, "learning_rate": 0.00020659336611463923, "loss": 0.0149, "step": 9407 }, { "epoch": 1.92, "learning_rate": 0.00020657541293992517, "loss": 0.024, "step": 9408 }, { "epoch": 1.92, "learning_rate": 0.00020655745882029486, "loss": 0.0178, "step": 9409 }, { "epoch": 1.92, "learning_rate": 0.0002065395037560482, "loss": 0.0141, "step": 9410 }, { "epoch": 1.92, "learning_rate": 0.00020652154774748513, "loss": 0.0078, "step": 9411 }, { "epoch": 1.92, "learning_rate": 0.00020650359079490554, "loss": 0.0024, "step": 9412 }, { "epoch": 1.92, "learning_rate": 0.00020648563289860932, "loss": 0.0183, "step": 9413 }, { "epoch": 1.92, "learning_rate": 0.0002064676740588964, "loss": 0.0118, "step": 9414 }, { "epoch": 1.92, "learning_rate": 0.00020644971427606672, "loss": 0.0107, "step": 9415 }, { "epoch": 1.92, "learning_rate": 0.00020643175355042023, "loss": 0.0084, "step": 9416 }, { "epoch": 1.92, "learning_rate": 0.000206413791882257, "loss": 0.0236, "step": 9417 }, { "epoch": 1.92, "learning_rate": 0.0002063958292718769, "loss": 0.0099, "step": 9418 }, { "epoch": 1.92, "learning_rate": 0.00020637786571958003, "loss": 0.0077, "step": 9419 }, { "epoch": 1.92, "learning_rate": 0.00020635990122566637, "loss": 0.0173, "step": 9420 }, { "epoch": 1.92, "learning_rate": 0.00020634193579043594, "loss": 0.0084, "step": 9421 }, { "epoch": 1.92, "learning_rate": 0.0002063239694141889, "loss": 0.0101, "step": 9422 }, { "epoch": 1.92, "learning_rate": 0.0002063060020972252, "loss": 0.0086, "step": 9423 }, { "epoch": 1.92, "learning_rate": 0.00020628803383984502, "loss": 0.0009, "step": 9424 }, { "epoch": 1.92, "learning_rate": 0.00020627006464234837, "loss": 0.0113, "step": 9425 }, { "epoch": 1.92, "learning_rate": 0.00020625209450503545, "loss": 0.0129, "step": 9426 }, { "epoch": 1.92, "learning_rate": 0.0002062341234282064, "loss": 0.0064, "step": 9427 }, { "epoch": 1.92, "learning_rate": 0.0002062161514121613, "loss": 0.0139, "step": 9428 }, { "epoch": 1.92, "learning_rate": 0.00020619817845720035, "loss": 0.0123, "step": 9429 }, { "epoch": 1.92, "learning_rate": 0.00020618020456362375, "loss": 0.0016, "step": 9430 }, { "epoch": 1.92, "learning_rate": 0.0002061622297317317, "loss": 0.0099, "step": 9431 }, { "epoch": 1.92, "learning_rate": 0.0002061442539618244, "loss": 0.005, "step": 9432 }, { "epoch": 1.92, "learning_rate": 0.00020612627725420207, "loss": 0.0077, "step": 9433 }, { "epoch": 1.92, "learning_rate": 0.00020610829960916496, "loss": 0.0202, "step": 9434 }, { "epoch": 1.92, "learning_rate": 0.00020609032102701335, "loss": 0.0258, "step": 9435 }, { "epoch": 1.92, "learning_rate": 0.00020607234150804747, "loss": 0.0093, "step": 9436 }, { "epoch": 1.92, "learning_rate": 0.00020605436105256767, "loss": 0.0157, "step": 9437 }, { "epoch": 1.92, "learning_rate": 0.00020603637966087418, "loss": 0.0055, "step": 9438 }, { "epoch": 1.92, "learning_rate": 0.00020601839733326742, "loss": 0.0057, "step": 9439 }, { "epoch": 1.92, "learning_rate": 0.00020600041407004772, "loss": 0.0124, "step": 9440 }, { "epoch": 1.92, "learning_rate": 0.00020598242987151534, "loss": 0.0056, "step": 9441 }, { "epoch": 1.92, "learning_rate": 0.00020596444473797073, "loss": 0.0181, "step": 9442 }, { "epoch": 1.92, "learning_rate": 0.00020594645866971423, "loss": 0.0213, "step": 9443 }, { "epoch": 1.92, "learning_rate": 0.0002059284716670463, "loss": 0.0028, "step": 9444 }, { "epoch": 1.92, "learning_rate": 0.0002059104837302673, "loss": 0.0164, "step": 9445 }, { "epoch": 1.92, "learning_rate": 0.00020589249485967765, "loss": 0.0072, "step": 9446 }, { "epoch": 1.92, "learning_rate": 0.00020587450505557789, "loss": 0.0162, "step": 9447 }, { "epoch": 1.92, "learning_rate": 0.00020585651431826837, "loss": 0.0284, "step": 9448 }, { "epoch": 1.92, "learning_rate": 0.00020583852264804967, "loss": 0.0306, "step": 9449 }, { "epoch": 1.92, "learning_rate": 0.0002058205300452222, "loss": 0.0409, "step": 9450 }, { "epoch": 1.92, "learning_rate": 0.00020580253651008654, "loss": 0.0044, "step": 9451 }, { "epoch": 1.92, "learning_rate": 0.0002057845420429432, "loss": 0.0157, "step": 9452 }, { "epoch": 1.92, "learning_rate": 0.00020576654664409267, "loss": 0.0097, "step": 9453 }, { "epoch": 1.93, "learning_rate": 0.00020574855031383555, "loss": 0.0046, "step": 9454 }, { "epoch": 1.93, "learning_rate": 0.00020573055305247241, "loss": 0.0188, "step": 9455 }, { "epoch": 1.93, "learning_rate": 0.00020571255486030385, "loss": 0.0323, "step": 9456 }, { "epoch": 1.93, "learning_rate": 0.00020569455573763045, "loss": 0.0061, "step": 9457 }, { "epoch": 1.93, "learning_rate": 0.0002056765556847528, "loss": 0.0137, "step": 9458 }, { "epoch": 1.93, "learning_rate": 0.0002056585547019716, "loss": 0.0138, "step": 9459 }, { "epoch": 1.93, "learning_rate": 0.00020564055278958753, "loss": 0.0066, "step": 9460 }, { "epoch": 1.93, "learning_rate": 0.0002056225499479011, "loss": 0.0129, "step": 9461 }, { "epoch": 1.93, "learning_rate": 0.00020560454617721318, "loss": 0.004, "step": 9462 }, { "epoch": 1.93, "learning_rate": 0.00020558654147782434, "loss": 0.0192, "step": 9463 }, { "epoch": 1.93, "learning_rate": 0.00020556853585003534, "loss": 0.04, "step": 9464 }, { "epoch": 1.93, "learning_rate": 0.0002055505292941469, "loss": 0.0155, "step": 9465 }, { "epoch": 1.93, "learning_rate": 0.00020553252181045972, "loss": 0.0217, "step": 9466 }, { "epoch": 1.93, "learning_rate": 0.00020551451339927466, "loss": 0.0076, "step": 9467 }, { "epoch": 1.93, "learning_rate": 0.0002054965040608924, "loss": 0.0171, "step": 9468 }, { "epoch": 1.93, "learning_rate": 0.00020547849379561376, "loss": 0.0044, "step": 9469 }, { "epoch": 1.93, "learning_rate": 0.00020546048260373958, "loss": 0.0077, "step": 9470 }, { "epoch": 1.93, "learning_rate": 0.00020544247048557058, "loss": 0.0058, "step": 9471 }, { "epoch": 1.93, "learning_rate": 0.00020542445744140775, "loss": 0.0054, "step": 9472 }, { "epoch": 1.93, "learning_rate": 0.00020540644347155187, "loss": 0.0056, "step": 9473 }, { "epoch": 1.93, "learning_rate": 0.00020538842857630374, "loss": 0.0193, "step": 9474 }, { "epoch": 1.93, "learning_rate": 0.00020537041275596433, "loss": 0.0406, "step": 9475 }, { "epoch": 1.93, "learning_rate": 0.00020535239601083448, "loss": 0.014, "step": 9476 }, { "epoch": 1.93, "learning_rate": 0.00020533437834121512, "loss": 0.0402, "step": 9477 }, { "epoch": 1.93, "learning_rate": 0.00020531635974740722, "loss": 0.0164, "step": 9478 }, { "epoch": 1.93, "learning_rate": 0.0002052983402297117, "loss": 0.0059, "step": 9479 }, { "epoch": 1.93, "learning_rate": 0.0002052803197884295, "loss": 0.0209, "step": 9480 }, { "epoch": 1.93, "learning_rate": 0.00020526229842386163, "loss": 0.0045, "step": 9481 }, { "epoch": 1.93, "learning_rate": 0.00020524427613630907, "loss": 0.0154, "step": 9482 }, { "epoch": 1.93, "learning_rate": 0.00020522625292607278, "loss": 0.016, "step": 9483 }, { "epoch": 1.93, "learning_rate": 0.00020520822879345385, "loss": 0.0051, "step": 9484 }, { "epoch": 1.93, "learning_rate": 0.00020519020373875328, "loss": 0.0195, "step": 9485 }, { "epoch": 1.93, "learning_rate": 0.00020517217776227207, "loss": 0.0038, "step": 9486 }, { "epoch": 1.93, "learning_rate": 0.00020515415086431145, "loss": 0.0011, "step": 9487 }, { "epoch": 1.93, "learning_rate": 0.00020513612304517233, "loss": 0.0244, "step": 9488 }, { "epoch": 1.93, "learning_rate": 0.00020511809430515587, "loss": 0.0084, "step": 9489 }, { "epoch": 1.93, "learning_rate": 0.00020510006464456322, "loss": 0.0185, "step": 9490 }, { "epoch": 1.93, "learning_rate": 0.00020508203406369553, "loss": 0.0062, "step": 9491 }, { "epoch": 1.93, "learning_rate": 0.00020506400256285385, "loss": 0.0059, "step": 9492 }, { "epoch": 1.93, "learning_rate": 0.00020504597014233935, "loss": 0.0084, "step": 9493 }, { "epoch": 1.93, "learning_rate": 0.00020502793680245328, "loss": 0.0322, "step": 9494 }, { "epoch": 1.93, "learning_rate": 0.00020500990254349678, "loss": 0.0687, "step": 9495 }, { "epoch": 1.93, "learning_rate": 0.0002049918673657711, "loss": 0.0147, "step": 9496 }, { "epoch": 1.93, "learning_rate": 0.00020497383126957743, "loss": 0.0222, "step": 9497 }, { "epoch": 1.93, "learning_rate": 0.00020495579425521695, "loss": 0.0194, "step": 9498 }, { "epoch": 1.93, "learning_rate": 0.00020493775632299098, "loss": 0.0079, "step": 9499 }, { "epoch": 1.93, "learning_rate": 0.0002049197174732008, "loss": 0.0038, "step": 9500 }, { "epoch": 1.93, "learning_rate": 0.0002049016777061477, "loss": 0.0141, "step": 9501 }, { "epoch": 1.93, "learning_rate": 0.00020488363702213293, "loss": 0.0126, "step": 9502 }, { "epoch": 1.93, "learning_rate": 0.0002048655954214578, "loss": 0.0097, "step": 9503 }, { "epoch": 1.94, "learning_rate": 0.00020484755290442366, "loss": 0.0064, "step": 9504 }, { "epoch": 1.94, "learning_rate": 0.0002048295094713319, "loss": 0.0169, "step": 9505 }, { "epoch": 1.94, "learning_rate": 0.0002048114651224838, "loss": 0.016, "step": 9506 }, { "epoch": 1.94, "learning_rate": 0.00020479341985818076, "loss": 0.009, "step": 9507 }, { "epoch": 1.94, "learning_rate": 0.00020477537367872417, "loss": 0.0313, "step": 9508 }, { "epoch": 1.94, "learning_rate": 0.00020475732658441548, "loss": 0.0244, "step": 9509 }, { "epoch": 1.94, "learning_rate": 0.00020473927857555602, "loss": 0.0066, "step": 9510 }, { "epoch": 1.94, "learning_rate": 0.00020472122965244736, "loss": 0.0198, "step": 9511 }, { "epoch": 1.94, "learning_rate": 0.00020470317981539078, "loss": 0.0032, "step": 9512 }, { "epoch": 1.94, "learning_rate": 0.0002046851290646879, "loss": 0.0507, "step": 9513 }, { "epoch": 1.94, "learning_rate": 0.00020466707740064013, "loss": 0.0077, "step": 9514 }, { "epoch": 1.94, "learning_rate": 0.00020464902482354898, "loss": 0.0061, "step": 9515 }, { "epoch": 1.94, "learning_rate": 0.00020463097133371596, "loss": 0.0199, "step": 9516 }, { "epoch": 1.94, "learning_rate": 0.00020461291693144254, "loss": 0.0164, "step": 9517 }, { "epoch": 1.94, "learning_rate": 0.00020459486161703038, "loss": 0.0244, "step": 9518 }, { "epoch": 1.94, "learning_rate": 0.00020457680539078094, "loss": 0.0071, "step": 9519 }, { "epoch": 1.94, "learning_rate": 0.00020455874825299586, "loss": 0.0047, "step": 9520 }, { "epoch": 1.94, "learning_rate": 0.00020454069020397667, "loss": 0.0065, "step": 9521 }, { "epoch": 1.94, "learning_rate": 0.000204522631244025, "loss": 0.0162, "step": 9522 }, { "epoch": 1.94, "learning_rate": 0.0002045045713734425, "loss": 0.0204, "step": 9523 }, { "epoch": 1.94, "learning_rate": 0.00020448651059253077, "loss": 0.0351, "step": 9524 }, { "epoch": 1.94, "learning_rate": 0.00020446844890159146, "loss": 0.0098, "step": 9525 }, { "epoch": 1.94, "learning_rate": 0.0002044503863009262, "loss": 0.0026, "step": 9526 }, { "epoch": 1.94, "learning_rate": 0.00020443232279083673, "loss": 0.017, "step": 9527 }, { "epoch": 1.94, "learning_rate": 0.00020441425837162478, "loss": 0.0197, "step": 9528 }, { "epoch": 1.94, "learning_rate": 0.0002043961930435919, "loss": 0.0156, "step": 9529 }, { "epoch": 1.94, "learning_rate": 0.00020437812680703995, "loss": 0.0175, "step": 9530 }, { "epoch": 1.94, "learning_rate": 0.00020436005966227065, "loss": 0.0184, "step": 9531 }, { "epoch": 1.94, "learning_rate": 0.0002043419916095857, "loss": 0.0123, "step": 9532 }, { "epoch": 1.94, "learning_rate": 0.00020432392264928698, "loss": 0.0086, "step": 9533 }, { "epoch": 1.94, "learning_rate": 0.00020430585278167617, "loss": 0.0244, "step": 9534 }, { "epoch": 1.94, "learning_rate": 0.00020428778200705513, "loss": 0.0184, "step": 9535 }, { "epoch": 1.94, "learning_rate": 0.00020426971032572563, "loss": 0.0195, "step": 9536 }, { "epoch": 1.94, "learning_rate": 0.00020425163773798955, "loss": 0.0098, "step": 9537 }, { "epoch": 1.94, "learning_rate": 0.00020423356424414873, "loss": 0.012, "step": 9538 }, { "epoch": 1.94, "learning_rate": 0.00020421548984450496, "loss": 0.0054, "step": 9539 }, { "epoch": 1.94, "learning_rate": 0.00020419741453936023, "loss": 0.0143, "step": 9540 }, { "epoch": 1.94, "learning_rate": 0.00020417933832901628, "loss": 0.0319, "step": 9541 }, { "epoch": 1.94, "learning_rate": 0.0002041612612137752, "loss": 0.0161, "step": 9542 }, { "epoch": 1.94, "learning_rate": 0.00020414318319393878, "loss": 0.0053, "step": 9543 }, { "epoch": 1.94, "learning_rate": 0.000204125104269809, "loss": 0.0035, "step": 9544 }, { "epoch": 1.94, "learning_rate": 0.0002041070244416878, "loss": 0.0124, "step": 9545 }, { "epoch": 1.94, "learning_rate": 0.00020408894370987717, "loss": 0.0219, "step": 9546 }, { "epoch": 1.94, "learning_rate": 0.00020407086207467913, "loss": 0.0124, "step": 9547 }, { "epoch": 1.94, "learning_rate": 0.00020405277953639556, "loss": 0.0082, "step": 9548 }, { "epoch": 1.94, "learning_rate": 0.00020403469609532856, "loss": 0.0213, "step": 9549 }, { "epoch": 1.94, "learning_rate": 0.00020401661175178018, "loss": 0.0237, "step": 9550 }, { "epoch": 1.94, "learning_rate": 0.00020399852650605235, "loss": 0.0068, "step": 9551 }, { "epoch": 1.94, "learning_rate": 0.0002039804403584472, "loss": 0.0034, "step": 9552 }, { "epoch": 1.95, "learning_rate": 0.00020396235330926682, "loss": 0.0109, "step": 9553 }, { "epoch": 1.95, "learning_rate": 0.00020394426535881333, "loss": 0.0045, "step": 9554 }, { "epoch": 1.95, "learning_rate": 0.00020392617650738873, "loss": 0.0077, "step": 9555 }, { "epoch": 1.95, "learning_rate": 0.0002039080867552952, "loss": 0.0167, "step": 9556 }, { "epoch": 1.95, "learning_rate": 0.00020388999610283486, "loss": 0.0081, "step": 9557 }, { "epoch": 1.95, "learning_rate": 0.00020387190455030984, "loss": 0.0089, "step": 9558 }, { "epoch": 1.95, "learning_rate": 0.00020385381209802236, "loss": 0.0095, "step": 9559 }, { "epoch": 1.95, "learning_rate": 0.00020383571874627455, "loss": 0.024, "step": 9560 }, { "epoch": 1.95, "learning_rate": 0.00020381762449536857, "loss": 0.0247, "step": 9561 }, { "epoch": 1.95, "learning_rate": 0.00020379952934560671, "loss": 0.0124, "step": 9562 }, { "epoch": 1.95, "learning_rate": 0.0002037814332972912, "loss": 0.0145, "step": 9563 }, { "epoch": 1.95, "learning_rate": 0.0002037633363507242, "loss": 0.0063, "step": 9564 }, { "epoch": 1.95, "learning_rate": 0.000203745238506208, "loss": 0.0302, "step": 9565 }, { "epoch": 1.95, "learning_rate": 0.00020372713976404486, "loss": 0.0126, "step": 9566 }, { "epoch": 1.95, "learning_rate": 0.00020370904012453705, "loss": 0.0084, "step": 9567 }, { "epoch": 1.95, "learning_rate": 0.0002036909395879869, "loss": 0.013, "step": 9568 }, { "epoch": 1.95, "learning_rate": 0.0002036728381546967, "loss": 0.0172, "step": 9569 }, { "epoch": 1.95, "learning_rate": 0.00020365473582496885, "loss": 0.0094, "step": 9570 }, { "epoch": 1.95, "learning_rate": 0.00020363663259910555, "loss": 0.006, "step": 9571 }, { "epoch": 1.95, "learning_rate": 0.00020361852847740927, "loss": 0.0159, "step": 9572 }, { "epoch": 1.95, "learning_rate": 0.00020360042346018233, "loss": 0.008, "step": 9573 }, { "epoch": 1.95, "learning_rate": 0.00020358231754772716, "loss": 0.0079, "step": 9574 }, { "epoch": 1.95, "learning_rate": 0.00020356421074034617, "loss": 0.0102, "step": 9575 }, { "epoch": 1.95, "learning_rate": 0.0002035461030383417, "loss": 0.0068, "step": 9576 }, { "epoch": 1.95, "learning_rate": 0.0002035279944420163, "loss": 0.0145, "step": 9577 }, { "epoch": 1.95, "learning_rate": 0.0002035098849516723, "loss": 0.0216, "step": 9578 }, { "epoch": 1.95, "learning_rate": 0.00020349177456761223, "loss": 0.0075, "step": 9579 }, { "epoch": 1.95, "learning_rate": 0.00020347366329013855, "loss": 0.0074, "step": 9580 }, { "epoch": 1.95, "learning_rate": 0.00020345555111955378, "loss": 0.0151, "step": 9581 }, { "epoch": 1.95, "learning_rate": 0.00020343743805616035, "loss": 0.0288, "step": 9582 }, { "epoch": 1.95, "learning_rate": 0.00020341932410026086, "loss": 0.0057, "step": 9583 }, { "epoch": 1.95, "learning_rate": 0.00020340120925215784, "loss": 0.0297, "step": 9584 }, { "epoch": 1.95, "learning_rate": 0.00020338309351215376, "loss": 0.0082, "step": 9585 }, { "epoch": 1.95, "learning_rate": 0.00020336497688055132, "loss": 0.0067, "step": 9586 }, { "epoch": 1.95, "learning_rate": 0.000203346859357653, "loss": 0.0029, "step": 9587 }, { "epoch": 1.95, "learning_rate": 0.00020332874094376147, "loss": 0.0224, "step": 9588 }, { "epoch": 1.95, "learning_rate": 0.00020331062163917924, "loss": 0.0174, "step": 9589 }, { "epoch": 1.95, "learning_rate": 0.00020329250144420904, "loss": 0.0184, "step": 9590 }, { "epoch": 1.95, "learning_rate": 0.00020327438035915344, "loss": 0.0177, "step": 9591 }, { "epoch": 1.95, "learning_rate": 0.00020325625838431516, "loss": 0.005, "step": 9592 }, { "epoch": 1.95, "learning_rate": 0.0002032381355199968, "loss": 0.0019, "step": 9593 }, { "epoch": 1.95, "learning_rate": 0.0002032200117665011, "loss": 0.0098, "step": 9594 }, { "epoch": 1.95, "learning_rate": 0.00020320188712413074, "loss": 0.0123, "step": 9595 }, { "epoch": 1.95, "learning_rate": 0.00020318376159318845, "loss": 0.0292, "step": 9596 }, { "epoch": 1.95, "learning_rate": 0.00020316563517397694, "loss": 0.0083, "step": 9597 }, { "epoch": 1.95, "learning_rate": 0.00020314750786679897, "loss": 0.014, "step": 9598 }, { "epoch": 1.95, "learning_rate": 0.00020312937967195734, "loss": 0.0035, "step": 9599 }, { "epoch": 1.95, "learning_rate": 0.0002031112505897547, "loss": 0.0118, "step": 9600 }, { "epoch": 1.95, "learning_rate": 0.00020309312062049396, "loss": 0.0102, "step": 9601 }, { "epoch": 1.96, "learning_rate": 0.00020307498976447787, "loss": 0.0058, "step": 9602 }, { "epoch": 1.96, "learning_rate": 0.00020305685802200928, "loss": 0.0073, "step": 9603 }, { "epoch": 1.96, "learning_rate": 0.00020303872539339097, "loss": 0.0073, "step": 9604 }, { "epoch": 1.96, "learning_rate": 0.00020302059187892588, "loss": 0.0139, "step": 9605 }, { "epoch": 1.96, "learning_rate": 0.00020300245747891681, "loss": 0.0117, "step": 9606 }, { "epoch": 1.96, "learning_rate": 0.00020298432219366665, "loss": 0.0066, "step": 9607 }, { "epoch": 1.96, "learning_rate": 0.0002029661860234783, "loss": 0.0162, "step": 9608 }, { "epoch": 1.96, "learning_rate": 0.00020294804896865467, "loss": 0.0183, "step": 9609 }, { "epoch": 1.96, "learning_rate": 0.00020292991102949866, "loss": 0.0089, "step": 9610 }, { "epoch": 1.96, "learning_rate": 0.00020291177220631317, "loss": 0.0087, "step": 9611 }, { "epoch": 1.96, "learning_rate": 0.0002028936324994013, "loss": 0.0029, "step": 9612 }, { "epoch": 1.96, "learning_rate": 0.00020287549190906587, "loss": 0.0109, "step": 9613 }, { "epoch": 1.96, "learning_rate": 0.0002028573504356099, "loss": 0.0081, "step": 9614 }, { "epoch": 1.96, "learning_rate": 0.00020283920807933644, "loss": 0.01, "step": 9615 }, { "epoch": 1.96, "learning_rate": 0.00020282106484054846, "loss": 0.0183, "step": 9616 }, { "epoch": 1.96, "learning_rate": 0.00020280292071954897, "loss": 0.0066, "step": 9617 }, { "epoch": 1.96, "learning_rate": 0.00020278477571664106, "loss": 0.022, "step": 9618 }, { "epoch": 1.96, "learning_rate": 0.00020276662983212773, "loss": 0.0156, "step": 9619 }, { "epoch": 1.96, "learning_rate": 0.0002027484830663121, "loss": 0.0205, "step": 9620 }, { "epoch": 1.96, "learning_rate": 0.00020273033541949725, "loss": 0.0044, "step": 9621 }, { "epoch": 1.96, "learning_rate": 0.00020271218689198623, "loss": 0.0068, "step": 9622 }, { "epoch": 1.96, "learning_rate": 0.00020269403748408217, "loss": 0.0241, "step": 9623 }, { "epoch": 1.96, "learning_rate": 0.00020267588719608825, "loss": 0.0028, "step": 9624 }, { "epoch": 1.96, "learning_rate": 0.0002026577360283076, "loss": 0.0208, "step": 9625 }, { "epoch": 1.96, "learning_rate": 0.0002026395839810433, "loss": 0.0189, "step": 9626 }, { "epoch": 1.96, "learning_rate": 0.00020262143105459861, "loss": 0.0172, "step": 9627 }, { "epoch": 1.96, "learning_rate": 0.00020260327724927672, "loss": 0.0077, "step": 9628 }, { "epoch": 1.96, "learning_rate": 0.00020258512256538078, "loss": 0.008, "step": 9629 }, { "epoch": 1.96, "learning_rate": 0.00020256696700321402, "loss": 0.0132, "step": 9630 }, { "epoch": 1.96, "learning_rate": 0.0002025488105630797, "loss": 0.0145, "step": 9631 }, { "epoch": 1.96, "learning_rate": 0.00020253065324528106, "loss": 0.0108, "step": 9632 }, { "epoch": 1.96, "learning_rate": 0.00020251249505012133, "loss": 0.0099, "step": 9633 }, { "epoch": 1.96, "learning_rate": 0.0002024943359779038, "loss": 0.0027, "step": 9634 }, { "epoch": 1.96, "learning_rate": 0.0002024761760289318, "loss": 0.0409, "step": 9635 }, { "epoch": 1.96, "learning_rate": 0.00020245801520350857, "loss": 0.0276, "step": 9636 }, { "epoch": 1.96, "learning_rate": 0.00020243985350193748, "loss": 0.0085, "step": 9637 }, { "epoch": 1.96, "learning_rate": 0.00020242169092452188, "loss": 0.0164, "step": 9638 }, { "epoch": 1.96, "learning_rate": 0.00020240352747156505, "loss": 0.0227, "step": 9639 }, { "epoch": 1.96, "learning_rate": 0.0002023853631433704, "loss": 0.0368, "step": 9640 }, { "epoch": 1.96, "learning_rate": 0.00020236719794024133, "loss": 0.0156, "step": 9641 }, { "epoch": 1.96, "learning_rate": 0.00020234903186248118, "loss": 0.0094, "step": 9642 }, { "epoch": 1.96, "learning_rate": 0.00020233086491039338, "loss": 0.0178, "step": 9643 }, { "epoch": 1.96, "learning_rate": 0.00020231269708428137, "loss": 0.0045, "step": 9644 }, { "epoch": 1.96, "learning_rate": 0.00020229452838444855, "loss": 0.0259, "step": 9645 }, { "epoch": 1.96, "learning_rate": 0.00020227635881119838, "loss": 0.0041, "step": 9646 }, { "epoch": 1.96, "learning_rate": 0.00020225818836483436, "loss": 0.0102, "step": 9647 }, { "epoch": 1.96, "learning_rate": 0.00020224001704565993, "loss": 0.0217, "step": 9648 }, { "epoch": 1.96, "learning_rate": 0.00020222184485397867, "loss": 0.0421, "step": 9649 }, { "epoch": 1.96, "learning_rate": 0.00020220367179009401, "loss": 0.0068, "step": 9650 }, { "epoch": 1.97, "learning_rate": 0.00020218549785430944, "loss": 0.0203, "step": 9651 }, { "epoch": 1.97, "learning_rate": 0.00020216732304692854, "loss": 0.0095, "step": 9652 }, { "epoch": 1.97, "learning_rate": 0.00020214914736825496, "loss": 0.0195, "step": 9653 }, { "epoch": 1.97, "learning_rate": 0.0002021309708185921, "loss": 0.0103, "step": 9654 }, { "epoch": 1.97, "learning_rate": 0.00020211279339824362, "loss": 0.0076, "step": 9655 }, { "epoch": 1.97, "learning_rate": 0.00020209461510751312, "loss": 0.0262, "step": 9656 }, { "epoch": 1.97, "learning_rate": 0.00020207643594670425, "loss": 0.0369, "step": 9657 }, { "epoch": 1.97, "learning_rate": 0.00020205825591612062, "loss": 0.0092, "step": 9658 }, { "epoch": 1.97, "learning_rate": 0.0002020400750160658, "loss": 0.0077, "step": 9659 }, { "epoch": 1.97, "learning_rate": 0.00020202189324684353, "loss": 0.0394, "step": 9660 }, { "epoch": 1.97, "learning_rate": 0.0002020037106087574, "loss": 0.0051, "step": 9661 }, { "epoch": 1.97, "learning_rate": 0.0002019855271021112, "loss": 0.0269, "step": 9662 }, { "epoch": 1.97, "learning_rate": 0.00020196734272720854, "loss": 0.0149, "step": 9663 }, { "epoch": 1.97, "learning_rate": 0.00020194915748435313, "loss": 0.0123, "step": 9664 }, { "epoch": 1.97, "learning_rate": 0.00020193097137384875, "loss": 0.0247, "step": 9665 }, { "epoch": 1.97, "learning_rate": 0.00020191278439599908, "loss": 0.02, "step": 9666 }, { "epoch": 1.97, "learning_rate": 0.000201894596551108, "loss": 0.0102, "step": 9667 }, { "epoch": 1.97, "learning_rate": 0.00020187640783947915, "loss": 0.0078, "step": 9668 }, { "epoch": 1.97, "learning_rate": 0.0002018582182614164, "loss": 0.0066, "step": 9669 }, { "epoch": 1.97, "learning_rate": 0.0002018400278172235, "loss": 0.0128, "step": 9670 }, { "epoch": 1.97, "learning_rate": 0.00020182183650720425, "loss": 0.0122, "step": 9671 }, { "epoch": 1.97, "learning_rate": 0.0002018036443316626, "loss": 0.005, "step": 9672 }, { "epoch": 1.97, "learning_rate": 0.0002017854512909022, "loss": 0.0137, "step": 9673 }, { "epoch": 1.97, "learning_rate": 0.00020176725738522706, "loss": 0.0125, "step": 9674 }, { "epoch": 1.97, "learning_rate": 0.00020174906261494096, "loss": 0.0117, "step": 9675 }, { "epoch": 1.97, "learning_rate": 0.00020173086698034787, "loss": 0.0222, "step": 9676 }, { "epoch": 1.97, "learning_rate": 0.00020171267048175166, "loss": 0.008, "step": 9677 }, { "epoch": 1.97, "learning_rate": 0.0002016944731194562, "loss": 0.0152, "step": 9678 }, { "epoch": 1.97, "learning_rate": 0.00020167627489376546, "loss": 0.0232, "step": 9679 }, { "epoch": 1.97, "learning_rate": 0.00020165807580498342, "loss": 0.0057, "step": 9680 }, { "epoch": 1.97, "learning_rate": 0.000201639875853414, "loss": 0.0119, "step": 9681 }, { "epoch": 1.97, "learning_rate": 0.0002016216750393612, "loss": 0.0191, "step": 9682 }, { "epoch": 1.97, "learning_rate": 0.00020160347336312896, "loss": 0.0115, "step": 9683 }, { "epoch": 1.97, "learning_rate": 0.00020158527082502127, "loss": 0.0142, "step": 9684 }, { "epoch": 1.97, "learning_rate": 0.00020156706742534218, "loss": 0.011, "step": 9685 }, { "epoch": 1.97, "learning_rate": 0.00020154886316439577, "loss": 0.0284, "step": 9686 }, { "epoch": 1.97, "learning_rate": 0.000201530658042486, "loss": 0.0028, "step": 9687 }, { "epoch": 1.97, "learning_rate": 0.00020151245205991702, "loss": 0.0164, "step": 9688 }, { "epoch": 1.97, "learning_rate": 0.00020149424521699282, "loss": 0.0163, "step": 9689 }, { "epoch": 1.97, "learning_rate": 0.00020147603751401755, "loss": 0.0186, "step": 9690 }, { "epoch": 1.97, "learning_rate": 0.00020145782895129524, "loss": 0.0276, "step": 9691 }, { "epoch": 1.97, "learning_rate": 0.00020143961952913007, "loss": 0.0079, "step": 9692 }, { "epoch": 1.97, "learning_rate": 0.00020142140924782616, "loss": 0.0094, "step": 9693 }, { "epoch": 1.97, "learning_rate": 0.00020140319810768765, "loss": 0.0419, "step": 9694 }, { "epoch": 1.97, "learning_rate": 0.00020138498610901872, "loss": 0.0107, "step": 9695 }, { "epoch": 1.97, "learning_rate": 0.0002013667732521235, "loss": 0.011, "step": 9696 }, { "epoch": 1.97, "learning_rate": 0.0002013485595373062, "loss": 0.0311, "step": 9697 }, { "epoch": 1.97, "learning_rate": 0.00020133034496487107, "loss": 0.0276, "step": 9698 }, { "epoch": 1.97, "learning_rate": 0.00020131212953512228, "loss": 0.037, "step": 9699 }, { "epoch": 1.98, "learning_rate": 0.00020129391324836402, "loss": 0.0109, "step": 9700 }, { "epoch": 1.98, "learning_rate": 0.0002012756961049006, "loss": 0.018, "step": 9701 }, { "epoch": 1.98, "learning_rate": 0.00020125747810503626, "loss": 0.0219, "step": 9702 }, { "epoch": 1.98, "learning_rate": 0.00020123925924907533, "loss": 0.0042, "step": 9703 }, { "epoch": 1.98, "learning_rate": 0.00020122103953732203, "loss": 0.0091, "step": 9704 }, { "epoch": 1.98, "learning_rate": 0.00020120281897008068, "loss": 0.0025, "step": 9705 }, { "epoch": 1.98, "learning_rate": 0.0002011845975476556, "loss": 0.0161, "step": 9706 }, { "epoch": 1.98, "learning_rate": 0.00020116637527035105, "loss": 0.0139, "step": 9707 }, { "epoch": 1.98, "learning_rate": 0.00020114815213847153, "loss": 0.0063, "step": 9708 }, { "epoch": 1.98, "learning_rate": 0.00020112992815232134, "loss": 0.0163, "step": 9709 }, { "epoch": 1.98, "learning_rate": 0.00020111170331220477, "loss": 0.0057, "step": 9710 }, { "epoch": 1.98, "learning_rate": 0.00020109347761842632, "loss": 0.0175, "step": 9711 }, { "epoch": 1.98, "learning_rate": 0.0002010752510712903, "loss": 0.0088, "step": 9712 }, { "epoch": 1.98, "learning_rate": 0.00020105702367110125, "loss": 0.0031, "step": 9713 }, { "epoch": 1.98, "learning_rate": 0.00020103879541816347, "loss": 0.0188, "step": 9714 }, { "epoch": 1.98, "learning_rate": 0.0002010205663127815, "loss": 0.0035, "step": 9715 }, { "epoch": 1.98, "learning_rate": 0.00020100233635525976, "loss": 0.0254, "step": 9716 }, { "epoch": 1.98, "learning_rate": 0.00020098410554590266, "loss": 0.0187, "step": 9717 }, { "epoch": 1.98, "learning_rate": 0.0002009658738850148, "loss": 0.0065, "step": 9718 }, { "epoch": 1.98, "learning_rate": 0.00020094764137290066, "loss": 0.0037, "step": 9719 }, { "epoch": 1.98, "learning_rate": 0.00020092940800986475, "loss": 0.0102, "step": 9720 }, { "epoch": 1.98, "learning_rate": 0.00020091117379621157, "loss": 0.0173, "step": 9721 }, { "epoch": 1.98, "learning_rate": 0.00020089293873224568, "loss": 0.0031, "step": 9722 }, { "epoch": 1.98, "learning_rate": 0.00020087470281827168, "loss": 0.0068, "step": 9723 }, { "epoch": 1.98, "learning_rate": 0.00020085646605459408, "loss": 0.0107, "step": 9724 }, { "epoch": 1.98, "learning_rate": 0.0002008382284415175, "loss": 0.0144, "step": 9725 }, { "epoch": 1.98, "learning_rate": 0.00020081998997934655, "loss": 0.004, "step": 9726 }, { "epoch": 1.98, "learning_rate": 0.0002008017506683858, "loss": 0.0054, "step": 9727 }, { "epoch": 1.98, "learning_rate": 0.00020078351050893995, "loss": 0.0096, "step": 9728 }, { "epoch": 1.98, "learning_rate": 0.00020076526950131362, "loss": 0.0105, "step": 9729 }, { "epoch": 1.98, "learning_rate": 0.00020074702764581148, "loss": 0.0131, "step": 9730 }, { "epoch": 1.98, "learning_rate": 0.00020072878494273812, "loss": 0.0079, "step": 9731 }, { "epoch": 1.98, "learning_rate": 0.00020071054139239838, "loss": 0.0106, "step": 9732 }, { "epoch": 1.98, "learning_rate": 0.00020069229699509682, "loss": 0.0112, "step": 9733 }, { "epoch": 1.98, "learning_rate": 0.00020067405175113823, "loss": 0.0132, "step": 9734 }, { "epoch": 1.98, "learning_rate": 0.00020065580566082733, "loss": 0.0353, "step": 9735 }, { "epoch": 1.98, "learning_rate": 0.00020063755872446888, "loss": 0.0087, "step": 9736 }, { "epoch": 1.98, "learning_rate": 0.00020061931094236756, "loss": 0.0069, "step": 9737 }, { "epoch": 1.98, "learning_rate": 0.00020060106231482817, "loss": 0.0077, "step": 9738 }, { "epoch": 1.98, "learning_rate": 0.00020058281284215558, "loss": 0.025, "step": 9739 }, { "epoch": 1.98, "learning_rate": 0.0002005645625246545, "loss": 0.0127, "step": 9740 }, { "epoch": 1.98, "learning_rate": 0.00020054631136262984, "loss": 0.0153, "step": 9741 }, { "epoch": 1.98, "learning_rate": 0.00020052805935638632, "loss": 0.0079, "step": 9742 }, { "epoch": 1.98, "learning_rate": 0.0002005098065062288, "loss": 0.0204, "step": 9743 }, { "epoch": 1.98, "learning_rate": 0.00020049155281246222, "loss": 0.0316, "step": 9744 }, { "epoch": 1.98, "learning_rate": 0.00020047329827539137, "loss": 0.0145, "step": 9745 }, { "epoch": 1.98, "learning_rate": 0.0002004550428953212, "loss": 0.0213, "step": 9746 }, { "epoch": 1.98, "learning_rate": 0.00020043678667255657, "loss": 0.0149, "step": 9747 }, { "epoch": 1.98, "learning_rate": 0.00020041852960740234, "loss": 0.0098, "step": 9748 }, { "epoch": 1.99, "learning_rate": 0.0002004002717001635, "loss": 0.0058, "step": 9749 }, { "epoch": 1.99, "learning_rate": 0.00020038201295114507, "loss": 0.026, "step": 9750 }, { "epoch": 1.99, "learning_rate": 0.00020036375336065184, "loss": 0.0121, "step": 9751 }, { "epoch": 1.99, "learning_rate": 0.00020034549292898888, "loss": 0.0124, "step": 9752 }, { "epoch": 1.99, "learning_rate": 0.00020032723165646117, "loss": 0.006, "step": 9753 }, { "epoch": 1.99, "learning_rate": 0.00020030896954337368, "loss": 0.0072, "step": 9754 }, { "epoch": 1.99, "learning_rate": 0.00020029070659003146, "loss": 0.021, "step": 9755 }, { "epoch": 1.99, "learning_rate": 0.00020027244279673947, "loss": 0.0237, "step": 9756 }, { "epoch": 1.99, "learning_rate": 0.00020025417816380277, "loss": 0.0062, "step": 9757 }, { "epoch": 1.99, "learning_rate": 0.0002002359126915265, "loss": 0.0049, "step": 9758 }, { "epoch": 1.99, "learning_rate": 0.0002002176463802156, "loss": 0.012, "step": 9759 }, { "epoch": 1.99, "learning_rate": 0.00020019937923017523, "loss": 0.0056, "step": 9760 }, { "epoch": 1.99, "learning_rate": 0.0002001811112417105, "loss": 0.0031, "step": 9761 }, { "epoch": 1.99, "learning_rate": 0.00020016284241512647, "loss": 0.0134, "step": 9762 }, { "epoch": 1.99, "learning_rate": 0.00020014457275072825, "loss": 0.0213, "step": 9763 }, { "epoch": 1.99, "learning_rate": 0.0002001263022488211, "loss": 0.012, "step": 9764 }, { "epoch": 1.99, "learning_rate": 0.00020010803090971002, "loss": 0.0096, "step": 9765 }, { "epoch": 1.99, "learning_rate": 0.00020008975873370022, "loss": 0.0093, "step": 9766 }, { "epoch": 1.99, "learning_rate": 0.00020007148572109696, "loss": 0.0056, "step": 9767 }, { "epoch": 1.99, "learning_rate": 0.0002000532118722053, "loss": 0.0138, "step": 9768 }, { "epoch": 1.99, "learning_rate": 0.00020003493718733054, "loss": 0.0024, "step": 9769 }, { "epoch": 1.99, "learning_rate": 0.0002000166616667779, "loss": 0.0075, "step": 9770 }, { "epoch": 1.99, "learning_rate": 0.0001999983853108526, "loss": 0.0123, "step": 9771 }, { "epoch": 1.99, "learning_rate": 0.00019998010811985987, "loss": 0.0101, "step": 9772 }, { "epoch": 1.99, "learning_rate": 0.00019996183009410496, "loss": 0.0151, "step": 9773 }, { "epoch": 1.99, "learning_rate": 0.00019994355123389325, "loss": 0.0087, "step": 9774 }, { "epoch": 1.99, "learning_rate": 0.00019992527153952995, "loss": 0.0143, "step": 9775 }, { "epoch": 1.99, "learning_rate": 0.00019990699101132034, "loss": 0.0031, "step": 9776 }, { "epoch": 1.99, "learning_rate": 0.00019988870964956977, "loss": 0.0146, "step": 9777 }, { "epoch": 1.99, "learning_rate": 0.0001998704274545836, "loss": 0.0063, "step": 9778 }, { "epoch": 1.99, "learning_rate": 0.00019985214442666712, "loss": 0.0152, "step": 9779 }, { "epoch": 1.99, "learning_rate": 0.00019983386056612575, "loss": 0.0177, "step": 9780 }, { "epoch": 1.99, "learning_rate": 0.00019981557587326484, "loss": 0.0098, "step": 9781 }, { "epoch": 1.99, "learning_rate": 0.00019979729034838977, "loss": 0.0115, "step": 9782 }, { "epoch": 1.99, "learning_rate": 0.00019977900399180596, "loss": 0.0222, "step": 9783 }, { "epoch": 1.99, "learning_rate": 0.00019976071680381885, "loss": 0.039, "step": 9784 }, { "epoch": 1.99, "learning_rate": 0.0001997424287847338, "loss": 0.0082, "step": 9785 }, { "epoch": 1.99, "learning_rate": 0.0001997241399348563, "loss": 0.0129, "step": 9786 }, { "epoch": 1.99, "learning_rate": 0.00019970585025449184, "loss": 0.0095, "step": 9787 }, { "epoch": 1.99, "learning_rate": 0.00019968755974394582, "loss": 0.0121, "step": 9788 }, { "epoch": 1.99, "learning_rate": 0.00019966926840352377, "loss": 0.011, "step": 9789 }, { "epoch": 1.99, "learning_rate": 0.00019965097623353116, "loss": 0.0057, "step": 9790 }, { "epoch": 1.99, "learning_rate": 0.00019963268323427348, "loss": 0.002, "step": 9791 }, { "epoch": 1.99, "learning_rate": 0.0001996143894060564, "loss": 0.0188, "step": 9792 }, { "epoch": 1.99, "learning_rate": 0.00019959609474918532, "loss": 0.0131, "step": 9793 }, { "epoch": 1.99, "learning_rate": 0.00019957779926396585, "loss": 0.0183, "step": 9794 }, { "epoch": 1.99, "learning_rate": 0.00019955950295070352, "loss": 0.0088, "step": 9795 }, { "epoch": 1.99, "learning_rate": 0.00019954120580970393, "loss": 0.0145, "step": 9796 }, { "epoch": 1.99, "learning_rate": 0.00019952290784127277, "loss": 0.0298, "step": 9797 }, { "epoch": 2.0, "learning_rate": 0.00019950460904571548, "loss": 0.0147, "step": 9798 }, { "epoch": 2.0, "learning_rate": 0.00019948630942333783, "loss": 0.0079, "step": 9799 }, { "epoch": 2.0, "learning_rate": 0.00019946800897444538, "loss": 0.0376, "step": 9800 }, { "epoch": 2.0, "learning_rate": 0.0001994497076993438, "loss": 0.0064, "step": 9801 }, { "epoch": 2.0, "learning_rate": 0.0001994314055983387, "loss": 0.0053, "step": 9802 }, { "epoch": 2.0, "learning_rate": 0.0001994131026717359, "loss": 0.0106, "step": 9803 }, { "epoch": 2.0, "learning_rate": 0.000199394798919841, "loss": 0.0244, "step": 9804 }, { "epoch": 2.0, "learning_rate": 0.00019937649434295968, "loss": 0.0287, "step": 9805 }, { "epoch": 2.0, "learning_rate": 0.00019935818894139775, "loss": 0.0154, "step": 9806 }, { "epoch": 2.0, "learning_rate": 0.00019933988271546088, "loss": 0.0176, "step": 9807 }, { "epoch": 2.0, "learning_rate": 0.00019932157566545478, "loss": 0.0351, "step": 9808 }, { "epoch": 2.0, "learning_rate": 0.00019930326779168532, "loss": 0.0028, "step": 9809 }, { "epoch": 2.0, "learning_rate": 0.0001992849590944582, "loss": 0.0198, "step": 9810 }, { "epoch": 2.0, "learning_rate": 0.00019926664957407926, "loss": 0.0134, "step": 9811 }, { "epoch": 2.0, "learning_rate": 0.00019924833923085422, "loss": 0.0288, "step": 9812 }, { "epoch": 2.0, "learning_rate": 0.00019923002806508902, "loss": 0.0131, "step": 9813 }, { "epoch": 2.0, "learning_rate": 0.00019921171607708936, "loss": 0.0186, "step": 9814 }, { "epoch": 2.0, "learning_rate": 0.00019919340326716122, "loss": 0.0079, "step": 9815 }, { "epoch": 2.0, "learning_rate": 0.00019917508963561033, "loss": 0.0016, "step": 9816 }, { "epoch": 2.0, "learning_rate": 0.0001991567751827426, "loss": 0.0175, "step": 9817 }, { "epoch": 2.0, "learning_rate": 0.00019913845990886397, "loss": 0.0288, "step": 9818 }, { "epoch": 2.0, "learning_rate": 0.0001991201438142803, "loss": 0.0212, "step": 9819 }, { "epoch": 2.0, "learning_rate": 0.00019910182689929755, "loss": 0.0134, "step": 9820 }, { "epoch": 2.0, "learning_rate": 0.00019908350916422152, "loss": 0.009, "step": 9821 }, { "epoch": 2.0, "learning_rate": 0.00019906519060935827, "loss": 0.0085, "step": 9822 }, { "epoch": 2.0, "learning_rate": 0.00019904687123501374, "loss": 0.0039, "step": 9823 }, { "epoch": 2.0, "learning_rate": 0.00019902855104149387, "loss": 0.0086, "step": 9824 }, { "epoch": 2.0, "learning_rate": 0.00019901023002910466, "loss": 0.0097, "step": 9825 }, { "epoch": 2.0, "learning_rate": 0.00019899190819815208, "loss": 0.0089, "step": 9826 }, { "epoch": 2.0, "learning_rate": 0.00019897358554894215, "loss": 0.0078, "step": 9827 }, { "epoch": 2.0, "learning_rate": 0.0001989552620817809, "loss": 0.002, "step": 9828 }, { "epoch": 2.0, "learning_rate": 0.00019893693779697436, "loss": 0.0072, "step": 9829 }, { "epoch": 2.0, "learning_rate": 0.00019891861269482862, "loss": 0.0067, "step": 9830 }, { "epoch": 2.0, "learning_rate": 0.00019890028677564965, "loss": 0.0045, "step": 9831 }, { "epoch": 2.0, "learning_rate": 0.00019888196003974357, "loss": 0.0165, "step": 9832 }, { "epoch": 2.0, "learning_rate": 0.00019886363248741652, "loss": 0.0012, "step": 9833 }, { "epoch": 2.0, "learning_rate": 0.00019884530411897464, "loss": 0.0041, "step": 9834 }, { "epoch": 2.0, "learning_rate": 0.0001988269749347239, "loss": 0.0078, "step": 9835 }, { "epoch": 2.0, "learning_rate": 0.00019880864493497053, "loss": 0.0035, "step": 9836 }, { "epoch": 2.0, "learning_rate": 0.00019879031412002067, "loss": 0.0158, "step": 9837 }, { "epoch": 2.0, "learning_rate": 0.00019877198249018045, "loss": 0.0042, "step": 9838 }, { "epoch": 2.0, "learning_rate": 0.00019875365004575605, "loss": 0.0062, "step": 9839 }, { "epoch": 2.0, "learning_rate": 0.0001987353167870537, "loss": 0.0082, "step": 9840 }, { "epoch": 2.0, "learning_rate": 0.00019871698271437953, "loss": 0.0045, "step": 9841 }, { "epoch": 2.0, "learning_rate": 0.00019869864782803978, "loss": 0.0111, "step": 9842 }, { "epoch": 2.0, "learning_rate": 0.0001986803121283407, "loss": 0.0063, "step": 9843 }, { "epoch": 2.0, "learning_rate": 0.00019866197561558855, "loss": 0.0165, "step": 9844 }, { "epoch": 2.0, "learning_rate": 0.00019864363829008949, "loss": 0.0057, "step": 9845 }, { "epoch": 2.0, "learning_rate": 0.0001986253001521499, "loss": 0.0038, "step": 9846 }, { "epoch": 2.01, "learning_rate": 0.00019860696120207596, "loss": 0.017, "step": 9847 }, { "epoch": 2.01, "learning_rate": 0.0001985886214401741, "loss": 0.0101, "step": 9848 }, { "epoch": 2.01, "learning_rate": 0.00019857028086675048, "loss": 0.0106, "step": 9849 }, { "epoch": 2.01, "learning_rate": 0.0001985519394821115, "loss": 0.0072, "step": 9850 }, { "epoch": 2.01, "learning_rate": 0.00019853359728656348, "loss": 0.0027, "step": 9851 }, { "epoch": 2.01, "learning_rate": 0.00019851525428041277, "loss": 0.012, "step": 9852 }, { "epoch": 2.01, "learning_rate": 0.00019849691046396574, "loss": 0.0011, "step": 9853 }, { "epoch": 2.01, "learning_rate": 0.00019847856583752875, "loss": 0.0117, "step": 9854 }, { "epoch": 2.01, "learning_rate": 0.0001984602204014082, "loss": 0.0113, "step": 9855 }, { "epoch": 2.01, "learning_rate": 0.00019844187415591052, "loss": 0.0139, "step": 9856 }, { "epoch": 2.01, "learning_rate": 0.0001984235271013421, "loss": 0.0052, "step": 9857 }, { "epoch": 2.01, "learning_rate": 0.00019840517923800936, "loss": 0.0075, "step": 9858 }, { "epoch": 2.01, "learning_rate": 0.00019838683056621877, "loss": 0.0054, "step": 9859 }, { "epoch": 2.01, "learning_rate": 0.00019836848108627673, "loss": 0.0034, "step": 9860 }, { "epoch": 2.01, "learning_rate": 0.0001983501307984898, "loss": 0.009, "step": 9861 }, { "epoch": 2.01, "learning_rate": 0.00019833177970316436, "loss": 0.0023, "step": 9862 }, { "epoch": 2.01, "learning_rate": 0.00019831342780060702, "loss": 0.0029, "step": 9863 }, { "epoch": 2.01, "learning_rate": 0.0001982950750911242, "loss": 0.0044, "step": 9864 }, { "epoch": 2.01, "learning_rate": 0.0001982767215750225, "loss": 0.0031, "step": 9865 }, { "epoch": 2.01, "learning_rate": 0.0001982583672526084, "loss": 0.003, "step": 9866 }, { "epoch": 2.01, "learning_rate": 0.00019824001212418848, "loss": 0.0031, "step": 9867 }, { "epoch": 2.01, "learning_rate": 0.0001982216561900693, "loss": 0.0038, "step": 9868 }, { "epoch": 2.01, "learning_rate": 0.00019820329945055744, "loss": 0.0102, "step": 9869 }, { "epoch": 2.01, "learning_rate": 0.00019818494190595946, "loss": 0.023, "step": 9870 }, { "epoch": 2.01, "learning_rate": 0.00019816658355658204, "loss": 0.0148, "step": 9871 }, { "epoch": 2.01, "learning_rate": 0.00019814822440273174, "loss": 0.0264, "step": 9872 }, { "epoch": 2.01, "learning_rate": 0.00019812986444471518, "loss": 0.0011, "step": 9873 }, { "epoch": 2.01, "learning_rate": 0.00019811150368283904, "loss": 0.0085, "step": 9874 }, { "epoch": 2.01, "learning_rate": 0.00019809314211741, "loss": 0.0027, "step": 9875 }, { "epoch": 2.01, "learning_rate": 0.0001980747797487347, "loss": 0.013, "step": 9876 }, { "epoch": 2.01, "learning_rate": 0.00019805641657711978, "loss": 0.0059, "step": 9877 }, { "epoch": 2.01, "learning_rate": 0.00019803805260287203, "loss": 0.0047, "step": 9878 }, { "epoch": 2.01, "learning_rate": 0.0001980196878262981, "loss": 0.0078, "step": 9879 }, { "epoch": 2.01, "learning_rate": 0.00019800132224770482, "loss": 0.0253, "step": 9880 }, { "epoch": 2.01, "learning_rate": 0.00019798295586739877, "loss": 0.0147, "step": 9881 }, { "epoch": 2.01, "learning_rate": 0.00019796458868568678, "loss": 0.008, "step": 9882 }, { "epoch": 2.01, "learning_rate": 0.00019794622070287566, "loss": 0.0111, "step": 9883 }, { "epoch": 2.01, "learning_rate": 0.0001979278519192721, "loss": 0.0021, "step": 9884 }, { "epoch": 2.01, "learning_rate": 0.000197909482335183, "loss": 0.0203, "step": 9885 }, { "epoch": 2.01, "learning_rate": 0.00019789111195091504, "loss": 0.0133, "step": 9886 }, { "epoch": 2.01, "learning_rate": 0.00019787274076677518, "loss": 0.0052, "step": 9887 }, { "epoch": 2.01, "learning_rate": 0.00019785436878307016, "loss": 0.0102, "step": 9888 }, { "epoch": 2.01, "learning_rate": 0.00019783599600010687, "loss": 0.0162, "step": 9889 }, { "epoch": 2.01, "learning_rate": 0.00019781762241819208, "loss": 0.016, "step": 9890 }, { "epoch": 2.01, "learning_rate": 0.0001977992480376328, "loss": 0.0041, "step": 9891 }, { "epoch": 2.01, "learning_rate": 0.0001977808728587358, "loss": 0.0078, "step": 9892 }, { "epoch": 2.01, "learning_rate": 0.00019776249688180806, "loss": 0.0182, "step": 9893 }, { "epoch": 2.01, "learning_rate": 0.00019774412010715648, "loss": 0.0017, "step": 9894 }, { "epoch": 2.01, "learning_rate": 0.00019772574253508794, "loss": 0.0012, "step": 9895 }, { "epoch": 2.02, "learning_rate": 0.00019770736416590943, "loss": 0.0057, "step": 9896 }, { "epoch": 2.02, "learning_rate": 0.00019768898499992788, "loss": 0.017, "step": 9897 }, { "epoch": 2.02, "learning_rate": 0.00019767060503745026, "loss": 0.0088, "step": 9898 }, { "epoch": 2.02, "learning_rate": 0.00019765222427878354, "loss": 0.0078, "step": 9899 }, { "epoch": 2.02, "learning_rate": 0.00019763384272423475, "loss": 0.0124, "step": 9900 }, { "epoch": 2.02, "learning_rate": 0.00019761546037411087, "loss": 0.0108, "step": 9901 }, { "epoch": 2.02, "learning_rate": 0.00019759707722871888, "loss": 0.0008, "step": 9902 }, { "epoch": 2.02, "learning_rate": 0.0001975786932883659, "loss": 0.0176, "step": 9903 }, { "epoch": 2.02, "learning_rate": 0.00019756030855335891, "loss": 0.0072, "step": 9904 }, { "epoch": 2.02, "learning_rate": 0.000197541923024005, "loss": 0.0095, "step": 9905 }, { "epoch": 2.02, "learning_rate": 0.00019752353670061119, "loss": 0.0041, "step": 9906 }, { "epoch": 2.02, "learning_rate": 0.00019750514958348465, "loss": 0.0046, "step": 9907 }, { "epoch": 2.02, "learning_rate": 0.0001974867616729325, "loss": 0.005, "step": 9908 }, { "epoch": 2.02, "learning_rate": 0.0001974683729692617, "loss": 0.0081, "step": 9909 }, { "epoch": 2.02, "learning_rate": 0.0001974499834727795, "loss": 0.0061, "step": 9910 }, { "epoch": 2.02, "learning_rate": 0.000197431593183793, "loss": 0.013, "step": 9911 }, { "epoch": 2.02, "learning_rate": 0.0001974132021026094, "loss": 0.0035, "step": 9912 }, { "epoch": 2.02, "learning_rate": 0.0001973948102295358, "loss": 0.0112, "step": 9913 }, { "epoch": 2.02, "learning_rate": 0.00019737641756487938, "loss": 0.0081, "step": 9914 }, { "epoch": 2.02, "learning_rate": 0.00019735802410894733, "loss": 0.0059, "step": 9915 }, { "epoch": 2.02, "learning_rate": 0.00019733962986204692, "loss": 0.0088, "step": 9916 }, { "epoch": 2.02, "learning_rate": 0.00019732123482448535, "loss": 0.0129, "step": 9917 }, { "epoch": 2.02, "learning_rate": 0.00019730283899656984, "loss": 0.0317, "step": 9918 }, { "epoch": 2.02, "learning_rate": 0.0001972844423786076, "loss": 0.0051, "step": 9919 }, { "epoch": 2.02, "learning_rate": 0.00019726604497090594, "loss": 0.013, "step": 9920 }, { "epoch": 2.02, "learning_rate": 0.0001972476467737721, "loss": 0.0602, "step": 9921 }, { "epoch": 2.02, "learning_rate": 0.00019722924778751337, "loss": 0.001, "step": 9922 }, { "epoch": 2.02, "learning_rate": 0.00019721084801243706, "loss": 0.0298, "step": 9923 }, { "epoch": 2.02, "learning_rate": 0.00019719244744885044, "loss": 0.0096, "step": 9924 }, { "epoch": 2.02, "learning_rate": 0.00019717404609706087, "loss": 0.0073, "step": 9925 }, { "epoch": 2.02, "learning_rate": 0.0001971556439573757, "loss": 0.0022, "step": 9926 }, { "epoch": 2.02, "learning_rate": 0.00019713724103010227, "loss": 0.0071, "step": 9927 }, { "epoch": 2.02, "learning_rate": 0.00019711883731554793, "loss": 0.0049, "step": 9928 }, { "epoch": 2.02, "learning_rate": 0.00019710043281402005, "loss": 0.01, "step": 9929 }, { "epoch": 2.02, "learning_rate": 0.00019708202752582605, "loss": 0.005, "step": 9930 }, { "epoch": 2.02, "learning_rate": 0.00019706362145127332, "loss": 0.0197, "step": 9931 }, { "epoch": 2.02, "learning_rate": 0.00019704521459066926, "loss": 0.0041, "step": 9932 }, { "epoch": 2.02, "learning_rate": 0.00019702680694432133, "loss": 0.0047, "step": 9933 }, { "epoch": 2.02, "learning_rate": 0.00019700839851253697, "loss": 0.0188, "step": 9934 }, { "epoch": 2.02, "learning_rate": 0.00019698998929562356, "loss": 0.0192, "step": 9935 }, { "epoch": 2.02, "learning_rate": 0.00019697157929388868, "loss": 0.0171, "step": 9936 }, { "epoch": 2.02, "learning_rate": 0.00019695316850763974, "loss": 0.0113, "step": 9937 }, { "epoch": 2.02, "learning_rate": 0.00019693475693718425, "loss": 0.0098, "step": 9938 }, { "epoch": 2.02, "learning_rate": 0.00019691634458282971, "loss": 0.0079, "step": 9939 }, { "epoch": 2.02, "learning_rate": 0.00019689793144488367, "loss": 0.004, "step": 9940 }, { "epoch": 2.02, "learning_rate": 0.00019687951752365366, "loss": 0.0074, "step": 9941 }, { "epoch": 2.02, "learning_rate": 0.00019686110281944724, "loss": 0.0124, "step": 9942 }, { "epoch": 2.02, "learning_rate": 0.0001968426873325719, "loss": 0.0134, "step": 9943 }, { "epoch": 2.02, "learning_rate": 0.00019682427106333528, "loss": 0.0115, "step": 9944 }, { "epoch": 2.02, "learning_rate": 0.00019680585401204493, "loss": 0.0105, "step": 9945 }, { "epoch": 2.03, "learning_rate": 0.0001967874361790085, "loss": 0.0121, "step": 9946 }, { "epoch": 2.03, "learning_rate": 0.00019676901756453353, "loss": 0.0102, "step": 9947 }, { "epoch": 2.03, "learning_rate": 0.00019675059816892768, "loss": 0.0068, "step": 9948 }, { "epoch": 2.03, "learning_rate": 0.00019673217799249864, "loss": 0.0233, "step": 9949 }, { "epoch": 2.03, "learning_rate": 0.000196713757035554, "loss": 0.0109, "step": 9950 }, { "epoch": 2.03, "learning_rate": 0.00019669533529840142, "loss": 0.0137, "step": 9951 }, { "epoch": 2.03, "learning_rate": 0.0001966769127813486, "loss": 0.0105, "step": 9952 }, { "epoch": 2.03, "learning_rate": 0.00019665848948470323, "loss": 0.0047, "step": 9953 }, { "epoch": 2.03, "learning_rate": 0.00019664006540877303, "loss": 0.0183, "step": 9954 }, { "epoch": 2.03, "learning_rate": 0.00019662164055386566, "loss": 0.0144, "step": 9955 }, { "epoch": 2.03, "learning_rate": 0.00019660321492028892, "loss": 0.0052, "step": 9956 }, { "epoch": 2.03, "learning_rate": 0.0001965847885083505, "loss": 0.0153, "step": 9957 }, { "epoch": 2.03, "learning_rate": 0.00019656636131835817, "loss": 0.0035, "step": 9958 }, { "epoch": 2.03, "learning_rate": 0.00019654793335061976, "loss": 0.0147, "step": 9959 }, { "epoch": 2.03, "learning_rate": 0.00019652950460544294, "loss": 0.0127, "step": 9960 }, { "epoch": 2.03, "learning_rate": 0.00019651107508313558, "loss": 0.0108, "step": 9961 }, { "epoch": 2.03, "learning_rate": 0.00019649264478400547, "loss": 0.0083, "step": 9962 }, { "epoch": 2.03, "learning_rate": 0.00019647421370836047, "loss": 0.005, "step": 9963 }, { "epoch": 2.03, "learning_rate": 0.00019645578185650833, "loss": 0.0064, "step": 9964 }, { "epoch": 2.03, "learning_rate": 0.00019643734922875696, "loss": 0.0143, "step": 9965 }, { "epoch": 2.03, "learning_rate": 0.00019641891582541416, "loss": 0.0145, "step": 9966 }, { "epoch": 2.03, "learning_rate": 0.00019640048164678789, "loss": 0.0053, "step": 9967 }, { "epoch": 2.03, "learning_rate": 0.00019638204669318596, "loss": 0.0039, "step": 9968 }, { "epoch": 2.03, "learning_rate": 0.00019636361096491632, "loss": 0.0064, "step": 9969 }, { "epoch": 2.03, "learning_rate": 0.00019634517446228683, "loss": 0.0117, "step": 9970 }, { "epoch": 2.03, "learning_rate": 0.00019632673718560548, "loss": 0.0021, "step": 9971 }, { "epoch": 2.03, "learning_rate": 0.00019630829913518016, "loss": 0.0129, "step": 9972 }, { "epoch": 2.03, "learning_rate": 0.00019628986031131884, "loss": 0.0098, "step": 9973 }, { "epoch": 2.03, "learning_rate": 0.00019627142071432945, "loss": 0.0033, "step": 9974 }, { "epoch": 2.03, "learning_rate": 0.00019625298034452, "loss": 0.0128, "step": 9975 }, { "epoch": 2.03, "learning_rate": 0.00019623453920219848, "loss": 0.002, "step": 9976 }, { "epoch": 2.03, "learning_rate": 0.00019621609728767285, "loss": 0.0115, "step": 9977 }, { "epoch": 2.03, "learning_rate": 0.00019619765460125122, "loss": 0.0107, "step": 9978 }, { "epoch": 2.03, "learning_rate": 0.00019617921114324147, "loss": 0.009, "step": 9979 }, { "epoch": 2.03, "learning_rate": 0.00019616076691395177, "loss": 0.0069, "step": 9980 }, { "epoch": 2.03, "learning_rate": 0.00019614232191369016, "loss": 0.0019, "step": 9981 }, { "epoch": 2.03, "learning_rate": 0.00019612387614276465, "loss": 0.0094, "step": 9982 }, { "epoch": 2.03, "learning_rate": 0.00019610542960148331, "loss": 0.0095, "step": 9983 }, { "epoch": 2.03, "learning_rate": 0.0001960869822901543, "loss": 0.0035, "step": 9984 }, { "epoch": 2.03, "learning_rate": 0.00019606853420908567, "loss": 0.0044, "step": 9985 }, { "epoch": 2.03, "learning_rate": 0.00019605008535858562, "loss": 0.008, "step": 9986 }, { "epoch": 2.03, "learning_rate": 0.00019603163573896212, "loss": 0.0052, "step": 9987 }, { "epoch": 2.03, "learning_rate": 0.00019601318535052346, "loss": 0.0095, "step": 9988 }, { "epoch": 2.03, "learning_rate": 0.00019599473419357774, "loss": 0.0075, "step": 9989 }, { "epoch": 2.03, "learning_rate": 0.00019597628226843312, "loss": 0.0049, "step": 9990 }, { "epoch": 2.03, "learning_rate": 0.00019595782957539787, "loss": 0.0191, "step": 9991 }, { "epoch": 2.03, "learning_rate": 0.00019593937611478006, "loss": 0.0029, "step": 9992 }, { "epoch": 2.03, "learning_rate": 0.00019592092188688796, "loss": 0.0217, "step": 9993 }, { "epoch": 2.03, "learning_rate": 0.00019590246689202978, "loss": 0.0037, "step": 9994 }, { "epoch": 2.04, "learning_rate": 0.00019588401113051376, "loss": 0.0087, "step": 9995 }, { "epoch": 2.04, "learning_rate": 0.00019586555460264816, "loss": 0.005, "step": 9996 }, { "epoch": 2.04, "learning_rate": 0.0001958470973087412, "loss": 0.0023, "step": 9997 }, { "epoch": 2.04, "learning_rate": 0.00019582863924910113, "loss": 0.0078, "step": 9998 }, { "epoch": 2.04, "learning_rate": 0.00019581018042403634, "loss": 0.0008, "step": 9999 }, { "epoch": 2.04, "learning_rate": 0.00019579172083385507, "loss": 0.0017, "step": 10000 }, { "epoch": 2.04, "learning_rate": 0.0001957732604788656, "loss": 0.0075, "step": 10001 }, { "epoch": 2.04, "learning_rate": 0.00019575479935937627, "loss": 0.0053, "step": 10002 }, { "epoch": 2.04, "learning_rate": 0.00019573633747569543, "loss": 0.0061, "step": 10003 }, { "epoch": 2.04, "learning_rate": 0.0001957178748281314, "loss": 0.0016, "step": 10004 }, { "epoch": 2.04, "learning_rate": 0.00019569941141699262, "loss": 0.0044, "step": 10005 }, { "epoch": 2.04, "learning_rate": 0.00019568094724258737, "loss": 0.0056, "step": 10006 }, { "epoch": 2.04, "learning_rate": 0.00019566248230522406, "loss": 0.0089, "step": 10007 }, { "epoch": 2.04, "learning_rate": 0.00019564401660521113, "loss": 0.0122, "step": 10008 }, { "epoch": 2.04, "learning_rate": 0.00019562555014285691, "loss": 0.0118, "step": 10009 }, { "epoch": 2.04, "learning_rate": 0.00019560708291846993, "loss": 0.0094, "step": 10010 }, { "epoch": 2.04, "learning_rate": 0.00019558861493235854, "loss": 0.0094, "step": 10011 }, { "epoch": 2.04, "learning_rate": 0.00019557014618483128, "loss": 0.0201, "step": 10012 }, { "epoch": 2.04, "learning_rate": 0.00019555167667619652, "loss": 0.0176, "step": 10013 }, { "epoch": 2.04, "learning_rate": 0.00019553320640676276, "loss": 0.0116, "step": 10014 }, { "epoch": 2.04, "learning_rate": 0.00019551473537683854, "loss": 0.0049, "step": 10015 }, { "epoch": 2.04, "learning_rate": 0.00019549626358673233, "loss": 0.0021, "step": 10016 }, { "epoch": 2.04, "learning_rate": 0.0001954777910367526, "loss": 0.0081, "step": 10017 }, { "epoch": 2.04, "learning_rate": 0.00019545931772720792, "loss": 0.0046, "step": 10018 }, { "epoch": 2.04, "learning_rate": 0.00019544084365840682, "loss": 0.0228, "step": 10019 }, { "epoch": 2.04, "learning_rate": 0.00019542236883065788, "loss": 0.0279, "step": 10020 }, { "epoch": 2.04, "learning_rate": 0.00019540389324426962, "loss": 0.0058, "step": 10021 }, { "epoch": 2.04, "learning_rate": 0.00019538541689955062, "loss": 0.0031, "step": 10022 }, { "epoch": 2.04, "learning_rate": 0.00019536693979680953, "loss": 0.0085, "step": 10023 }, { "epoch": 2.04, "learning_rate": 0.00019534846193635486, "loss": 0.0039, "step": 10024 }, { "epoch": 2.04, "learning_rate": 0.00019532998331849534, "loss": 0.0067, "step": 10025 }, { "epoch": 2.04, "learning_rate": 0.0001953115039435395, "loss": 0.0239, "step": 10026 }, { "epoch": 2.04, "learning_rate": 0.000195293023811796, "loss": 0.0246, "step": 10027 }, { "epoch": 2.04, "learning_rate": 0.00019527454292357353, "loss": 0.0015, "step": 10028 }, { "epoch": 2.04, "learning_rate": 0.0001952560612791807, "loss": 0.0019, "step": 10029 }, { "epoch": 2.04, "learning_rate": 0.0001952375788789262, "loss": 0.0039, "step": 10030 }, { "epoch": 2.04, "learning_rate": 0.00019521909572311878, "loss": 0.0141, "step": 10031 }, { "epoch": 2.04, "learning_rate": 0.0001952006118120671, "loss": 0.0063, "step": 10032 }, { "epoch": 2.04, "learning_rate": 0.00019518212714607992, "loss": 0.0087, "step": 10033 }, { "epoch": 2.04, "learning_rate": 0.00019516364172546586, "loss": 0.0031, "step": 10034 }, { "epoch": 2.04, "learning_rate": 0.00019514515555053377, "loss": 0.0055, "step": 10035 }, { "epoch": 2.04, "learning_rate": 0.00019512666862159234, "loss": 0.0199, "step": 10036 }, { "epoch": 2.04, "learning_rate": 0.00019510818093895042, "loss": 0.0089, "step": 10037 }, { "epoch": 2.04, "learning_rate": 0.00019508969250291668, "loss": 0.0018, "step": 10038 }, { "epoch": 2.04, "learning_rate": 0.00019507120331379996, "loss": 0.0048, "step": 10039 }, { "epoch": 2.04, "learning_rate": 0.00019505271337190905, "loss": 0.0018, "step": 10040 }, { "epoch": 2.04, "learning_rate": 0.00019503422267755282, "loss": 0.004, "step": 10041 }, { "epoch": 2.04, "learning_rate": 0.00019501573123104006, "loss": 0.0058, "step": 10042 }, { "epoch": 2.04, "learning_rate": 0.0001949972390326796, "loss": 0.0059, "step": 10043 }, { "epoch": 2.05, "learning_rate": 0.00019497874608278033, "loss": 0.0204, "step": 10044 }, { "epoch": 2.05, "learning_rate": 0.00019496025238165108, "loss": 0.0083, "step": 10045 }, { "epoch": 2.05, "learning_rate": 0.00019494175792960077, "loss": 0.025, "step": 10046 }, { "epoch": 2.05, "learning_rate": 0.00019492326272693824, "loss": 0.0053, "step": 10047 }, { "epoch": 2.05, "learning_rate": 0.00019490476677397244, "loss": 0.017, "step": 10048 }, { "epoch": 2.05, "learning_rate": 0.00019488627007101226, "loss": 0.0316, "step": 10049 }, { "epoch": 2.05, "learning_rate": 0.00019486777261836668, "loss": 0.0043, "step": 10050 }, { "epoch": 2.05, "learning_rate": 0.00019484927441634455, "loss": 0.006, "step": 10051 }, { "epoch": 2.05, "learning_rate": 0.0001948307754652549, "loss": 0.0116, "step": 10052 }, { "epoch": 2.05, "learning_rate": 0.00019481227576540668, "loss": 0.0103, "step": 10053 }, { "epoch": 2.05, "learning_rate": 0.00019479377531710884, "loss": 0.0027, "step": 10054 }, { "epoch": 2.05, "learning_rate": 0.00019477527412067042, "loss": 0.0059, "step": 10055 }, { "epoch": 2.05, "learning_rate": 0.0001947567721764004, "loss": 0.0078, "step": 10056 }, { "epoch": 2.05, "learning_rate": 0.0001947382694846078, "loss": 0.0104, "step": 10057 }, { "epoch": 2.05, "learning_rate": 0.00019471976604560167, "loss": 0.0038, "step": 10058 }, { "epoch": 2.05, "learning_rate": 0.000194701261859691, "loss": 0.0396, "step": 10059 }, { "epoch": 2.05, "learning_rate": 0.0001946827569271849, "loss": 0.0086, "step": 10060 }, { "epoch": 2.05, "learning_rate": 0.0001946642512483924, "loss": 0.0021, "step": 10061 }, { "epoch": 2.05, "learning_rate": 0.0001946457448236226, "loss": 0.0071, "step": 10062 }, { "epoch": 2.05, "learning_rate": 0.00019462723765318457, "loss": 0.0046, "step": 10063 }, { "epoch": 2.05, "learning_rate": 0.00019460872973738744, "loss": 0.0066, "step": 10064 }, { "epoch": 2.05, "learning_rate": 0.00019459022107654037, "loss": 0.0093, "step": 10065 }, { "epoch": 2.05, "learning_rate": 0.00019457171167095238, "loss": 0.023, "step": 10066 }, { "epoch": 2.05, "learning_rate": 0.0001945532015209327, "loss": 0.0035, "step": 10067 }, { "epoch": 2.05, "learning_rate": 0.00019453469062679043, "loss": 0.0048, "step": 10068 }, { "epoch": 2.05, "learning_rate": 0.00019451617898883476, "loss": 0.0019, "step": 10069 }, { "epoch": 2.05, "learning_rate": 0.0001944976666073749, "loss": 0.0021, "step": 10070 }, { "epoch": 2.05, "learning_rate": 0.00019447915348271997, "loss": 0.0101, "step": 10071 }, { "epoch": 2.05, "learning_rate": 0.00019446063961517924, "loss": 0.0047, "step": 10072 }, { "epoch": 2.05, "learning_rate": 0.0001944421250050619, "loss": 0.0067, "step": 10073 }, { "epoch": 2.05, "learning_rate": 0.0001944236096526772, "loss": 0.0093, "step": 10074 }, { "epoch": 2.05, "learning_rate": 0.00019440509355833434, "loss": 0.0089, "step": 10075 }, { "epoch": 2.05, "learning_rate": 0.0001943865767223426, "loss": 0.0148, "step": 10076 }, { "epoch": 2.05, "learning_rate": 0.00019436805914501126, "loss": 0.0006, "step": 10077 }, { "epoch": 2.05, "learning_rate": 0.00019434954082664954, "loss": 0.0019, "step": 10078 }, { "epoch": 2.05, "learning_rate": 0.00019433102176756684, "loss": 0.0169, "step": 10079 }, { "epoch": 2.05, "learning_rate": 0.00019431250196807237, "loss": 0.0146, "step": 10080 }, { "epoch": 2.05, "learning_rate": 0.00019429398142847544, "loss": 0.0259, "step": 10081 }, { "epoch": 2.05, "learning_rate": 0.0001942754601490854, "loss": 0.0049, "step": 10082 }, { "epoch": 2.05, "learning_rate": 0.00019425693813021166, "loss": 0.0134, "step": 10083 }, { "epoch": 2.05, "learning_rate": 0.00019423841537216348, "loss": 0.0109, "step": 10084 }, { "epoch": 2.05, "learning_rate": 0.00019421989187525025, "loss": 0.0206, "step": 10085 }, { "epoch": 2.05, "learning_rate": 0.00019420136763978138, "loss": 0.0064, "step": 10086 }, { "epoch": 2.05, "learning_rate": 0.00019418284266606618, "loss": 0.0054, "step": 10087 }, { "epoch": 2.05, "learning_rate": 0.0001941643169544142, "loss": 0.0188, "step": 10088 }, { "epoch": 2.05, "learning_rate": 0.0001941457905051347, "loss": 0.0113, "step": 10089 }, { "epoch": 2.05, "learning_rate": 0.00019412726331853716, "loss": 0.0104, "step": 10090 }, { "epoch": 2.05, "learning_rate": 0.00019410873539493103, "loss": 0.0156, "step": 10091 }, { "epoch": 2.05, "learning_rate": 0.00019409020673462576, "loss": 0.0081, "step": 10092 }, { "epoch": 2.06, "learning_rate": 0.0001940716773379308, "loss": 0.004, "step": 10093 }, { "epoch": 2.06, "learning_rate": 0.0001940531472051557, "loss": 0.0102, "step": 10094 }, { "epoch": 2.06, "learning_rate": 0.0001940346163366098, "loss": 0.0018, "step": 10095 }, { "epoch": 2.06, "learning_rate": 0.00019401608473260275, "loss": 0.001, "step": 10096 }, { "epoch": 2.06, "learning_rate": 0.000193997552393444, "loss": 0.0239, "step": 10097 }, { "epoch": 2.06, "learning_rate": 0.00019397901931944304, "loss": 0.0114, "step": 10098 }, { "epoch": 2.06, "learning_rate": 0.00019396048551090944, "loss": 0.0162, "step": 10099 }, { "epoch": 2.06, "learning_rate": 0.00019394195096815277, "loss": 0.0025, "step": 10100 }, { "epoch": 2.06, "learning_rate": 0.00019392341569148252, "loss": 0.019, "step": 10101 }, { "epoch": 2.06, "learning_rate": 0.0001939048796812084, "loss": 0.0128, "step": 10102 }, { "epoch": 2.06, "learning_rate": 0.00019388634293763987, "loss": 0.0122, "step": 10103 }, { "epoch": 2.06, "learning_rate": 0.00019386780546108655, "loss": 0.0181, "step": 10104 }, { "epoch": 2.06, "learning_rate": 0.00019384926725185807, "loss": 0.0034, "step": 10105 }, { "epoch": 2.06, "learning_rate": 0.00019383072831026413, "loss": 0.0096, "step": 10106 }, { "epoch": 2.06, "learning_rate": 0.00019381218863661422, "loss": 0.0096, "step": 10107 }, { "epoch": 2.06, "learning_rate": 0.00019379364823121813, "loss": 0.0087, "step": 10108 }, { "epoch": 2.06, "learning_rate": 0.0001937751070943854, "loss": 0.0067, "step": 10109 }, { "epoch": 2.06, "learning_rate": 0.00019375656522642573, "loss": 0.0068, "step": 10110 }, { "epoch": 2.06, "learning_rate": 0.00019373802262764888, "loss": 0.0178, "step": 10111 }, { "epoch": 2.06, "learning_rate": 0.00019371947929836442, "loss": 0.0086, "step": 10112 }, { "epoch": 2.06, "learning_rate": 0.00019370093523888213, "loss": 0.0101, "step": 10113 }, { "epoch": 2.06, "learning_rate": 0.00019368239044951176, "loss": 0.0099, "step": 10114 }, { "epoch": 2.06, "learning_rate": 0.00019366384493056305, "loss": 0.0165, "step": 10115 }, { "epoch": 2.06, "learning_rate": 0.00019364529868234567, "loss": 0.0138, "step": 10116 }, { "epoch": 2.06, "learning_rate": 0.00019362675170516943, "loss": 0.0116, "step": 10117 }, { "epoch": 2.06, "learning_rate": 0.0001936082039993441, "loss": 0.01, "step": 10118 }, { "epoch": 2.06, "learning_rate": 0.00019358965556517938, "loss": 0.0075, "step": 10119 }, { "epoch": 2.06, "learning_rate": 0.0001935711064029852, "loss": 0.0129, "step": 10120 }, { "epoch": 2.06, "learning_rate": 0.0001935525565130713, "loss": 0.0076, "step": 10121 }, { "epoch": 2.06, "learning_rate": 0.00019353400589574744, "loss": 0.0093, "step": 10122 }, { "epoch": 2.06, "learning_rate": 0.0001935154545513235, "loss": 0.0049, "step": 10123 }, { "epoch": 2.06, "learning_rate": 0.00019349690248010934, "loss": 0.0012, "step": 10124 }, { "epoch": 2.06, "learning_rate": 0.00019347834968241488, "loss": 0.0016, "step": 10125 }, { "epoch": 2.06, "learning_rate": 0.00019345979615854983, "loss": 0.0102, "step": 10126 }, { "epoch": 2.06, "learning_rate": 0.00019344124190882417, "loss": 0.0007, "step": 10127 }, { "epoch": 2.06, "learning_rate": 0.00019342268693354776, "loss": 0.0076, "step": 10128 }, { "epoch": 2.06, "learning_rate": 0.00019340413123303054, "loss": 0.0103, "step": 10129 }, { "epoch": 2.06, "learning_rate": 0.0001933855748075824, "loss": 0.0014, "step": 10130 }, { "epoch": 2.06, "learning_rate": 0.00019336701765751324, "loss": 0.0053, "step": 10131 }, { "epoch": 2.06, "learning_rate": 0.00019334845978313301, "loss": 0.0093, "step": 10132 }, { "epoch": 2.06, "learning_rate": 0.0001933299011847517, "loss": 0.0112, "step": 10133 }, { "epoch": 2.06, "learning_rate": 0.00019331134186267922, "loss": 0.0046, "step": 10134 }, { "epoch": 2.06, "learning_rate": 0.0001932927818172256, "loss": 0.02, "step": 10135 }, { "epoch": 2.06, "learning_rate": 0.00019327422104870078, "loss": 0.029, "step": 10136 }, { "epoch": 2.06, "learning_rate": 0.0001932556595574148, "loss": 0.0202, "step": 10137 }, { "epoch": 2.06, "learning_rate": 0.00019323709734367765, "loss": 0.0102, "step": 10138 }, { "epoch": 2.06, "learning_rate": 0.00019321853440779942, "loss": 0.012, "step": 10139 }, { "epoch": 2.06, "learning_rate": 0.00019319997075009, "loss": 0.0095, "step": 10140 }, { "epoch": 2.06, "learning_rate": 0.00019318140637085955, "loss": 0.0018, "step": 10141 }, { "epoch": 2.07, "learning_rate": 0.0001931628412704181, "loss": 0.0065, "step": 10142 }, { "epoch": 2.07, "learning_rate": 0.00019314427544907573, "loss": 0.0099, "step": 10143 }, { "epoch": 2.07, "learning_rate": 0.0001931257089071425, "loss": 0.0054, "step": 10144 }, { "epoch": 2.07, "learning_rate": 0.00019310714164492857, "loss": 0.0205, "step": 10145 }, { "epoch": 2.07, "learning_rate": 0.00019308857366274397, "loss": 0.0112, "step": 10146 }, { "epoch": 2.07, "learning_rate": 0.00019307000496089887, "loss": 0.0077, "step": 10147 }, { "epoch": 2.07, "learning_rate": 0.0001930514355397034, "loss": 0.0076, "step": 10148 }, { "epoch": 2.07, "learning_rate": 0.00019303286539946768, "loss": 0.013, "step": 10149 }, { "epoch": 2.07, "learning_rate": 0.00019301429454050186, "loss": 0.0143, "step": 10150 }, { "epoch": 2.07, "learning_rate": 0.0001929957229631161, "loss": 0.0094, "step": 10151 }, { "epoch": 2.07, "learning_rate": 0.00019297715066762068, "loss": 0.0037, "step": 10152 }, { "epoch": 2.07, "learning_rate": 0.00019295857765432565, "loss": 0.007, "step": 10153 }, { "epoch": 2.07, "learning_rate": 0.00019294000392354132, "loss": 0.0053, "step": 10154 }, { "epoch": 2.07, "learning_rate": 0.00019292142947557783, "loss": 0.0096, "step": 10155 }, { "epoch": 2.07, "learning_rate": 0.00019290285431074547, "loss": 0.0117, "step": 10156 }, { "epoch": 2.07, "learning_rate": 0.00019288427842935451, "loss": 0.0118, "step": 10157 }, { "epoch": 2.07, "learning_rate": 0.0001928657018317151, "loss": 0.0038, "step": 10158 }, { "epoch": 2.07, "learning_rate": 0.0001928471245181376, "loss": 0.0266, "step": 10159 }, { "epoch": 2.07, "learning_rate": 0.00019282854648893216, "loss": 0.0088, "step": 10160 }, { "epoch": 2.07, "learning_rate": 0.0001928099677444092, "loss": 0.006, "step": 10161 }, { "epoch": 2.07, "learning_rate": 0.00019279138828487899, "loss": 0.0027, "step": 10162 }, { "epoch": 2.07, "learning_rate": 0.00019277280811065182, "loss": 0.0051, "step": 10163 }, { "epoch": 2.07, "learning_rate": 0.00019275422722203796, "loss": 0.0027, "step": 10164 }, { "epoch": 2.07, "learning_rate": 0.00019273564561934778, "loss": 0.0023, "step": 10165 }, { "epoch": 2.07, "learning_rate": 0.00019271706330289173, "loss": 0.0137, "step": 10166 }, { "epoch": 2.07, "learning_rate": 0.00019269848027298004, "loss": 0.0108, "step": 10167 }, { "epoch": 2.07, "learning_rate": 0.00019267989652992318, "loss": 0.0063, "step": 10168 }, { "epoch": 2.07, "learning_rate": 0.00019266131207403144, "loss": 0.0086, "step": 10169 }, { "epoch": 2.07, "learning_rate": 0.00019264272690561527, "loss": 0.0039, "step": 10170 }, { "epoch": 2.07, "learning_rate": 0.00019262414102498506, "loss": 0.0089, "step": 10171 }, { "epoch": 2.07, "learning_rate": 0.00019260555443245127, "loss": 0.0089, "step": 10172 }, { "epoch": 2.07, "learning_rate": 0.00019258696712832425, "loss": 0.003, "step": 10173 }, { "epoch": 2.07, "learning_rate": 0.00019256837911291454, "loss": 0.0064, "step": 10174 }, { "epoch": 2.07, "learning_rate": 0.0001925497903865325, "loss": 0.0039, "step": 10175 }, { "epoch": 2.07, "learning_rate": 0.00019253120094948865, "loss": 0.0042, "step": 10176 }, { "epoch": 2.07, "learning_rate": 0.0001925126108020935, "loss": 0.0585, "step": 10177 }, { "epoch": 2.07, "learning_rate": 0.00019249401994465745, "loss": 0.0068, "step": 10178 }, { "epoch": 2.07, "learning_rate": 0.00019247542837749103, "loss": 0.0037, "step": 10179 }, { "epoch": 2.07, "learning_rate": 0.00019245683610090485, "loss": 0.0227, "step": 10180 }, { "epoch": 2.07, "learning_rate": 0.00019243824311520935, "loss": 0.0078, "step": 10181 }, { "epoch": 2.07, "learning_rate": 0.00019241964942071508, "loss": 0.0047, "step": 10182 }, { "epoch": 2.07, "learning_rate": 0.0001924010550177326, "loss": 0.0092, "step": 10183 }, { "epoch": 2.07, "learning_rate": 0.0001923824599065724, "loss": 0.0056, "step": 10184 }, { "epoch": 2.07, "learning_rate": 0.00019236386408754517, "loss": 0.0019, "step": 10185 }, { "epoch": 2.07, "learning_rate": 0.00019234526756096144, "loss": 0.0318, "step": 10186 }, { "epoch": 2.07, "learning_rate": 0.0001923266703271318, "loss": 0.0074, "step": 10187 }, { "epoch": 2.07, "learning_rate": 0.00019230807238636687, "loss": 0.0029, "step": 10188 }, { "epoch": 2.07, "learning_rate": 0.00019228947373897727, "loss": 0.0128, "step": 10189 }, { "epoch": 2.07, "learning_rate": 0.00019227087438527363, "loss": 0.0031, "step": 10190 }, { "epoch": 2.08, "learning_rate": 0.0001922522743255666, "loss": 0.0128, "step": 10191 }, { "epoch": 2.08, "learning_rate": 0.00019223367356016686, "loss": 0.0038, "step": 10192 }, { "epoch": 2.08, "learning_rate": 0.000192215072089385, "loss": 0.0172, "step": 10193 }, { "epoch": 2.08, "learning_rate": 0.00019219646991353178, "loss": 0.0099, "step": 10194 }, { "epoch": 2.08, "learning_rate": 0.00019217786703291785, "loss": 0.0029, "step": 10195 }, { "epoch": 2.08, "learning_rate": 0.0001921592634478539, "loss": 0.008, "step": 10196 }, { "epoch": 2.08, "learning_rate": 0.0001921406591586507, "loss": 0.0151, "step": 10197 }, { "epoch": 2.08, "learning_rate": 0.00019212205416561893, "loss": 0.0105, "step": 10198 }, { "epoch": 2.08, "learning_rate": 0.0001921034484690694, "loss": 0.0055, "step": 10199 }, { "epoch": 2.08, "learning_rate": 0.00019208484206931272, "loss": 0.0143, "step": 10200 }, { "epoch": 2.08, "learning_rate": 0.00019206623496665978, "loss": 0.0009, "step": 10201 }, { "epoch": 2.08, "learning_rate": 0.00019204762716142133, "loss": 0.0083, "step": 10202 }, { "epoch": 2.08, "learning_rate": 0.0001920290186539081, "loss": 0.0032, "step": 10203 }, { "epoch": 2.08, "learning_rate": 0.00019201040944443094, "loss": 0.0144, "step": 10204 }, { "epoch": 2.08, "learning_rate": 0.00019199179953330065, "loss": 0.0028, "step": 10205 }, { "epoch": 2.08, "learning_rate": 0.000191973188920828, "loss": 0.0013, "step": 10206 }, { "epoch": 2.08, "learning_rate": 0.00019195457760732388, "loss": 0.0021, "step": 10207 }, { "epoch": 2.08, "learning_rate": 0.00019193596559309914, "loss": 0.0149, "step": 10208 }, { "epoch": 2.08, "learning_rate": 0.00019191735287846462, "loss": 0.023, "step": 10209 }, { "epoch": 2.08, "learning_rate": 0.00019189873946373116, "loss": 0.0063, "step": 10210 }, { "epoch": 2.08, "learning_rate": 0.00019188012534920968, "loss": 0.0163, "step": 10211 }, { "epoch": 2.08, "learning_rate": 0.00019186151053521104, "loss": 0.0012, "step": 10212 }, { "epoch": 2.08, "learning_rate": 0.0001918428950220462, "loss": 0.0127, "step": 10213 }, { "epoch": 2.08, "learning_rate": 0.00019182427881002595, "loss": 0.0096, "step": 10214 }, { "epoch": 2.08, "learning_rate": 0.00019180566189946134, "loss": 0.0136, "step": 10215 }, { "epoch": 2.08, "learning_rate": 0.00019178704429066327, "loss": 0.0088, "step": 10216 }, { "epoch": 2.08, "learning_rate": 0.00019176842598394266, "loss": 0.0047, "step": 10217 }, { "epoch": 2.08, "learning_rate": 0.0001917498069796105, "loss": 0.0073, "step": 10218 }, { "epoch": 2.08, "learning_rate": 0.00019173118727797774, "loss": 0.0011, "step": 10219 }, { "epoch": 2.08, "learning_rate": 0.00019171256687935538, "loss": 0.0053, "step": 10220 }, { "epoch": 2.08, "learning_rate": 0.00019169394578405445, "loss": 0.0057, "step": 10221 }, { "epoch": 2.08, "learning_rate": 0.0001916753239923859, "loss": 0.0093, "step": 10222 }, { "epoch": 2.08, "learning_rate": 0.0001916567015046608, "loss": 0.0069, "step": 10223 }, { "epoch": 2.08, "learning_rate": 0.0001916380783211901, "loss": 0.0355, "step": 10224 }, { "epoch": 2.08, "learning_rate": 0.00019161945444228493, "loss": 0.0062, "step": 10225 }, { "epoch": 2.08, "learning_rate": 0.0001916008298682563, "loss": 0.0207, "step": 10226 }, { "epoch": 2.08, "learning_rate": 0.0001915822045994153, "loss": 0.0122, "step": 10227 }, { "epoch": 2.08, "learning_rate": 0.00019156357863607296, "loss": 0.0064, "step": 10228 }, { "epoch": 2.08, "learning_rate": 0.00019154495197854038, "loss": 0.0067, "step": 10229 }, { "epoch": 2.08, "learning_rate": 0.00019152632462712872, "loss": 0.0032, "step": 10230 }, { "epoch": 2.08, "learning_rate": 0.00019150769658214908, "loss": 0.0061, "step": 10231 }, { "epoch": 2.08, "learning_rate": 0.00019148906784391252, "loss": 0.0076, "step": 10232 }, { "epoch": 2.08, "learning_rate": 0.0001914704384127302, "loss": 0.0018, "step": 10233 }, { "epoch": 2.08, "learning_rate": 0.0001914518082889133, "loss": 0.0192, "step": 10234 }, { "epoch": 2.08, "learning_rate": 0.00019143317747277294, "loss": 0.0071, "step": 10235 }, { "epoch": 2.08, "learning_rate": 0.00019141454596462035, "loss": 0.0047, "step": 10236 }, { "epoch": 2.08, "learning_rate": 0.00019139591376476656, "loss": 0.0155, "step": 10237 }, { "epoch": 2.08, "learning_rate": 0.000191377280873523, "loss": 0.0049, "step": 10238 }, { "epoch": 2.08, "learning_rate": 0.00019135864729120065, "loss": 0.0078, "step": 10239 }, { "epoch": 2.09, "learning_rate": 0.00019134001301811086, "loss": 0.0117, "step": 10240 }, { "epoch": 2.09, "learning_rate": 0.00019132137805456483, "loss": 0.0022, "step": 10241 }, { "epoch": 2.09, "learning_rate": 0.00019130274240087376, "loss": 0.0068, "step": 10242 }, { "epoch": 2.09, "learning_rate": 0.00019128410605734892, "loss": 0.0041, "step": 10243 }, { "epoch": 2.09, "learning_rate": 0.0001912654690243016, "loss": 0.0152, "step": 10244 }, { "epoch": 2.09, "learning_rate": 0.00019124683130204308, "loss": 0.0063, "step": 10245 }, { "epoch": 2.09, "learning_rate": 0.00019122819289088455, "loss": 0.0204, "step": 10246 }, { "epoch": 2.09, "learning_rate": 0.00019120955379113745, "loss": 0.002, "step": 10247 }, { "epoch": 2.09, "learning_rate": 0.0001911909140031129, "loss": 0.0244, "step": 10248 }, { "epoch": 2.09, "learning_rate": 0.0001911722735271224, "loss": 0.0077, "step": 10249 }, { "epoch": 2.09, "learning_rate": 0.0001911536323634773, "loss": 0.0069, "step": 10250 }, { "epoch": 2.09, "learning_rate": 0.00019113499051248877, "loss": 0.0085, "step": 10251 }, { "epoch": 2.09, "learning_rate": 0.00019111634797446824, "loss": 0.0161, "step": 10252 }, { "epoch": 2.09, "learning_rate": 0.0001910977047497271, "loss": 0.0056, "step": 10253 }, { "epoch": 2.09, "learning_rate": 0.00019107906083857672, "loss": 0.018, "step": 10254 }, { "epoch": 2.09, "learning_rate": 0.0001910604162413285, "loss": 0.0025, "step": 10255 }, { "epoch": 2.09, "learning_rate": 0.00019104177095829382, "loss": 0.0123, "step": 10256 }, { "epoch": 2.09, "learning_rate": 0.00019102312498978408, "loss": 0.0046, "step": 10257 }, { "epoch": 2.09, "learning_rate": 0.00019100447833611067, "loss": 0.0063, "step": 10258 }, { "epoch": 2.09, "learning_rate": 0.0001909858309975851, "loss": 0.0041, "step": 10259 }, { "epoch": 2.09, "learning_rate": 0.0001909671829745188, "loss": 0.0083, "step": 10260 }, { "epoch": 2.09, "learning_rate": 0.0001909485342672232, "loss": 0.0067, "step": 10261 }, { "epoch": 2.09, "learning_rate": 0.0001909298848760098, "loss": 0.0089, "step": 10262 }, { "epoch": 2.09, "learning_rate": 0.00019091123480119004, "loss": 0.0136, "step": 10263 }, { "epoch": 2.09, "learning_rate": 0.0001908925840430755, "loss": 0.0045, "step": 10264 }, { "epoch": 2.09, "learning_rate": 0.00019087393260197754, "loss": 0.0056, "step": 10265 }, { "epoch": 2.09, "learning_rate": 0.00019085528047820777, "loss": 0.0043, "step": 10266 }, { "epoch": 2.09, "learning_rate": 0.0001908366276720777, "loss": 0.0166, "step": 10267 }, { "epoch": 2.09, "learning_rate": 0.0001908179741838989, "loss": 0.0056, "step": 10268 }, { "epoch": 2.09, "learning_rate": 0.00019079932001398283, "loss": 0.0074, "step": 10269 }, { "epoch": 2.09, "learning_rate": 0.0001907806651626411, "loss": 0.0041, "step": 10270 }, { "epoch": 2.09, "learning_rate": 0.0001907620096301853, "loss": 0.0244, "step": 10271 }, { "epoch": 2.09, "learning_rate": 0.00019074335341692696, "loss": 0.0375, "step": 10272 }, { "epoch": 2.09, "learning_rate": 0.00019072469652317778, "loss": 0.0141, "step": 10273 }, { "epoch": 2.09, "learning_rate": 0.0001907060389492493, "loss": 0.0035, "step": 10274 }, { "epoch": 2.09, "learning_rate": 0.00019068738069545307, "loss": 0.0059, "step": 10275 }, { "epoch": 2.09, "learning_rate": 0.00019066872176210078, "loss": 0.0107, "step": 10276 }, { "epoch": 2.09, "learning_rate": 0.0001906500621495041, "loss": 0.0074, "step": 10277 }, { "epoch": 2.09, "learning_rate": 0.00019063140185797463, "loss": 0.0065, "step": 10278 }, { "epoch": 2.09, "learning_rate": 0.00019061274088782407, "loss": 0.0134, "step": 10279 }, { "epoch": 2.09, "learning_rate": 0.00019059407923936408, "loss": 0.0018, "step": 10280 }, { "epoch": 2.09, "learning_rate": 0.0001905754169129063, "loss": 0.0137, "step": 10281 }, { "epoch": 2.09, "learning_rate": 0.0001905567539087625, "loss": 0.0018, "step": 10282 }, { "epoch": 2.09, "learning_rate": 0.00019053809022724437, "loss": 0.0075, "step": 10283 }, { "epoch": 2.09, "learning_rate": 0.00019051942586866357, "loss": 0.0085, "step": 10284 }, { "epoch": 2.09, "learning_rate": 0.00019050076083333188, "loss": 0.0143, "step": 10285 }, { "epoch": 2.09, "learning_rate": 0.00019048209512156106, "loss": 0.0224, "step": 10286 }, { "epoch": 2.09, "learning_rate": 0.00019046342873366284, "loss": 0.0119, "step": 10287 }, { "epoch": 2.09, "learning_rate": 0.00019044476166994896, "loss": 0.0061, "step": 10288 }, { "epoch": 2.1, "learning_rate": 0.00019042609393073122, "loss": 0.0056, "step": 10289 }, { "epoch": 2.1, "learning_rate": 0.00019040742551632136, "loss": 0.016, "step": 10290 }, { "epoch": 2.1, "learning_rate": 0.00019038875642703122, "loss": 0.0036, "step": 10291 }, { "epoch": 2.1, "learning_rate": 0.0001903700866631727, "loss": 0.0243, "step": 10292 }, { "epoch": 2.1, "learning_rate": 0.00019035141622505747, "loss": 0.0052, "step": 10293 }, { "epoch": 2.1, "learning_rate": 0.00019033274511299743, "loss": 0.0078, "step": 10294 }, { "epoch": 2.1, "learning_rate": 0.0001903140733273044, "loss": 0.0066, "step": 10295 }, { "epoch": 2.1, "learning_rate": 0.00019029540086829027, "loss": 0.0061, "step": 10296 }, { "epoch": 2.1, "learning_rate": 0.00019027672773626686, "loss": 0.0051, "step": 10297 }, { "epoch": 2.1, "learning_rate": 0.00019025805393154606, "loss": 0.0049, "step": 10298 }, { "epoch": 2.1, "learning_rate": 0.0001902393794544398, "loss": 0.0102, "step": 10299 }, { "epoch": 2.1, "learning_rate": 0.00019022070430525992, "loss": 0.0113, "step": 10300 }, { "epoch": 2.1, "learning_rate": 0.00019020202848431836, "loss": 0.0076, "step": 10301 }, { "epoch": 2.1, "learning_rate": 0.00019018335199192705, "loss": 0.0111, "step": 10302 }, { "epoch": 2.1, "learning_rate": 0.00019016467482839788, "loss": 0.0253, "step": 10303 }, { "epoch": 2.1, "learning_rate": 0.00019014599699404284, "loss": 0.001, "step": 10304 }, { "epoch": 2.1, "learning_rate": 0.0001901273184891739, "loss": 0.004, "step": 10305 }, { "epoch": 2.1, "learning_rate": 0.00019010863931410296, "loss": 0.0116, "step": 10306 }, { "epoch": 2.1, "learning_rate": 0.00019008995946914205, "loss": 0.0141, "step": 10307 }, { "epoch": 2.1, "learning_rate": 0.00019007127895460317, "loss": 0.0184, "step": 10308 }, { "epoch": 2.1, "learning_rate": 0.00019005259777079824, "loss": 0.0119, "step": 10309 }, { "epoch": 2.1, "learning_rate": 0.00019003391591803934, "loss": 0.0037, "step": 10310 }, { "epoch": 2.1, "learning_rate": 0.00019001523339663844, "loss": 0.0187, "step": 10311 }, { "epoch": 2.1, "learning_rate": 0.00018999655020690765, "loss": 0.0081, "step": 10312 }, { "epoch": 2.1, "learning_rate": 0.00018997786634915897, "loss": 0.0083, "step": 10313 }, { "epoch": 2.1, "learning_rate": 0.00018995918182370446, "loss": 0.0095, "step": 10314 }, { "epoch": 2.1, "learning_rate": 0.0001899404966308562, "loss": 0.0098, "step": 10315 }, { "epoch": 2.1, "learning_rate": 0.0001899218107709262, "loss": 0.0076, "step": 10316 }, { "epoch": 2.1, "learning_rate": 0.00018990312424422664, "loss": 0.0191, "step": 10317 }, { "epoch": 2.1, "learning_rate": 0.00018988443705106957, "loss": 0.0144, "step": 10318 }, { "epoch": 2.1, "learning_rate": 0.0001898657491917672, "loss": 0.0093, "step": 10319 }, { "epoch": 2.1, "learning_rate": 0.00018984706066663143, "loss": 0.0148, "step": 10320 }, { "epoch": 2.1, "learning_rate": 0.0001898283714759746, "loss": 0.0095, "step": 10321 }, { "epoch": 2.1, "learning_rate": 0.00018980968162010876, "loss": 0.0058, "step": 10322 }, { "epoch": 2.1, "learning_rate": 0.00018979099109934608, "loss": 0.0272, "step": 10323 }, { "epoch": 2.1, "learning_rate": 0.00018977229991399883, "loss": 0.0076, "step": 10324 }, { "epoch": 2.1, "learning_rate": 0.000189753608064379, "loss": 0.009, "step": 10325 }, { "epoch": 2.1, "learning_rate": 0.0001897349155507989, "loss": 0.0059, "step": 10326 }, { "epoch": 2.1, "learning_rate": 0.0001897162223735707, "loss": 0.0151, "step": 10327 }, { "epoch": 2.1, "learning_rate": 0.00018969752853300662, "loss": 0.0113, "step": 10328 }, { "epoch": 2.1, "learning_rate": 0.00018967883402941891, "loss": 0.0065, "step": 10329 }, { "epoch": 2.1, "learning_rate": 0.00018966013886311976, "loss": 0.0046, "step": 10330 }, { "epoch": 2.1, "learning_rate": 0.00018964144303442137, "loss": 0.0102, "step": 10331 }, { "epoch": 2.1, "learning_rate": 0.0001896227465436361, "loss": 0.0056, "step": 10332 }, { "epoch": 2.1, "learning_rate": 0.0001896040493910762, "loss": 0.0043, "step": 10333 }, { "epoch": 2.1, "learning_rate": 0.00018958535157705386, "loss": 0.022, "step": 10334 }, { "epoch": 2.1, "learning_rate": 0.00018956665310188145, "loss": 0.0155, "step": 10335 }, { "epoch": 2.1, "learning_rate": 0.00018954795396587123, "loss": 0.0062, "step": 10336 }, { "epoch": 2.1, "learning_rate": 0.00018952925416933556, "loss": 0.0031, "step": 10337 }, { "epoch": 2.11, "learning_rate": 0.00018951055371258673, "loss": 0.0344, "step": 10338 }, { "epoch": 2.11, "learning_rate": 0.00018949185259593707, "loss": 0.0102, "step": 10339 }, { "epoch": 2.11, "learning_rate": 0.00018947315081969889, "loss": 0.0071, "step": 10340 }, { "epoch": 2.11, "learning_rate": 0.00018945444838418458, "loss": 0.0069, "step": 10341 }, { "epoch": 2.11, "learning_rate": 0.00018943574528970655, "loss": 0.0144, "step": 10342 }, { "epoch": 2.11, "learning_rate": 0.0001894170415365771, "loss": 0.006, "step": 10343 }, { "epoch": 2.11, "learning_rate": 0.00018939833712510866, "loss": 0.0074, "step": 10344 }, { "epoch": 2.11, "learning_rate": 0.00018937963205561362, "loss": 0.0066, "step": 10345 }, { "epoch": 2.11, "learning_rate": 0.00018936092632840435, "loss": 0.0097, "step": 10346 }, { "epoch": 2.11, "learning_rate": 0.0001893422199437934, "loss": 0.006, "step": 10347 }, { "epoch": 2.11, "learning_rate": 0.00018932351290209306, "loss": 0.0052, "step": 10348 }, { "epoch": 2.11, "learning_rate": 0.00018930480520361584, "loss": 0.0054, "step": 10349 }, { "epoch": 2.11, "learning_rate": 0.00018928609684867417, "loss": 0.0093, "step": 10350 }, { "epoch": 2.11, "learning_rate": 0.0001892673878375805, "loss": 0.0018, "step": 10351 }, { "epoch": 2.11, "learning_rate": 0.00018924867817064734, "loss": 0.0034, "step": 10352 }, { "epoch": 2.11, "learning_rate": 0.00018922996784818721, "loss": 0.0085, "step": 10353 }, { "epoch": 2.11, "learning_rate": 0.00018921125687051252, "loss": 0.0112, "step": 10354 }, { "epoch": 2.11, "learning_rate": 0.00018919254523793586, "loss": 0.0079, "step": 10355 }, { "epoch": 2.11, "learning_rate": 0.00018917383295076972, "loss": 0.0176, "step": 10356 }, { "epoch": 2.11, "learning_rate": 0.00018915512000932657, "loss": 0.02, "step": 10357 }, { "epoch": 2.11, "learning_rate": 0.00018913640641391905, "loss": 0.0117, "step": 10358 }, { "epoch": 2.11, "learning_rate": 0.00018911769216485965, "loss": 0.0123, "step": 10359 }, { "epoch": 2.11, "learning_rate": 0.00018909897726246096, "loss": 0.0069, "step": 10360 }, { "epoch": 2.11, "learning_rate": 0.00018908026170703552, "loss": 0.0091, "step": 10361 }, { "epoch": 2.11, "learning_rate": 0.00018906154549889597, "loss": 0.0069, "step": 10362 }, { "epoch": 2.11, "learning_rate": 0.00018904282863835487, "loss": 0.0125, "step": 10363 }, { "epoch": 2.11, "learning_rate": 0.0001890241111257248, "loss": 0.0521, "step": 10364 }, { "epoch": 2.11, "learning_rate": 0.00018900539296131847, "loss": 0.0075, "step": 10365 }, { "epoch": 2.11, "learning_rate": 0.00018898667414544843, "loss": 0.0062, "step": 10366 }, { "epoch": 2.11, "learning_rate": 0.0001889679546784273, "loss": 0.0049, "step": 10367 }, { "epoch": 2.11, "learning_rate": 0.00018894923456056782, "loss": 0.0096, "step": 10368 }, { "epoch": 2.11, "learning_rate": 0.00018893051379218257, "loss": 0.0149, "step": 10369 }, { "epoch": 2.11, "learning_rate": 0.0001889117923735843, "loss": 0.0024, "step": 10370 }, { "epoch": 2.11, "learning_rate": 0.0001888930703050856, "loss": 0.0177, "step": 10371 }, { "epoch": 2.11, "learning_rate": 0.0001888743475869992, "loss": 0.0161, "step": 10372 }, { "epoch": 2.11, "learning_rate": 0.00018885562421963782, "loss": 0.0013, "step": 10373 }, { "epoch": 2.11, "learning_rate": 0.00018883690020331416, "loss": 0.0155, "step": 10374 }, { "epoch": 2.11, "learning_rate": 0.00018881817553834102, "loss": 0.0089, "step": 10375 }, { "epoch": 2.11, "learning_rate": 0.00018879945022503102, "loss": 0.0067, "step": 10376 }, { "epoch": 2.11, "learning_rate": 0.000188780724263697, "loss": 0.0135, "step": 10377 }, { "epoch": 2.11, "learning_rate": 0.00018876199765465164, "loss": 0.007, "step": 10378 }, { "epoch": 2.11, "learning_rate": 0.0001887432703982078, "loss": 0.0049, "step": 10379 }, { "epoch": 2.11, "learning_rate": 0.0001887245424946782, "loss": 0.0039, "step": 10380 }, { "epoch": 2.11, "learning_rate": 0.00018870581394437558, "loss": 0.0154, "step": 10381 }, { "epoch": 2.11, "learning_rate": 0.00018868708474761286, "loss": 0.0085, "step": 10382 }, { "epoch": 2.11, "learning_rate": 0.00018866835490470276, "loss": 0.0042, "step": 10383 }, { "epoch": 2.11, "learning_rate": 0.0001886496244159582, "loss": 0.0111, "step": 10384 }, { "epoch": 2.11, "learning_rate": 0.0001886308932816919, "loss": 0.0057, "step": 10385 }, { "epoch": 2.11, "learning_rate": 0.00018861216150221677, "loss": 0.0122, "step": 10386 }, { "epoch": 2.11, "learning_rate": 0.00018859342907784566, "loss": 0.0071, "step": 10387 }, { "epoch": 2.12, "learning_rate": 0.00018857469600889145, "loss": 0.0243, "step": 10388 }, { "epoch": 2.12, "learning_rate": 0.00018855596229566706, "loss": 0.0099, "step": 10389 }, { "epoch": 2.12, "learning_rate": 0.00018853722793848524, "loss": 0.007, "step": 10390 }, { "epoch": 2.12, "learning_rate": 0.00018851849293765894, "loss": 0.0115, "step": 10391 }, { "epoch": 2.12, "learning_rate": 0.00018849975729350117, "loss": 0.0111, "step": 10392 }, { "epoch": 2.12, "learning_rate": 0.00018848102100632477, "loss": 0.0239, "step": 10393 }, { "epoch": 2.12, "learning_rate": 0.00018846228407644265, "loss": 0.0033, "step": 10394 }, { "epoch": 2.12, "learning_rate": 0.0001884435465041678, "loss": 0.0059, "step": 10395 }, { "epoch": 2.12, "learning_rate": 0.00018842480828981312, "loss": 0.0012, "step": 10396 }, { "epoch": 2.12, "learning_rate": 0.00018840606943369166, "loss": 0.0064, "step": 10397 }, { "epoch": 2.12, "learning_rate": 0.00018838732993611636, "loss": 0.0055, "step": 10398 }, { "epoch": 2.12, "learning_rate": 0.00018836858979740016, "loss": 0.0129, "step": 10399 }, { "epoch": 2.12, "learning_rate": 0.00018834984901785608, "loss": 0.0296, "step": 10400 }, { "epoch": 2.12, "learning_rate": 0.0001883311075977971, "loss": 0.0181, "step": 10401 }, { "epoch": 2.12, "learning_rate": 0.00018831236553753632, "loss": 0.0011, "step": 10402 }, { "epoch": 2.12, "learning_rate": 0.0001882936228373867, "loss": 0.0038, "step": 10403 }, { "epoch": 2.12, "learning_rate": 0.0001882748794976613, "loss": 0.0334, "step": 10404 }, { "epoch": 2.12, "learning_rate": 0.00018825613551867311, "loss": 0.0026, "step": 10405 }, { "epoch": 2.12, "learning_rate": 0.0001882373909007353, "loss": 0.0058, "step": 10406 }, { "epoch": 2.12, "learning_rate": 0.0001882186456441609, "loss": 0.0099, "step": 10407 }, { "epoch": 2.12, "learning_rate": 0.00018819989974926292, "loss": 0.0099, "step": 10408 }, { "epoch": 2.12, "learning_rate": 0.00018818115321635455, "loss": 0.0036, "step": 10409 }, { "epoch": 2.12, "learning_rate": 0.00018816240604574883, "loss": 0.0056, "step": 10410 }, { "epoch": 2.12, "learning_rate": 0.00018814365823775889, "loss": 0.0139, "step": 10411 }, { "epoch": 2.12, "learning_rate": 0.00018812490979269787, "loss": 0.0089, "step": 10412 }, { "epoch": 2.12, "learning_rate": 0.0001881061607108789, "loss": 0.0123, "step": 10413 }, { "epoch": 2.12, "learning_rate": 0.00018808741099261508, "loss": 0.0127, "step": 10414 }, { "epoch": 2.12, "learning_rate": 0.00018806866063821961, "loss": 0.0235, "step": 10415 }, { "epoch": 2.12, "learning_rate": 0.00018804990964800566, "loss": 0.0093, "step": 10416 }, { "epoch": 2.12, "learning_rate": 0.00018803115802228638, "loss": 0.0086, "step": 10417 }, { "epoch": 2.12, "learning_rate": 0.000188012405761375, "loss": 0.0047, "step": 10418 }, { "epoch": 2.12, "learning_rate": 0.0001879936528655847, "loss": 0.0054, "step": 10419 }, { "epoch": 2.12, "learning_rate": 0.00018797489933522862, "loss": 0.0042, "step": 10420 }, { "epoch": 2.12, "learning_rate": 0.0001879561451706201, "loss": 0.0228, "step": 10421 }, { "epoch": 2.12, "learning_rate": 0.0001879373903720723, "loss": 0.0081, "step": 10422 }, { "epoch": 2.12, "learning_rate": 0.00018791863493989843, "loss": 0.0169, "step": 10423 }, { "epoch": 2.12, "learning_rate": 0.00018789987887441178, "loss": 0.0091, "step": 10424 }, { "epoch": 2.12, "learning_rate": 0.0001878811221759256, "loss": 0.0057, "step": 10425 }, { "epoch": 2.12, "learning_rate": 0.00018786236484475324, "loss": 0.0058, "step": 10426 }, { "epoch": 2.12, "learning_rate": 0.00018784360688120784, "loss": 0.0046, "step": 10427 }, { "epoch": 2.12, "learning_rate": 0.00018782484828560282, "loss": 0.0087, "step": 10428 }, { "epoch": 2.12, "learning_rate": 0.00018780608905825144, "loss": 0.0032, "step": 10429 }, { "epoch": 2.12, "learning_rate": 0.00018778732919946703, "loss": 0.0127, "step": 10430 }, { "epoch": 2.12, "learning_rate": 0.00018776856870956286, "loss": 0.0372, "step": 10431 }, { "epoch": 2.12, "learning_rate": 0.00018774980758885229, "loss": 0.0059, "step": 10432 }, { "epoch": 2.12, "learning_rate": 0.00018773104583764865, "loss": 0.011, "step": 10433 }, { "epoch": 2.12, "learning_rate": 0.00018771228345626536, "loss": 0.0169, "step": 10434 }, { "epoch": 2.12, "learning_rate": 0.00018769352044501573, "loss": 0.0068, "step": 10435 }, { "epoch": 2.12, "learning_rate": 0.0001876747568042132, "loss": 0.0115, "step": 10436 }, { "epoch": 2.13, "learning_rate": 0.00018765599253417104, "loss": 0.0044, "step": 10437 }, { "epoch": 2.13, "learning_rate": 0.00018763722763520278, "loss": 0.004, "step": 10438 }, { "epoch": 2.13, "learning_rate": 0.00018761846210762175, "loss": 0.004, "step": 10439 }, { "epoch": 2.13, "learning_rate": 0.00018759969595174146, "loss": 0.0028, "step": 10440 }, { "epoch": 2.13, "learning_rate": 0.00018758092916787523, "loss": 0.0063, "step": 10441 }, { "epoch": 2.13, "learning_rate": 0.00018756216175633652, "loss": 0.0293, "step": 10442 }, { "epoch": 2.13, "learning_rate": 0.00018754339371743878, "loss": 0.0059, "step": 10443 }, { "epoch": 2.13, "learning_rate": 0.00018752462505149556, "loss": 0.0042, "step": 10444 }, { "epoch": 2.13, "learning_rate": 0.00018750585575882023, "loss": 0.0066, "step": 10445 }, { "epoch": 2.13, "learning_rate": 0.00018748708583972632, "loss": 0.0147, "step": 10446 }, { "epoch": 2.13, "learning_rate": 0.00018746831529452732, "loss": 0.0048, "step": 10447 }, { "epoch": 2.13, "learning_rate": 0.00018744954412353671, "loss": 0.0083, "step": 10448 }, { "epoch": 2.13, "learning_rate": 0.0001874307723270681, "loss": 0.0006, "step": 10449 }, { "epoch": 2.13, "learning_rate": 0.00018741199990543486, "loss": 0.0197, "step": 10450 }, { "epoch": 2.13, "learning_rate": 0.0001873932268589506, "loss": 0.0052, "step": 10451 }, { "epoch": 2.13, "learning_rate": 0.0001873744531879289, "loss": 0.0087, "step": 10452 }, { "epoch": 2.13, "learning_rate": 0.00018735567889268322, "loss": 0.0167, "step": 10453 }, { "epoch": 2.13, "learning_rate": 0.0001873369039735273, "loss": 0.0044, "step": 10454 }, { "epoch": 2.13, "learning_rate": 0.00018731812843077454, "loss": 0.0184, "step": 10455 }, { "epoch": 2.13, "learning_rate": 0.00018729935226473855, "loss": 0.0094, "step": 10456 }, { "epoch": 2.13, "learning_rate": 0.00018728057547573302, "loss": 0.0078, "step": 10457 }, { "epoch": 2.13, "learning_rate": 0.00018726179806407151, "loss": 0.0024, "step": 10458 }, { "epoch": 2.13, "learning_rate": 0.00018724302003006763, "loss": 0.0192, "step": 10459 }, { "epoch": 2.13, "learning_rate": 0.000187224241374035, "loss": 0.002, "step": 10460 }, { "epoch": 2.13, "learning_rate": 0.00018720546209628728, "loss": 0.0061, "step": 10461 }, { "epoch": 2.13, "learning_rate": 0.0001871866821971381, "loss": 0.0185, "step": 10462 }, { "epoch": 2.13, "learning_rate": 0.0001871679016769012, "loss": 0.0105, "step": 10463 }, { "epoch": 2.13, "learning_rate": 0.00018714912053589011, "loss": 0.0065, "step": 10464 }, { "epoch": 2.13, "learning_rate": 0.0001871303387744186, "loss": 0.012, "step": 10465 }, { "epoch": 2.13, "learning_rate": 0.00018711155639280035, "loss": 0.004, "step": 10466 }, { "epoch": 2.13, "learning_rate": 0.00018709277339134907, "loss": 0.0092, "step": 10467 }, { "epoch": 2.13, "learning_rate": 0.00018707398977037845, "loss": 0.0121, "step": 10468 }, { "epoch": 2.13, "learning_rate": 0.0001870552055302022, "loss": 0.0158, "step": 10469 }, { "epoch": 2.13, "learning_rate": 0.00018703642067113407, "loss": 0.0084, "step": 10470 }, { "epoch": 2.13, "learning_rate": 0.0001870176351934878, "loss": 0.0224, "step": 10471 }, { "epoch": 2.13, "learning_rate": 0.00018699884909757718, "loss": 0.0139, "step": 10472 }, { "epoch": 2.13, "learning_rate": 0.00018698006238371593, "loss": 0.014, "step": 10473 }, { "epoch": 2.13, "learning_rate": 0.00018696127505221782, "loss": 0.0163, "step": 10474 }, { "epoch": 2.13, "learning_rate": 0.00018694248710339665, "loss": 0.0077, "step": 10475 }, { "epoch": 2.13, "learning_rate": 0.0001869236985375662, "loss": 0.0111, "step": 10476 }, { "epoch": 2.13, "learning_rate": 0.00018690490935504027, "loss": 0.0074, "step": 10477 }, { "epoch": 2.13, "learning_rate": 0.00018688611955613275, "loss": 0.0088, "step": 10478 }, { "epoch": 2.13, "learning_rate": 0.00018686732914115737, "loss": 0.004, "step": 10479 }, { "epoch": 2.13, "learning_rate": 0.000186848538110428, "loss": 0.0109, "step": 10480 }, { "epoch": 2.13, "learning_rate": 0.00018682974646425852, "loss": 0.0056, "step": 10481 }, { "epoch": 2.13, "learning_rate": 0.0001868109542029627, "loss": 0.0022, "step": 10482 }, { "epoch": 2.13, "learning_rate": 0.00018679216132685451, "loss": 0.0141, "step": 10483 }, { "epoch": 2.13, "learning_rate": 0.00018677336783624776, "loss": 0.0074, "step": 10484 }, { "epoch": 2.13, "learning_rate": 0.0001867545737314563, "loss": 0.005, "step": 10485 }, { "epoch": 2.14, "learning_rate": 0.00018673577901279415, "loss": 0.0014, "step": 10486 }, { "epoch": 2.14, "learning_rate": 0.0001867169836805751, "loss": 0.0071, "step": 10487 }, { "epoch": 2.14, "learning_rate": 0.00018669818773511313, "loss": 0.0195, "step": 10488 }, { "epoch": 2.14, "learning_rate": 0.00018667939117672215, "loss": 0.0078, "step": 10489 }, { "epoch": 2.14, "learning_rate": 0.00018666059400571612, "loss": 0.0117, "step": 10490 }, { "epoch": 2.14, "learning_rate": 0.000186641796222409, "loss": 0.0094, "step": 10491 }, { "epoch": 2.14, "learning_rate": 0.00018662299782711464, "loss": 0.0057, "step": 10492 }, { "epoch": 2.14, "learning_rate": 0.00018660419882014713, "loss": 0.0097, "step": 10493 }, { "epoch": 2.14, "learning_rate": 0.00018658539920182038, "loss": 0.0039, "step": 10494 }, { "epoch": 2.14, "learning_rate": 0.00018656659897244842, "loss": 0.009, "step": 10495 }, { "epoch": 2.14, "learning_rate": 0.00018654779813234525, "loss": 0.0098, "step": 10496 }, { "epoch": 2.14, "learning_rate": 0.00018652899668182481, "loss": 0.0045, "step": 10497 }, { "epoch": 2.14, "learning_rate": 0.00018651019462120118, "loss": 0.0109, "step": 10498 }, { "epoch": 2.14, "learning_rate": 0.0001864913919507884, "loss": 0.0123, "step": 10499 }, { "epoch": 2.14, "learning_rate": 0.00018647258867090054, "loss": 0.0099, "step": 10500 }, { "epoch": 2.14, "learning_rate": 0.00018645378478185156, "loss": 0.0032, "step": 10501 }, { "epoch": 2.14, "learning_rate": 0.00018643498028395554, "loss": 0.0104, "step": 10502 }, { "epoch": 2.14, "learning_rate": 0.0001864161751775266, "loss": 0.0022, "step": 10503 }, { "epoch": 2.14, "learning_rate": 0.0001863973694628788, "loss": 0.0224, "step": 10504 }, { "epoch": 2.14, "learning_rate": 0.00018637856314032624, "loss": 0.0068, "step": 10505 }, { "epoch": 2.14, "learning_rate": 0.00018635975621018297, "loss": 0.021, "step": 10506 }, { "epoch": 2.14, "learning_rate": 0.00018634094867276313, "loss": 0.0235, "step": 10507 }, { "epoch": 2.14, "learning_rate": 0.00018632214052838087, "loss": 0.0012, "step": 10508 }, { "epoch": 2.14, "learning_rate": 0.0001863033317773503, "loss": 0.0047, "step": 10509 }, { "epoch": 2.14, "learning_rate": 0.00018628452241998555, "loss": 0.0034, "step": 10510 }, { "epoch": 2.14, "learning_rate": 0.0001862657124566008, "loss": 0.0037, "step": 10511 }, { "epoch": 2.14, "learning_rate": 0.00018624690188751017, "loss": 0.0203, "step": 10512 }, { "epoch": 2.14, "learning_rate": 0.00018622809071302786, "loss": 0.0042, "step": 10513 }, { "epoch": 2.14, "learning_rate": 0.0001862092789334681, "loss": 0.0165, "step": 10514 }, { "epoch": 2.14, "learning_rate": 0.00018619046654914497, "loss": 0.003, "step": 10515 }, { "epoch": 2.14, "learning_rate": 0.0001861716535603728, "loss": 0.0154, "step": 10516 }, { "epoch": 2.14, "learning_rate": 0.00018615283996746565, "loss": 0.0024, "step": 10517 }, { "epoch": 2.14, "learning_rate": 0.0001861340257707379, "loss": 0.0076, "step": 10518 }, { "epoch": 2.14, "learning_rate": 0.0001861152109705037, "loss": 0.0014, "step": 10519 }, { "epoch": 2.14, "learning_rate": 0.00018609639556707726, "loss": 0.0085, "step": 10520 }, { "epoch": 2.14, "learning_rate": 0.00018607757956077292, "loss": 0.0137, "step": 10521 }, { "epoch": 2.14, "learning_rate": 0.00018605876295190487, "loss": 0.005, "step": 10522 }, { "epoch": 2.14, "learning_rate": 0.00018603994574078748, "loss": 0.0004, "step": 10523 }, { "epoch": 2.14, "learning_rate": 0.00018602112792773492, "loss": 0.0051, "step": 10524 }, { "epoch": 2.14, "learning_rate": 0.00018600230951306156, "loss": 0.0127, "step": 10525 }, { "epoch": 2.14, "learning_rate": 0.0001859834904970816, "loss": 0.0021, "step": 10526 }, { "epoch": 2.14, "learning_rate": 0.00018596467088010944, "loss": 0.0077, "step": 10527 }, { "epoch": 2.14, "learning_rate": 0.00018594585066245944, "loss": 0.006, "step": 10528 }, { "epoch": 2.14, "learning_rate": 0.00018592702984444585, "loss": 0.0083, "step": 10529 }, { "epoch": 2.14, "learning_rate": 0.00018590820842638304, "loss": 0.0064, "step": 10530 }, { "epoch": 2.14, "learning_rate": 0.0001858893864085854, "loss": 0.0051, "step": 10531 }, { "epoch": 2.14, "learning_rate": 0.00018587056379136725, "loss": 0.0027, "step": 10532 }, { "epoch": 2.14, "learning_rate": 0.00018585174057504297, "loss": 0.005, "step": 10533 }, { "epoch": 2.14, "learning_rate": 0.00018583291675992693, "loss": 0.0098, "step": 10534 }, { "epoch": 2.15, "learning_rate": 0.00018581409234633354, "loss": 0.0163, "step": 10535 }, { "epoch": 2.15, "learning_rate": 0.0001857952673345772, "loss": 0.0221, "step": 10536 }, { "epoch": 2.15, "learning_rate": 0.00018577644172497237, "loss": 0.0115, "step": 10537 }, { "epoch": 2.15, "learning_rate": 0.0001857576155178334, "loss": 0.0016, "step": 10538 }, { "epoch": 2.15, "learning_rate": 0.00018573878871347473, "loss": 0.0045, "step": 10539 }, { "epoch": 2.15, "learning_rate": 0.00018571996131221084, "loss": 0.0058, "step": 10540 }, { "epoch": 2.15, "learning_rate": 0.00018570113331435622, "loss": 0.01, "step": 10541 }, { "epoch": 2.15, "learning_rate": 0.00018568230472022524, "loss": 0.0113, "step": 10542 }, { "epoch": 2.15, "learning_rate": 0.00018566347553013242, "loss": 0.0186, "step": 10543 }, { "epoch": 2.15, "learning_rate": 0.00018564464574439223, "loss": 0.0082, "step": 10544 }, { "epoch": 2.15, "learning_rate": 0.00018562581536331918, "loss": 0.0038, "step": 10545 }, { "epoch": 2.15, "learning_rate": 0.0001856069843872278, "loss": 0.0113, "step": 10546 }, { "epoch": 2.15, "learning_rate": 0.00018558815281643254, "loss": 0.004, "step": 10547 }, { "epoch": 2.15, "learning_rate": 0.00018556932065124794, "loss": 0.0036, "step": 10548 }, { "epoch": 2.15, "learning_rate": 0.00018555048789198854, "loss": 0.0018, "step": 10549 }, { "epoch": 2.15, "learning_rate": 0.0001855316545389689, "loss": 0.012, "step": 10550 }, { "epoch": 2.15, "learning_rate": 0.00018551282059250354, "loss": 0.0176, "step": 10551 }, { "epoch": 2.15, "learning_rate": 0.00018549398605290706, "loss": 0.0126, "step": 10552 }, { "epoch": 2.15, "learning_rate": 0.00018547515092049398, "loss": 0.0115, "step": 10553 }, { "epoch": 2.15, "learning_rate": 0.00018545631519557894, "loss": 0.0191, "step": 10554 }, { "epoch": 2.15, "learning_rate": 0.00018543747887847653, "loss": 0.0019, "step": 10555 }, { "epoch": 2.15, "learning_rate": 0.00018541864196950131, "loss": 0.0044, "step": 10556 }, { "epoch": 2.15, "learning_rate": 0.0001853998044689679, "loss": 0.0035, "step": 10557 }, { "epoch": 2.15, "learning_rate": 0.00018538096637719096, "loss": 0.0046, "step": 10558 }, { "epoch": 2.15, "learning_rate": 0.0001853621276944851, "loss": 0.0164, "step": 10559 }, { "epoch": 2.15, "learning_rate": 0.00018534328842116494, "loss": 0.0022, "step": 10560 }, { "epoch": 2.15, "learning_rate": 0.00018532444855754511, "loss": 0.0157, "step": 10561 }, { "epoch": 2.15, "learning_rate": 0.00018530560810394036, "loss": 0.0078, "step": 10562 }, { "epoch": 2.15, "learning_rate": 0.00018528676706066528, "loss": 0.0084, "step": 10563 }, { "epoch": 2.15, "learning_rate": 0.0001852679254280346, "loss": 0.0204, "step": 10564 }, { "epoch": 2.15, "learning_rate": 0.00018524908320636304, "loss": 0.005, "step": 10565 }, { "epoch": 2.15, "learning_rate": 0.00018523024039596517, "loss": 0.0035, "step": 10566 }, { "epoch": 2.15, "learning_rate": 0.00018521139699715584, "loss": 0.0143, "step": 10567 }, { "epoch": 2.15, "learning_rate": 0.00018519255301024967, "loss": 0.0285, "step": 10568 }, { "epoch": 2.15, "learning_rate": 0.00018517370843556145, "loss": 0.0018, "step": 10569 }, { "epoch": 2.15, "learning_rate": 0.0001851548632734059, "loss": 0.0031, "step": 10570 }, { "epoch": 2.15, "learning_rate": 0.00018513601752409778, "loss": 0.0149, "step": 10571 }, { "epoch": 2.15, "learning_rate": 0.00018511717118795183, "loss": 0.0155, "step": 10572 }, { "epoch": 2.15, "learning_rate": 0.00018509832426528286, "loss": 0.021, "step": 10573 }, { "epoch": 2.15, "learning_rate": 0.00018507947675640564, "loss": 0.0194, "step": 10574 }, { "epoch": 2.15, "learning_rate": 0.0001850606286616349, "loss": 0.0064, "step": 10575 }, { "epoch": 2.15, "learning_rate": 0.0001850417799812855, "loss": 0.0162, "step": 10576 }, { "epoch": 2.15, "learning_rate": 0.0001850229307156722, "loss": 0.0064, "step": 10577 }, { "epoch": 2.15, "learning_rate": 0.0001850040808651099, "loss": 0.0087, "step": 10578 }, { "epoch": 2.15, "learning_rate": 0.00018498523042991336, "loss": 0.0247, "step": 10579 }, { "epoch": 2.15, "learning_rate": 0.0001849663794103974, "loss": 0.0237, "step": 10580 }, { "epoch": 2.15, "learning_rate": 0.00018494752780687688, "loss": 0.0049, "step": 10581 }, { "epoch": 2.15, "learning_rate": 0.0001849286756196667, "loss": 0.0158, "step": 10582 }, { "epoch": 2.15, "learning_rate": 0.00018490982284908173, "loss": 0.0012, "step": 10583 }, { "epoch": 2.16, "learning_rate": 0.0001848909694954368, "loss": 0.0019, "step": 10584 }, { "epoch": 2.16, "learning_rate": 0.00018487211555904686, "loss": 0.0091, "step": 10585 }, { "epoch": 2.16, "learning_rate": 0.0001848532610402267, "loss": 0.026, "step": 10586 }, { "epoch": 2.16, "learning_rate": 0.0001848344059392913, "loss": 0.0024, "step": 10587 }, { "epoch": 2.16, "learning_rate": 0.00018481555025655564, "loss": 0.0107, "step": 10588 }, { "epoch": 2.16, "learning_rate": 0.00018479669399233453, "loss": 0.0263, "step": 10589 }, { "epoch": 2.16, "learning_rate": 0.0001847778371469429, "loss": 0.0067, "step": 10590 }, { "epoch": 2.16, "learning_rate": 0.00018475897972069577, "loss": 0.0109, "step": 10591 }, { "epoch": 2.16, "learning_rate": 0.00018474012171390807, "loss": 0.0435, "step": 10592 }, { "epoch": 2.16, "learning_rate": 0.00018472126312689478, "loss": 0.042, "step": 10593 }, { "epoch": 2.16, "learning_rate": 0.00018470240395997086, "loss": 0.0045, "step": 10594 }, { "epoch": 2.16, "learning_rate": 0.0001846835442134512, "loss": 0.0106, "step": 10595 }, { "epoch": 2.16, "learning_rate": 0.00018466468388765096, "loss": 0.0103, "step": 10596 }, { "epoch": 2.16, "learning_rate": 0.0001846458229828851, "loss": 0.0079, "step": 10597 }, { "epoch": 2.16, "learning_rate": 0.00018462696149946855, "loss": 0.0029, "step": 10598 }, { "epoch": 2.16, "learning_rate": 0.0001846080994377164, "loss": 0.0062, "step": 10599 }, { "epoch": 2.16, "learning_rate": 0.00018458923679794362, "loss": 0.0062, "step": 10600 }, { "epoch": 2.16, "learning_rate": 0.0001845703735804653, "loss": 0.0065, "step": 10601 }, { "epoch": 2.16, "learning_rate": 0.00018455150978559652, "loss": 0.0074, "step": 10602 }, { "epoch": 2.16, "learning_rate": 0.0001845326454136523, "loss": 0.007, "step": 10603 }, { "epoch": 2.16, "learning_rate": 0.00018451378046494766, "loss": 0.0158, "step": 10604 }, { "epoch": 2.16, "learning_rate": 0.0001844949149397978, "loss": 0.0039, "step": 10605 }, { "epoch": 2.16, "learning_rate": 0.00018447604883851774, "loss": 0.0136, "step": 10606 }, { "epoch": 2.16, "learning_rate": 0.00018445718216142257, "loss": 0.0037, "step": 10607 }, { "epoch": 2.16, "learning_rate": 0.00018443831490882743, "loss": 0.0047, "step": 10608 }, { "epoch": 2.16, "learning_rate": 0.0001844194470810474, "loss": 0.0103, "step": 10609 }, { "epoch": 2.16, "learning_rate": 0.00018440057867839766, "loss": 0.0107, "step": 10610 }, { "epoch": 2.16, "learning_rate": 0.00018438170970119328, "loss": 0.0029, "step": 10611 }, { "epoch": 2.16, "learning_rate": 0.00018436284014974947, "loss": 0.0113, "step": 10612 }, { "epoch": 2.16, "learning_rate": 0.00018434397002438138, "loss": 0.0136, "step": 10613 }, { "epoch": 2.16, "learning_rate": 0.00018432509932540412, "loss": 0.0072, "step": 10614 }, { "epoch": 2.16, "learning_rate": 0.00018430622805313298, "loss": 0.006, "step": 10615 }, { "epoch": 2.16, "learning_rate": 0.00018428735620788303, "loss": 0.006, "step": 10616 }, { "epoch": 2.16, "learning_rate": 0.0001842684837899695, "loss": 0.0062, "step": 10617 }, { "epoch": 2.16, "learning_rate": 0.00018424961079970762, "loss": 0.0221, "step": 10618 }, { "epoch": 2.16, "learning_rate": 0.0001842307372374126, "loss": 0.0133, "step": 10619 }, { "epoch": 2.16, "learning_rate": 0.00018421186310339967, "loss": 0.0015, "step": 10620 }, { "epoch": 2.16, "learning_rate": 0.00018419298839798402, "loss": 0.0083, "step": 10621 }, { "epoch": 2.16, "learning_rate": 0.00018417411312148085, "loss": 0.0084, "step": 10622 }, { "epoch": 2.16, "learning_rate": 0.00018415523727420557, "loss": 0.0089, "step": 10623 }, { "epoch": 2.16, "learning_rate": 0.00018413636085647334, "loss": 0.009, "step": 10624 }, { "epoch": 2.16, "learning_rate": 0.00018411748386859946, "loss": 0.0056, "step": 10625 }, { "epoch": 2.16, "learning_rate": 0.00018409860631089916, "loss": 0.0058, "step": 10626 }, { "epoch": 2.16, "learning_rate": 0.00018407972818368777, "loss": 0.002, "step": 10627 }, { "epoch": 2.16, "learning_rate": 0.00018406084948728062, "loss": 0.012, "step": 10628 }, { "epoch": 2.16, "learning_rate": 0.000184041970221993, "loss": 0.0205, "step": 10629 }, { "epoch": 2.16, "learning_rate": 0.0001840230903881402, "loss": 0.0045, "step": 10630 }, { "epoch": 2.16, "learning_rate": 0.00018400420998603755, "loss": 0.0059, "step": 10631 }, { "epoch": 2.16, "learning_rate": 0.0001839853290160004, "loss": 0.0181, "step": 10632 }, { "epoch": 2.17, "learning_rate": 0.00018396644747834413, "loss": 0.0183, "step": 10633 }, { "epoch": 2.17, "learning_rate": 0.00018394756537338407, "loss": 0.0096, "step": 10634 }, { "epoch": 2.17, "learning_rate": 0.00018392868270143554, "loss": 0.0037, "step": 10635 }, { "epoch": 2.17, "learning_rate": 0.00018390979946281401, "loss": 0.0067, "step": 10636 }, { "epoch": 2.17, "learning_rate": 0.0001838909156578348, "loss": 0.0116, "step": 10637 }, { "epoch": 2.17, "learning_rate": 0.00018387203128681333, "loss": 0.0075, "step": 10638 }, { "epoch": 2.17, "learning_rate": 0.00018385314635006509, "loss": 0.01, "step": 10639 }, { "epoch": 2.17, "learning_rate": 0.0001838342608479053, "loss": 0.0048, "step": 10640 }, { "epoch": 2.17, "learning_rate": 0.0001838153747806495, "loss": 0.0134, "step": 10641 }, { "epoch": 2.17, "learning_rate": 0.0001837964881486131, "loss": 0.0074, "step": 10642 }, { "epoch": 2.17, "learning_rate": 0.00018377760095211157, "loss": 0.0045, "step": 10643 }, { "epoch": 2.17, "learning_rate": 0.00018375871319146033, "loss": 0.0136, "step": 10644 }, { "epoch": 2.17, "learning_rate": 0.0001837398248669749, "loss": 0.0082, "step": 10645 }, { "epoch": 2.17, "learning_rate": 0.00018372093597897066, "loss": 0.0064, "step": 10646 }, { "epoch": 2.17, "learning_rate": 0.00018370204652776317, "loss": 0.0127, "step": 10647 }, { "epoch": 2.17, "learning_rate": 0.00018368315651366788, "loss": 0.0051, "step": 10648 }, { "epoch": 2.17, "learning_rate": 0.00018366426593700028, "loss": 0.0013, "step": 10649 }, { "epoch": 2.17, "learning_rate": 0.0001836453747980759, "loss": 0.0123, "step": 10650 }, { "epoch": 2.17, "learning_rate": 0.00018362648309721023, "loss": 0.0177, "step": 10651 }, { "epoch": 2.17, "learning_rate": 0.00018360759083471884, "loss": 0.009, "step": 10652 }, { "epoch": 2.17, "learning_rate": 0.00018358869801091723, "loss": 0.0039, "step": 10653 }, { "epoch": 2.17, "learning_rate": 0.00018356980462612098, "loss": 0.0083, "step": 10654 }, { "epoch": 2.17, "learning_rate": 0.00018355091068064557, "loss": 0.0139, "step": 10655 }, { "epoch": 2.17, "learning_rate": 0.0001835320161748067, "loss": 0.0096, "step": 10656 }, { "epoch": 2.17, "learning_rate": 0.00018351312110891982, "loss": 0.0058, "step": 10657 }, { "epoch": 2.17, "learning_rate": 0.00018349422548330057, "loss": 0.0093, "step": 10658 }, { "epoch": 2.17, "learning_rate": 0.00018347532929826455, "loss": 0.0098, "step": 10659 }, { "epoch": 2.17, "learning_rate": 0.0001834564325541273, "loss": 0.0077, "step": 10660 }, { "epoch": 2.17, "learning_rate": 0.0001834375352512045, "loss": 0.0132, "step": 10661 }, { "epoch": 2.17, "learning_rate": 0.00018341863738981175, "loss": 0.0029, "step": 10662 }, { "epoch": 2.17, "learning_rate": 0.00018339973897026464, "loss": 0.0047, "step": 10663 }, { "epoch": 2.17, "learning_rate": 0.00018338083999287883, "loss": 0.0038, "step": 10664 }, { "epoch": 2.17, "learning_rate": 0.00018336194045797, "loss": 0.0195, "step": 10665 }, { "epoch": 2.17, "learning_rate": 0.00018334304036585384, "loss": 0.0097, "step": 10666 }, { "epoch": 2.17, "learning_rate": 0.00018332413971684593, "loss": 0.0049, "step": 10667 }, { "epoch": 2.17, "learning_rate": 0.00018330523851126196, "loss": 0.0045, "step": 10668 }, { "epoch": 2.17, "learning_rate": 0.00018328633674941766, "loss": 0.0032, "step": 10669 }, { "epoch": 2.17, "learning_rate": 0.0001832674344316287, "loss": 0.0083, "step": 10670 }, { "epoch": 2.17, "learning_rate": 0.0001832485315582108, "loss": 0.0108, "step": 10671 }, { "epoch": 2.17, "learning_rate": 0.00018322962812947967, "loss": 0.0233, "step": 10672 }, { "epoch": 2.17, "learning_rate": 0.00018321072414575102, "loss": 0.0047, "step": 10673 }, { "epoch": 2.17, "learning_rate": 0.00018319181960734058, "loss": 0.0049, "step": 10674 }, { "epoch": 2.17, "learning_rate": 0.000183172914514564, "loss": 0.006, "step": 10675 }, { "epoch": 2.17, "learning_rate": 0.00018315400886773726, "loss": 0.0111, "step": 10676 }, { "epoch": 2.17, "learning_rate": 0.00018313510266717596, "loss": 0.007, "step": 10677 }, { "epoch": 2.17, "learning_rate": 0.00018311619591319592, "loss": 0.0264, "step": 10678 }, { "epoch": 2.17, "learning_rate": 0.00018309728860611282, "loss": 0.0108, "step": 10679 }, { "epoch": 2.17, "learning_rate": 0.00018307838074624262, "loss": 0.0146, "step": 10680 }, { "epoch": 2.17, "learning_rate": 0.00018305947233390095, "loss": 0.0233, "step": 10681 }, { "epoch": 2.18, "learning_rate": 0.00018304056336940374, "loss": 0.0119, "step": 10682 }, { "epoch": 2.18, "learning_rate": 0.0001830216538530667, "loss": 0.0062, "step": 10683 }, { "epoch": 2.18, "learning_rate": 0.00018300274378520571, "loss": 0.0037, "step": 10684 }, { "epoch": 2.18, "learning_rate": 0.00018298383316613665, "loss": 0.0362, "step": 10685 }, { "epoch": 2.18, "learning_rate": 0.0001829649219961753, "loss": 0.0234, "step": 10686 }, { "epoch": 2.18, "learning_rate": 0.0001829460102756375, "loss": 0.002, "step": 10687 }, { "epoch": 2.18, "learning_rate": 0.00018292709800483915, "loss": 0.0208, "step": 10688 }, { "epoch": 2.18, "learning_rate": 0.00018290818518409613, "loss": 0.0267, "step": 10689 }, { "epoch": 2.18, "learning_rate": 0.00018288927181372427, "loss": 0.0101, "step": 10690 }, { "epoch": 2.18, "learning_rate": 0.0001828703578940395, "loss": 0.005, "step": 10691 }, { "epoch": 2.18, "learning_rate": 0.0001828514434253577, "loss": 0.0054, "step": 10692 }, { "epoch": 2.18, "learning_rate": 0.0001828325284079948, "loss": 0.0054, "step": 10693 }, { "epoch": 2.18, "learning_rate": 0.0001828136128422667, "loss": 0.0191, "step": 10694 }, { "epoch": 2.18, "learning_rate": 0.00018279469672848929, "loss": 0.0172, "step": 10695 }, { "epoch": 2.18, "learning_rate": 0.00018277578006697855, "loss": 0.0119, "step": 10696 }, { "epoch": 2.18, "learning_rate": 0.00018275686285805043, "loss": 0.007, "step": 10697 }, { "epoch": 2.18, "learning_rate": 0.00018273794510202088, "loss": 0.0039, "step": 10698 }, { "epoch": 2.18, "learning_rate": 0.00018271902679920586, "loss": 0.0093, "step": 10699 }, { "epoch": 2.18, "learning_rate": 0.00018270010794992127, "loss": 0.0104, "step": 10700 }, { "epoch": 2.18, "learning_rate": 0.00018268118855448322, "loss": 0.0092, "step": 10701 }, { "epoch": 2.18, "learning_rate": 0.00018266226861320757, "loss": 0.0149, "step": 10702 }, { "epoch": 2.18, "learning_rate": 0.00018264334812641045, "loss": 0.0104, "step": 10703 }, { "epoch": 2.18, "learning_rate": 0.00018262442709440776, "loss": 0.0029, "step": 10704 }, { "epoch": 2.18, "learning_rate": 0.0001826055055175155, "loss": 0.0165, "step": 10705 }, { "epoch": 2.18, "learning_rate": 0.0001825865833960498, "loss": 0.0038, "step": 10706 }, { "epoch": 2.18, "learning_rate": 0.00018256766073032661, "loss": 0.0086, "step": 10707 }, { "epoch": 2.18, "learning_rate": 0.00018254873752066212, "loss": 0.0043, "step": 10708 }, { "epoch": 2.18, "learning_rate": 0.00018252981376737219, "loss": 0.0083, "step": 10709 }, { "epoch": 2.18, "learning_rate": 0.00018251088947077298, "loss": 0.0047, "step": 10710 }, { "epoch": 2.18, "learning_rate": 0.00018249196463118055, "loss": 0.0068, "step": 10711 }, { "epoch": 2.18, "learning_rate": 0.00018247303924891095, "loss": 0.0053, "step": 10712 }, { "epoch": 2.18, "learning_rate": 0.00018245411332428032, "loss": 0.0014, "step": 10713 }, { "epoch": 2.18, "learning_rate": 0.00018243518685760477, "loss": 0.0169, "step": 10714 }, { "epoch": 2.18, "learning_rate": 0.0001824162598492003, "loss": 0.0041, "step": 10715 }, { "epoch": 2.18, "learning_rate": 0.00018239733229938313, "loss": 0.0213, "step": 10716 }, { "epoch": 2.18, "learning_rate": 0.00018237840420846937, "loss": 0.0019, "step": 10717 }, { "epoch": 2.18, "learning_rate": 0.00018235947557677514, "loss": 0.005, "step": 10718 }, { "epoch": 2.18, "learning_rate": 0.00018234054640461656, "loss": 0.0151, "step": 10719 }, { "epoch": 2.18, "learning_rate": 0.00018232161669230984, "loss": 0.0131, "step": 10720 }, { "epoch": 2.18, "learning_rate": 0.0001823026864401711, "loss": 0.0017, "step": 10721 }, { "epoch": 2.18, "learning_rate": 0.00018228375564851654, "loss": 0.0078, "step": 10722 }, { "epoch": 2.18, "learning_rate": 0.00018226482431766232, "loss": 0.005, "step": 10723 }, { "epoch": 2.18, "learning_rate": 0.0001822458924479246, "loss": 0.004, "step": 10724 }, { "epoch": 2.18, "learning_rate": 0.00018222696003961962, "loss": 0.0093, "step": 10725 }, { "epoch": 2.18, "learning_rate": 0.00018220802709306355, "loss": 0.0141, "step": 10726 }, { "epoch": 2.18, "learning_rate": 0.00018218909360857266, "loss": 0.0049, "step": 10727 }, { "epoch": 2.18, "learning_rate": 0.0001821701595864631, "loss": 0.0013, "step": 10728 }, { "epoch": 2.18, "learning_rate": 0.00018215122502705122, "loss": 0.0098, "step": 10729 }, { "epoch": 2.18, "learning_rate": 0.00018213228993065313, "loss": 0.003, "step": 10730 }, { "epoch": 2.19, "learning_rate": 0.00018211335429758524, "loss": 0.0088, "step": 10731 }, { "epoch": 2.19, "learning_rate": 0.00018209441812816363, "loss": 0.0043, "step": 10732 }, { "epoch": 2.19, "learning_rate": 0.00018207548142270465, "loss": 0.0168, "step": 10733 }, { "epoch": 2.19, "learning_rate": 0.00018205654418152462, "loss": 0.0222, "step": 10734 }, { "epoch": 2.19, "learning_rate": 0.00018203760640493976, "loss": 0.0024, "step": 10735 }, { "epoch": 2.19, "learning_rate": 0.0001820186680932664, "loss": 0.0097, "step": 10736 }, { "epoch": 2.19, "learning_rate": 0.00018199972924682088, "loss": 0.0118, "step": 10737 }, { "epoch": 2.19, "learning_rate": 0.00018198078986591946, "loss": 0.0056, "step": 10738 }, { "epoch": 2.19, "learning_rate": 0.0001819618499508785, "loss": 0.0029, "step": 10739 }, { "epoch": 2.19, "learning_rate": 0.00018194290950201432, "loss": 0.0057, "step": 10740 }, { "epoch": 2.19, "learning_rate": 0.00018192396851964321, "loss": 0.002, "step": 10741 }, { "epoch": 2.19, "learning_rate": 0.00018190502700408156, "loss": 0.0167, "step": 10742 }, { "epoch": 2.19, "learning_rate": 0.00018188608495564576, "loss": 0.0137, "step": 10743 }, { "epoch": 2.19, "learning_rate": 0.00018186714237465216, "loss": 0.0034, "step": 10744 }, { "epoch": 2.19, "learning_rate": 0.00018184819926141712, "loss": 0.0114, "step": 10745 }, { "epoch": 2.19, "learning_rate": 0.00018182925561625703, "loss": 0.0037, "step": 10746 }, { "epoch": 2.19, "learning_rate": 0.0001818103114394883, "loss": 0.0122, "step": 10747 }, { "epoch": 2.19, "learning_rate": 0.00018179136673142728, "loss": 0.0377, "step": 10748 }, { "epoch": 2.19, "learning_rate": 0.00018177242149239046, "loss": 0.0142, "step": 10749 }, { "epoch": 2.19, "learning_rate": 0.00018175347572269425, "loss": 0.0072, "step": 10750 }, { "epoch": 2.19, "learning_rate": 0.00018173452942265504, "loss": 0.0006, "step": 10751 }, { "epoch": 2.19, "learning_rate": 0.00018171558259258926, "loss": 0.0064, "step": 10752 }, { "epoch": 2.19, "learning_rate": 0.0001816966352328134, "loss": 0.007, "step": 10753 }, { "epoch": 2.19, "learning_rate": 0.0001816776873436439, "loss": 0.0033, "step": 10754 }, { "epoch": 2.19, "learning_rate": 0.00018165873892539726, "loss": 0.0083, "step": 10755 }, { "epoch": 2.19, "learning_rate": 0.00018163978997838987, "loss": 0.0118, "step": 10756 }, { "epoch": 2.19, "learning_rate": 0.00018162084050293828, "loss": 0.0175, "step": 10757 }, { "epoch": 2.19, "learning_rate": 0.00018160189049935892, "loss": 0.0092, "step": 10758 }, { "epoch": 2.19, "learning_rate": 0.0001815829399679684, "loss": 0.0024, "step": 10759 }, { "epoch": 2.19, "learning_rate": 0.00018156398890908316, "loss": 0.0107, "step": 10760 }, { "epoch": 2.19, "learning_rate": 0.00018154503732301967, "loss": 0.0103, "step": 10761 }, { "epoch": 2.19, "learning_rate": 0.00018152608521009456, "loss": 0.0172, "step": 10762 }, { "epoch": 2.19, "learning_rate": 0.00018150713257062434, "loss": 0.0112, "step": 10763 }, { "epoch": 2.19, "learning_rate": 0.00018148817940492548, "loss": 0.0062, "step": 10764 }, { "epoch": 2.19, "learning_rate": 0.00018146922571331462, "loss": 0.0039, "step": 10765 }, { "epoch": 2.19, "learning_rate": 0.00018145027149610828, "loss": 0.0097, "step": 10766 }, { "epoch": 2.19, "learning_rate": 0.00018143131675362302, "loss": 0.0226, "step": 10767 }, { "epoch": 2.19, "learning_rate": 0.00018141236148617546, "loss": 0.0081, "step": 10768 }, { "epoch": 2.19, "learning_rate": 0.00018139340569408213, "loss": 0.0034, "step": 10769 }, { "epoch": 2.19, "learning_rate": 0.0001813744493776597, "loss": 0.0218, "step": 10770 }, { "epoch": 2.19, "learning_rate": 0.00018135549253722472, "loss": 0.0069, "step": 10771 }, { "epoch": 2.19, "learning_rate": 0.00018133653517309387, "loss": 0.0245, "step": 10772 }, { "epoch": 2.19, "learning_rate": 0.00018131757728558371, "loss": 0.0057, "step": 10773 }, { "epoch": 2.19, "learning_rate": 0.0001812986188750109, "loss": 0.0015, "step": 10774 }, { "epoch": 2.19, "learning_rate": 0.00018127965994169207, "loss": 0.0037, "step": 10775 }, { "epoch": 2.19, "learning_rate": 0.00018126070048594386, "loss": 0.0062, "step": 10776 }, { "epoch": 2.19, "learning_rate": 0.00018124174050808292, "loss": 0.0017, "step": 10777 }, { "epoch": 2.19, "learning_rate": 0.000181222780008426, "loss": 0.0127, "step": 10778 }, { "epoch": 2.19, "learning_rate": 0.0001812038189872897, "loss": 0.0029, "step": 10779 }, { "epoch": 2.2, "learning_rate": 0.0001811848574449907, "loss": 0.0132, "step": 10780 }, { "epoch": 2.2, "learning_rate": 0.0001811658953818457, "loss": 0.0253, "step": 10781 }, { "epoch": 2.2, "learning_rate": 0.00018114693279817147, "loss": 0.0057, "step": 10782 }, { "epoch": 2.2, "learning_rate": 0.00018112796969428464, "loss": 0.0067, "step": 10783 }, { "epoch": 2.2, "learning_rate": 0.00018110900607050195, "loss": 0.0049, "step": 10784 }, { "epoch": 2.2, "learning_rate": 0.00018109004192714016, "loss": 0.0134, "step": 10785 }, { "epoch": 2.2, "learning_rate": 0.00018107107726451595, "loss": 0.0045, "step": 10786 }, { "epoch": 2.2, "learning_rate": 0.00018105211208294616, "loss": 0.0078, "step": 10787 }, { "epoch": 2.2, "learning_rate": 0.00018103314638274744, "loss": 0.0183, "step": 10788 }, { "epoch": 2.2, "learning_rate": 0.00018101418016423654, "loss": 0.0051, "step": 10789 }, { "epoch": 2.2, "learning_rate": 0.00018099521342773036, "loss": 0.0048, "step": 10790 }, { "epoch": 2.2, "learning_rate": 0.0001809762461735456, "loss": 0.016, "step": 10791 }, { "epoch": 2.2, "learning_rate": 0.00018095727840199903, "loss": 0.0065, "step": 10792 }, { "epoch": 2.2, "learning_rate": 0.0001809383101134075, "loss": 0.0055, "step": 10793 }, { "epoch": 2.2, "learning_rate": 0.00018091934130808778, "loss": 0.0054, "step": 10794 }, { "epoch": 2.2, "learning_rate": 0.0001809003719863567, "loss": 0.012, "step": 10795 }, { "epoch": 2.2, "learning_rate": 0.00018088140214853114, "loss": 0.0102, "step": 10796 }, { "epoch": 2.2, "learning_rate": 0.00018086243179492778, "loss": 0.0036, "step": 10797 }, { "epoch": 2.2, "learning_rate": 0.0001808434609258636, "loss": 0.0019, "step": 10798 }, { "epoch": 2.2, "learning_rate": 0.00018082448954165537, "loss": 0.0066, "step": 10799 }, { "epoch": 2.2, "learning_rate": 0.00018080551764261999, "loss": 0.0167, "step": 10800 }, { "epoch": 2.2, "learning_rate": 0.00018078654522907432, "loss": 0.0094, "step": 10801 }, { "epoch": 2.2, "learning_rate": 0.00018076757230133523, "loss": 0.0029, "step": 10802 }, { "epoch": 2.2, "learning_rate": 0.0001807485988597196, "loss": 0.0104, "step": 10803 }, { "epoch": 2.2, "learning_rate": 0.0001807296249045443, "loss": 0.007, "step": 10804 }, { "epoch": 2.2, "learning_rate": 0.00018071065043612631, "loss": 0.0062, "step": 10805 }, { "epoch": 2.2, "learning_rate": 0.0001806916754547825, "loss": 0.0052, "step": 10806 }, { "epoch": 2.2, "learning_rate": 0.00018067269996082972, "loss": 0.0101, "step": 10807 }, { "epoch": 2.2, "learning_rate": 0.00018065372395458497, "loss": 0.0045, "step": 10808 }, { "epoch": 2.2, "learning_rate": 0.00018063474743636518, "loss": 0.0063, "step": 10809 }, { "epoch": 2.2, "learning_rate": 0.0001806157704064873, "loss": 0.0162, "step": 10810 }, { "epoch": 2.2, "learning_rate": 0.0001805967928652682, "loss": 0.0136, "step": 10811 }, { "epoch": 2.2, "learning_rate": 0.00018057781481302496, "loss": 0.0088, "step": 10812 }, { "epoch": 2.2, "learning_rate": 0.00018055883625007447, "loss": 0.0156, "step": 10813 }, { "epoch": 2.2, "learning_rate": 0.00018053985717673374, "loss": 0.0181, "step": 10814 }, { "epoch": 2.2, "learning_rate": 0.00018052087759331972, "loss": 0.0031, "step": 10815 }, { "epoch": 2.2, "learning_rate": 0.00018050189750014946, "loss": 0.0026, "step": 10816 }, { "epoch": 2.2, "learning_rate": 0.00018048291689753992, "loss": 0.0083, "step": 10817 }, { "epoch": 2.2, "learning_rate": 0.00018046393578580812, "loss": 0.0099, "step": 10818 }, { "epoch": 2.2, "learning_rate": 0.0001804449541652711, "loss": 0.0155, "step": 10819 }, { "epoch": 2.2, "learning_rate": 0.00018042597203624588, "loss": 0.0033, "step": 10820 }, { "epoch": 2.2, "learning_rate": 0.00018040698939904949, "loss": 0.0144, "step": 10821 }, { "epoch": 2.2, "learning_rate": 0.00018038800625399897, "loss": 0.0167, "step": 10822 }, { "epoch": 2.2, "learning_rate": 0.0001803690226014114, "loss": 0.0178, "step": 10823 }, { "epoch": 2.2, "learning_rate": 0.00018035003844160384, "loss": 0.0013, "step": 10824 }, { "epoch": 2.2, "learning_rate": 0.00018033105377489333, "loss": 0.0202, "step": 10825 }, { "epoch": 2.2, "learning_rate": 0.00018031206860159697, "loss": 0.0137, "step": 10826 }, { "epoch": 2.2, "learning_rate": 0.00018029308292203183, "loss": 0.0048, "step": 10827 }, { "epoch": 2.2, "learning_rate": 0.00018027409673651508, "loss": 0.0077, "step": 10828 }, { "epoch": 2.2, "learning_rate": 0.00018025511004536373, "loss": 0.0094, "step": 10829 }, { "epoch": 2.21, "learning_rate": 0.0001802361228488949, "loss": 0.0171, "step": 10830 }, { "epoch": 2.21, "learning_rate": 0.00018021713514742576, "loss": 0.0049, "step": 10831 }, { "epoch": 2.21, "learning_rate": 0.00018019814694127342, "loss": 0.0072, "step": 10832 }, { "epoch": 2.21, "learning_rate": 0.0001801791582307551, "loss": 0.0099, "step": 10833 }, { "epoch": 2.21, "learning_rate": 0.00018016016901618777, "loss": 0.008, "step": 10834 }, { "epoch": 2.21, "learning_rate": 0.00018014117929788875, "loss": 0.0079, "step": 10835 }, { "epoch": 2.21, "learning_rate": 0.0001801221890761751, "loss": 0.0199, "step": 10836 }, { "epoch": 2.21, "learning_rate": 0.0001801031983513641, "loss": 0.0171, "step": 10837 }, { "epoch": 2.21, "learning_rate": 0.00018008420712377276, "loss": 0.0014, "step": 10838 }, { "epoch": 2.21, "learning_rate": 0.00018006521539371844, "loss": 0.0153, "step": 10839 }, { "epoch": 2.21, "learning_rate": 0.00018004622316151824, "loss": 0.0013, "step": 10840 }, { "epoch": 2.21, "learning_rate": 0.0001800272304274894, "loss": 0.0183, "step": 10841 }, { "epoch": 2.21, "learning_rate": 0.00018000823719194913, "loss": 0.0091, "step": 10842 }, { "epoch": 2.21, "learning_rate": 0.0001799892434552147, "loss": 0.0155, "step": 10843 }, { "epoch": 2.21, "learning_rate": 0.00017997024921760326, "loss": 0.0032, "step": 10844 }, { "epoch": 2.21, "learning_rate": 0.00017995125447943207, "loss": 0.0302, "step": 10845 }, { "epoch": 2.21, "learning_rate": 0.0001799322592410184, "loss": 0.0074, "step": 10846 }, { "epoch": 2.21, "learning_rate": 0.00017991326350267955, "loss": 0.0016, "step": 10847 }, { "epoch": 2.21, "learning_rate": 0.0001798942672647327, "loss": 0.0058, "step": 10848 }, { "epoch": 2.21, "learning_rate": 0.00017987527052749518, "loss": 0.0033, "step": 10849 }, { "epoch": 2.21, "learning_rate": 0.0001798562732912842, "loss": 0.0033, "step": 10850 }, { "epoch": 2.21, "learning_rate": 0.0001798372755564171, "loss": 0.0539, "step": 10851 }, { "epoch": 2.21, "learning_rate": 0.0001798182773232112, "loss": 0.0038, "step": 10852 }, { "epoch": 2.21, "learning_rate": 0.00017979927859198378, "loss": 0.0138, "step": 10853 }, { "epoch": 2.21, "learning_rate": 0.00017978027936305216, "loss": 0.0029, "step": 10854 }, { "epoch": 2.21, "learning_rate": 0.00017976127963673365, "loss": 0.0079, "step": 10855 }, { "epoch": 2.21, "learning_rate": 0.0001797422794133456, "loss": 0.0144, "step": 10856 }, { "epoch": 2.21, "learning_rate": 0.00017972327869320538, "loss": 0.0045, "step": 10857 }, { "epoch": 2.21, "learning_rate": 0.00017970427747663025, "loss": 0.0157, "step": 10858 }, { "epoch": 2.21, "learning_rate": 0.0001796852757639376, "loss": 0.0031, "step": 10859 }, { "epoch": 2.21, "learning_rate": 0.00017966627355544485, "loss": 0.0198, "step": 10860 }, { "epoch": 2.21, "learning_rate": 0.00017964727085146933, "loss": 0.0364, "step": 10861 }, { "epoch": 2.21, "learning_rate": 0.00017962826765232837, "loss": 0.0051, "step": 10862 }, { "epoch": 2.21, "learning_rate": 0.00017960926395833946, "loss": 0.014, "step": 10863 }, { "epoch": 2.21, "learning_rate": 0.00017959025976981995, "loss": 0.0091, "step": 10864 }, { "epoch": 2.21, "learning_rate": 0.00017957125508708726, "loss": 0.0362, "step": 10865 }, { "epoch": 2.21, "learning_rate": 0.00017955224991045876, "loss": 0.0062, "step": 10866 }, { "epoch": 2.21, "learning_rate": 0.00017953324424025191, "loss": 0.0046, "step": 10867 }, { "epoch": 2.21, "learning_rate": 0.00017951423807678415, "loss": 0.0104, "step": 10868 }, { "epoch": 2.21, "learning_rate": 0.00017949523142037286, "loss": 0.0093, "step": 10869 }, { "epoch": 2.21, "learning_rate": 0.0001794762242713356, "loss": 0.0164, "step": 10870 }, { "epoch": 2.21, "learning_rate": 0.0001794572166299897, "loss": 0.0032, "step": 10871 }, { "epoch": 2.21, "learning_rate": 0.00017943820849665267, "loss": 0.0068, "step": 10872 }, { "epoch": 2.21, "learning_rate": 0.000179419199871642, "loss": 0.0287, "step": 10873 }, { "epoch": 2.21, "learning_rate": 0.00017940019075527518, "loss": 0.0016, "step": 10874 }, { "epoch": 2.21, "learning_rate": 0.0001793811811478697, "loss": 0.0088, "step": 10875 }, { "epoch": 2.21, "learning_rate": 0.00017936217104974297, "loss": 0.0113, "step": 10876 }, { "epoch": 2.21, "learning_rate": 0.0001793431604612126, "loss": 0.0102, "step": 10877 }, { "epoch": 2.21, "learning_rate": 0.00017932414938259605, "loss": 0.0099, "step": 10878 }, { "epoch": 2.22, "learning_rate": 0.00017930513781421085, "loss": 0.027, "step": 10879 }, { "epoch": 2.22, "learning_rate": 0.00017928612575637454, "loss": 0.0047, "step": 10880 }, { "epoch": 2.22, "learning_rate": 0.00017926711320940465, "loss": 0.0151, "step": 10881 }, { "epoch": 2.22, "learning_rate": 0.0001792481001736187, "loss": 0.0014, "step": 10882 }, { "epoch": 2.22, "learning_rate": 0.00017922908664933426, "loss": 0.0045, "step": 10883 }, { "epoch": 2.22, "learning_rate": 0.00017921007263686895, "loss": 0.019, "step": 10884 }, { "epoch": 2.22, "learning_rate": 0.00017919105813654025, "loss": 0.008, "step": 10885 }, { "epoch": 2.22, "learning_rate": 0.00017917204314866578, "loss": 0.0069, "step": 10886 }, { "epoch": 2.22, "learning_rate": 0.00017915302767356313, "loss": 0.0109, "step": 10887 }, { "epoch": 2.22, "learning_rate": 0.00017913401171154993, "loss": 0.017, "step": 10888 }, { "epoch": 2.22, "learning_rate": 0.0001791149952629437, "loss": 0.0059, "step": 10889 }, { "epoch": 2.22, "learning_rate": 0.00017909597832806208, "loss": 0.0065, "step": 10890 }, { "epoch": 2.22, "learning_rate": 0.0001790769609072227, "loss": 0.0072, "step": 10891 }, { "epoch": 2.22, "learning_rate": 0.00017905794300074318, "loss": 0.0101, "step": 10892 }, { "epoch": 2.22, "learning_rate": 0.00017903892460894118, "loss": 0.0102, "step": 10893 }, { "epoch": 2.22, "learning_rate": 0.00017901990573213433, "loss": 0.0026, "step": 10894 }, { "epoch": 2.22, "learning_rate": 0.00017900088637064028, "loss": 0.0012, "step": 10895 }, { "epoch": 2.22, "learning_rate": 0.00017898186652477667, "loss": 0.0168, "step": 10896 }, { "epoch": 2.22, "learning_rate": 0.00017896284619486116, "loss": 0.0102, "step": 10897 }, { "epoch": 2.22, "learning_rate": 0.0001789438253812115, "loss": 0.0166, "step": 10898 }, { "epoch": 2.22, "learning_rate": 0.00017892480408414528, "loss": 0.0089, "step": 10899 }, { "epoch": 2.22, "learning_rate": 0.00017890578230398023, "loss": 0.0142, "step": 10900 }, { "epoch": 2.22, "learning_rate": 0.00017888676004103408, "loss": 0.0104, "step": 10901 }, { "epoch": 2.22, "learning_rate": 0.00017886773729562446, "loss": 0.0073, "step": 10902 }, { "epoch": 2.22, "learning_rate": 0.0001788487140680692, "loss": 0.0131, "step": 10903 }, { "epoch": 2.22, "learning_rate": 0.0001788296903586859, "loss": 0.0009, "step": 10904 }, { "epoch": 2.22, "learning_rate": 0.0001788106661677924, "loss": 0.0215, "step": 10905 }, { "epoch": 2.22, "learning_rate": 0.00017879164149570638, "loss": 0.0075, "step": 10906 }, { "epoch": 2.22, "learning_rate": 0.0001787726163427456, "loss": 0.0035, "step": 10907 }, { "epoch": 2.22, "learning_rate": 0.0001787535907092278, "loss": 0.0078, "step": 10908 }, { "epoch": 2.22, "learning_rate": 0.00017873456459547074, "loss": 0.0054, "step": 10909 }, { "epoch": 2.22, "learning_rate": 0.00017871553800179223, "loss": 0.0084, "step": 10910 }, { "epoch": 2.22, "learning_rate": 0.00017869651092851008, "loss": 0.011, "step": 10911 }, { "epoch": 2.22, "learning_rate": 0.00017867748337594197, "loss": 0.011, "step": 10912 }, { "epoch": 2.22, "learning_rate": 0.00017865845534440576, "loss": 0.0027, "step": 10913 }, { "epoch": 2.22, "learning_rate": 0.00017863942683421925, "loss": 0.0193, "step": 10914 }, { "epoch": 2.22, "learning_rate": 0.00017862039784570025, "loss": 0.0209, "step": 10915 }, { "epoch": 2.22, "learning_rate": 0.0001786013683791666, "loss": 0.0042, "step": 10916 }, { "epoch": 2.22, "learning_rate": 0.00017858233843493613, "loss": 0.004, "step": 10917 }, { "epoch": 2.22, "learning_rate": 0.00017856330801332661, "loss": 0.0076, "step": 10918 }, { "epoch": 2.22, "learning_rate": 0.00017854427711465595, "loss": 0.0112, "step": 10919 }, { "epoch": 2.22, "learning_rate": 0.00017852524573924196, "loss": 0.0049, "step": 10920 }, { "epoch": 2.22, "learning_rate": 0.00017850621388740257, "loss": 0.0007, "step": 10921 }, { "epoch": 2.22, "learning_rate": 0.00017848718155945555, "loss": 0.0057, "step": 10922 }, { "epoch": 2.22, "learning_rate": 0.00017846814875571886, "loss": 0.0138, "step": 10923 }, { "epoch": 2.22, "learning_rate": 0.00017844911547651034, "loss": 0.0145, "step": 10924 }, { "epoch": 2.22, "learning_rate": 0.00017843008172214783, "loss": 0.0064, "step": 10925 }, { "epoch": 2.22, "learning_rate": 0.00017841104749294936, "loss": 0.0182, "step": 10926 }, { "epoch": 2.22, "learning_rate": 0.00017839201278923274, "loss": 0.0056, "step": 10927 }, { "epoch": 2.23, "learning_rate": 0.0001783729776113159, "loss": 0.0032, "step": 10928 }, { "epoch": 2.23, "learning_rate": 0.0001783539419595168, "loss": 0.0121, "step": 10929 }, { "epoch": 2.23, "learning_rate": 0.00017833490583415336, "loss": 0.0047, "step": 10930 }, { "epoch": 2.23, "learning_rate": 0.0001783158692355435, "loss": 0.0089, "step": 10931 }, { "epoch": 2.23, "learning_rate": 0.00017829683216400515, "loss": 0.0025, "step": 10932 }, { "epoch": 2.23, "learning_rate": 0.00017827779461985628, "loss": 0.0046, "step": 10933 }, { "epoch": 2.23, "learning_rate": 0.00017825875660341492, "loss": 0.01, "step": 10934 }, { "epoch": 2.23, "learning_rate": 0.00017823971811499893, "loss": 0.0167, "step": 10935 }, { "epoch": 2.23, "learning_rate": 0.00017822067915492635, "loss": 0.0065, "step": 10936 }, { "epoch": 2.23, "learning_rate": 0.00017820163972351514, "loss": 0.004, "step": 10937 }, { "epoch": 2.23, "learning_rate": 0.00017818259982108336, "loss": 0.0098, "step": 10938 }, { "epoch": 2.23, "learning_rate": 0.00017816355944794897, "loss": 0.0079, "step": 10939 }, { "epoch": 2.23, "learning_rate": 0.00017814451860442994, "loss": 0.0031, "step": 10940 }, { "epoch": 2.23, "learning_rate": 0.0001781254772908443, "loss": 0.0013, "step": 10941 }, { "epoch": 2.23, "learning_rate": 0.00017810643550751016, "loss": 0.0081, "step": 10942 }, { "epoch": 2.23, "learning_rate": 0.00017808739325474545, "loss": 0.0007, "step": 10943 }, { "epoch": 2.23, "learning_rate": 0.00017806835053286825, "loss": 0.0251, "step": 10944 }, { "epoch": 2.23, "learning_rate": 0.00017804930734219662, "loss": 0.0112, "step": 10945 }, { "epoch": 2.23, "learning_rate": 0.00017803026368304862, "loss": 0.0099, "step": 10946 }, { "epoch": 2.23, "learning_rate": 0.0001780112195557423, "loss": 0.0017, "step": 10947 }, { "epoch": 2.23, "learning_rate": 0.00017799217496059576, "loss": 0.0073, "step": 10948 }, { "epoch": 2.23, "learning_rate": 0.00017797312989792705, "loss": 0.0032, "step": 10949 }, { "epoch": 2.23, "learning_rate": 0.00017795408436805423, "loss": 0.0134, "step": 10950 }, { "epoch": 2.23, "learning_rate": 0.00017793503837129548, "loss": 0.0149, "step": 10951 }, { "epoch": 2.23, "learning_rate": 0.00017791599190796883, "loss": 0.0088, "step": 10952 }, { "epoch": 2.23, "learning_rate": 0.00017789694497839244, "loss": 0.0048, "step": 10953 }, { "epoch": 2.23, "learning_rate": 0.0001778778975828844, "loss": 0.0064, "step": 10954 }, { "epoch": 2.23, "learning_rate": 0.00017785884972176282, "loss": 0.0128, "step": 10955 }, { "epoch": 2.23, "learning_rate": 0.0001778398013953459, "loss": 0.0051, "step": 10956 }, { "epoch": 2.23, "learning_rate": 0.0001778207526039517, "loss": 0.0075, "step": 10957 }, { "epoch": 2.23, "learning_rate": 0.0001778017033478985, "loss": 0.0092, "step": 10958 }, { "epoch": 2.23, "learning_rate": 0.00017778265362750433, "loss": 0.0064, "step": 10959 }, { "epoch": 2.23, "learning_rate": 0.00017776360344308738, "loss": 0.0269, "step": 10960 }, { "epoch": 2.23, "learning_rate": 0.00017774455279496586, "loss": 0.0099, "step": 10961 }, { "epoch": 2.23, "learning_rate": 0.00017772550168345798, "loss": 0.0062, "step": 10962 }, { "epoch": 2.23, "learning_rate": 0.00017770645010888183, "loss": 0.0152, "step": 10963 }, { "epoch": 2.23, "learning_rate": 0.00017768739807155567, "loss": 0.0177, "step": 10964 }, { "epoch": 2.23, "learning_rate": 0.0001776683455717977, "loss": 0.0051, "step": 10965 }, { "epoch": 2.23, "learning_rate": 0.0001776492926099261, "loss": 0.0025, "step": 10966 }, { "epoch": 2.23, "learning_rate": 0.0001776302391862592, "loss": 0.0037, "step": 10967 }, { "epoch": 2.23, "learning_rate": 0.0001776111853011151, "loss": 0.004, "step": 10968 }, { "epoch": 2.23, "learning_rate": 0.0001775921309548121, "loss": 0.0107, "step": 10969 }, { "epoch": 2.23, "learning_rate": 0.0001775730761476684, "loss": 0.0126, "step": 10970 }, { "epoch": 2.23, "learning_rate": 0.00017755402088000233, "loss": 0.0065, "step": 10971 }, { "epoch": 2.23, "learning_rate": 0.0001775349651521321, "loss": 0.0034, "step": 10972 }, { "epoch": 2.23, "learning_rate": 0.00017751590896437596, "loss": 0.0151, "step": 10973 }, { "epoch": 2.23, "learning_rate": 0.00017749685231705216, "loss": 0.0106, "step": 10974 }, { "epoch": 2.23, "learning_rate": 0.00017747779521047906, "loss": 0.0037, "step": 10975 }, { "epoch": 2.23, "learning_rate": 0.0001774587376449749, "loss": 0.0037, "step": 10976 }, { "epoch": 2.24, "learning_rate": 0.00017743967962085798, "loss": 0.004, "step": 10977 }, { "epoch": 2.24, "learning_rate": 0.00017742062113844663, "loss": 0.0006, "step": 10978 }, { "epoch": 2.24, "learning_rate": 0.00017740156219805915, "loss": 0.0194, "step": 10979 }, { "epoch": 2.24, "learning_rate": 0.00017738250280001383, "loss": 0.0108, "step": 10980 }, { "epoch": 2.24, "learning_rate": 0.0001773634429446291, "loss": 0.0148, "step": 10981 }, { "epoch": 2.24, "learning_rate": 0.00017734438263222318, "loss": 0.0099, "step": 10982 }, { "epoch": 2.24, "learning_rate": 0.0001773253218631144, "loss": 0.0253, "step": 10983 }, { "epoch": 2.24, "learning_rate": 0.00017730626063762123, "loss": 0.0058, "step": 10984 }, { "epoch": 2.24, "learning_rate": 0.00017728719895606192, "loss": 0.0037, "step": 10985 }, { "epoch": 2.24, "learning_rate": 0.0001772681368187549, "loss": 0.0055, "step": 10986 }, { "epoch": 2.24, "learning_rate": 0.00017724907422601852, "loss": 0.0109, "step": 10987 }, { "epoch": 2.24, "learning_rate": 0.00017723001117817116, "loss": 0.0201, "step": 10988 }, { "epoch": 2.24, "learning_rate": 0.0001772109476755312, "loss": 0.0123, "step": 10989 }, { "epoch": 2.24, "learning_rate": 0.0001771918837184171, "loss": 0.0156, "step": 10990 }, { "epoch": 2.24, "learning_rate": 0.0001771728193071472, "loss": 0.023, "step": 10991 }, { "epoch": 2.24, "learning_rate": 0.0001771537544420399, "loss": 0.0038, "step": 10992 }, { "epoch": 2.24, "learning_rate": 0.00017713468912341365, "loss": 0.0059, "step": 10993 }, { "epoch": 2.24, "learning_rate": 0.0001771156233515869, "loss": 0.0029, "step": 10994 }, { "epoch": 2.24, "learning_rate": 0.00017709655712687804, "loss": 0.0091, "step": 10995 }, { "epoch": 2.24, "learning_rate": 0.00017707749044960547, "loss": 0.0023, "step": 10996 }, { "epoch": 2.24, "learning_rate": 0.00017705842332008774, "loss": 0.003, "step": 10997 }, { "epoch": 2.24, "learning_rate": 0.00017703935573864328, "loss": 0.0157, "step": 10998 }, { "epoch": 2.24, "learning_rate": 0.00017702028770559053, "loss": 0.0095, "step": 10999 }, { "epoch": 2.24, "learning_rate": 0.00017700121922124796, "loss": 0.0292, "step": 11000 }, { "epoch": 2.24, "learning_rate": 0.00017698215028593404, "loss": 0.0019, "step": 11001 }, { "epoch": 2.24, "learning_rate": 0.00017696308089996731, "loss": 0.0028, "step": 11002 }, { "epoch": 2.24, "learning_rate": 0.00017694401106366626, "loss": 0.0123, "step": 11003 }, { "epoch": 2.24, "learning_rate": 0.00017692494077734932, "loss": 0.0074, "step": 11004 }, { "epoch": 2.24, "learning_rate": 0.0001769058700413351, "loss": 0.0116, "step": 11005 }, { "epoch": 2.24, "learning_rate": 0.000176886798855942, "loss": 0.0117, "step": 11006 }, { "epoch": 2.24, "learning_rate": 0.00017686772722148863, "loss": 0.0061, "step": 11007 }, { "epoch": 2.24, "learning_rate": 0.00017684865513829345, "loss": 0.0068, "step": 11008 }, { "epoch": 2.24, "learning_rate": 0.00017682958260667513, "loss": 0.0081, "step": 11009 }, { "epoch": 2.24, "learning_rate": 0.0001768105096269521, "loss": 0.0136, "step": 11010 }, { "epoch": 2.24, "learning_rate": 0.00017679143619944295, "loss": 0.0052, "step": 11011 }, { "epoch": 2.24, "learning_rate": 0.00017677236232446625, "loss": 0.0099, "step": 11012 }, { "epoch": 2.24, "learning_rate": 0.00017675328800234057, "loss": 0.0076, "step": 11013 }, { "epoch": 2.24, "learning_rate": 0.00017673421323338446, "loss": 0.0177, "step": 11014 }, { "epoch": 2.24, "learning_rate": 0.00017671513801791654, "loss": 0.0098, "step": 11015 }, { "epoch": 2.24, "learning_rate": 0.00017669606235625536, "loss": 0.0134, "step": 11016 }, { "epoch": 2.24, "learning_rate": 0.0001766769862487196, "loss": 0.0045, "step": 11017 }, { "epoch": 2.24, "learning_rate": 0.00017665790969562773, "loss": 0.0243, "step": 11018 }, { "epoch": 2.24, "learning_rate": 0.0001766388326972985, "loss": 0.0121, "step": 11019 }, { "epoch": 2.24, "learning_rate": 0.00017661975525405047, "loss": 0.0111, "step": 11020 }, { "epoch": 2.24, "learning_rate": 0.00017660067736620228, "loss": 0.0066, "step": 11021 }, { "epoch": 2.24, "learning_rate": 0.0001765815990340726, "loss": 0.0066, "step": 11022 }, { "epoch": 2.24, "learning_rate": 0.00017656252025798, "loss": 0.0057, "step": 11023 }, { "epoch": 2.24, "learning_rate": 0.00017654344103824318, "loss": 0.003, "step": 11024 }, { "epoch": 2.24, "learning_rate": 0.0001765243613751808, "loss": 0.0226, "step": 11025 }, { "epoch": 2.25, "learning_rate": 0.0001765052812691115, "loss": 0.007, "step": 11026 }, { "epoch": 2.25, "learning_rate": 0.00017648620072035397, "loss": 0.0033, "step": 11027 }, { "epoch": 2.25, "learning_rate": 0.0001764671197292269, "loss": 0.0124, "step": 11028 }, { "epoch": 2.25, "learning_rate": 0.00017644803829604895, "loss": 0.0062, "step": 11029 }, { "epoch": 2.25, "learning_rate": 0.0001764289564211389, "loss": 0.0142, "step": 11030 }, { "epoch": 2.25, "learning_rate": 0.0001764098741048153, "loss": 0.0265, "step": 11031 }, { "epoch": 2.25, "learning_rate": 0.00017639079134739702, "loss": 0.0034, "step": 11032 }, { "epoch": 2.25, "learning_rate": 0.0001763717081492027, "loss": 0.002, "step": 11033 }, { "epoch": 2.25, "learning_rate": 0.00017635262451055103, "loss": 0.0068, "step": 11034 }, { "epoch": 2.25, "learning_rate": 0.00017633354043176085, "loss": 0.0135, "step": 11035 }, { "epoch": 2.25, "learning_rate": 0.0001763144559131508, "loss": 0.0227, "step": 11036 }, { "epoch": 2.25, "learning_rate": 0.00017629537095503967, "loss": 0.0353, "step": 11037 }, { "epoch": 2.25, "learning_rate": 0.00017627628555774618, "loss": 0.0022, "step": 11038 }, { "epoch": 2.25, "learning_rate": 0.00017625719972158915, "loss": 0.0043, "step": 11039 }, { "epoch": 2.25, "learning_rate": 0.0001762381134468873, "loss": 0.0111, "step": 11040 }, { "epoch": 2.25, "learning_rate": 0.00017621902673395948, "loss": 0.01, "step": 11041 }, { "epoch": 2.25, "learning_rate": 0.00017619993958312437, "loss": 0.0008, "step": 11042 }, { "epoch": 2.25, "learning_rate": 0.00017618085199470082, "loss": 0.0067, "step": 11043 }, { "epoch": 2.25, "learning_rate": 0.00017616176396900764, "loss": 0.0249, "step": 11044 }, { "epoch": 2.25, "learning_rate": 0.00017614267550636358, "loss": 0.0169, "step": 11045 }, { "epoch": 2.25, "learning_rate": 0.00017612358660708757, "loss": 0.0039, "step": 11046 }, { "epoch": 2.25, "learning_rate": 0.00017610449727149832, "loss": 0.0092, "step": 11047 }, { "epoch": 2.25, "learning_rate": 0.00017608540749991465, "loss": 0.018, "step": 11048 }, { "epoch": 2.25, "learning_rate": 0.00017606631729265542, "loss": 0.0044, "step": 11049 }, { "epoch": 2.25, "learning_rate": 0.00017604722665003956, "loss": 0.0065, "step": 11050 }, { "epoch": 2.25, "learning_rate": 0.00017602813557238579, "loss": 0.0188, "step": 11051 }, { "epoch": 2.25, "learning_rate": 0.00017600904406001305, "loss": 0.025, "step": 11052 }, { "epoch": 2.25, "learning_rate": 0.00017598995211324015, "loss": 0.0103, "step": 11053 }, { "epoch": 2.25, "learning_rate": 0.00017597085973238604, "loss": 0.0095, "step": 11054 }, { "epoch": 2.25, "learning_rate": 0.00017595176691776956, "loss": 0.0164, "step": 11055 }, { "epoch": 2.25, "learning_rate": 0.00017593267366970952, "loss": 0.0011, "step": 11056 }, { "epoch": 2.25, "learning_rate": 0.00017591357998852493, "loss": 0.0113, "step": 11057 }, { "epoch": 2.25, "learning_rate": 0.0001758944858745346, "loss": 0.0123, "step": 11058 }, { "epoch": 2.25, "learning_rate": 0.0001758753913280575, "loss": 0.0031, "step": 11059 }, { "epoch": 2.25, "learning_rate": 0.0001758562963494125, "loss": 0.0142, "step": 11060 }, { "epoch": 2.25, "learning_rate": 0.00017583720093891856, "loss": 0.0029, "step": 11061 }, { "epoch": 2.25, "learning_rate": 0.00017581810509689457, "loss": 0.0182, "step": 11062 }, { "epoch": 2.25, "learning_rate": 0.0001757990088236595, "loss": 0.0145, "step": 11063 }, { "epoch": 2.25, "learning_rate": 0.00017577991211953234, "loss": 0.0073, "step": 11064 }, { "epoch": 2.25, "learning_rate": 0.00017576081498483194, "loss": 0.0013, "step": 11065 }, { "epoch": 2.25, "learning_rate": 0.00017574171741987729, "loss": 0.0091, "step": 11066 }, { "epoch": 2.25, "learning_rate": 0.00017572261942498736, "loss": 0.0156, "step": 11067 }, { "epoch": 2.25, "learning_rate": 0.00017570352100048116, "loss": 0.0066, "step": 11068 }, { "epoch": 2.25, "learning_rate": 0.00017568442214667762, "loss": 0.0076, "step": 11069 }, { "epoch": 2.25, "learning_rate": 0.00017566532286389578, "loss": 0.0124, "step": 11070 }, { "epoch": 2.25, "learning_rate": 0.00017564622315245458, "loss": 0.0019, "step": 11071 }, { "epoch": 2.25, "learning_rate": 0.00017562712301267302, "loss": 0.0103, "step": 11072 }, { "epoch": 2.25, "learning_rate": 0.00017560802244487018, "loss": 0.0109, "step": 11073 }, { "epoch": 2.25, "learning_rate": 0.00017558892144936498, "loss": 0.01, "step": 11074 }, { "epoch": 2.26, "learning_rate": 0.0001755698200264765, "loss": 0.0238, "step": 11075 }, { "epoch": 2.26, "learning_rate": 0.0001755507181765238, "loss": 0.01, "step": 11076 }, { "epoch": 2.26, "learning_rate": 0.00017553161589982586, "loss": 0.0019, "step": 11077 }, { "epoch": 2.26, "learning_rate": 0.00017551251319670172, "loss": 0.0081, "step": 11078 }, { "epoch": 2.26, "learning_rate": 0.00017549341006747047, "loss": 0.0082, "step": 11079 }, { "epoch": 2.26, "learning_rate": 0.0001754743065124511, "loss": 0.0026, "step": 11080 }, { "epoch": 2.26, "learning_rate": 0.00017545520253196275, "loss": 0.0438, "step": 11081 }, { "epoch": 2.26, "learning_rate": 0.00017543609812632448, "loss": 0.0126, "step": 11082 }, { "epoch": 2.26, "learning_rate": 0.0001754169932958554, "loss": 0.0027, "step": 11083 }, { "epoch": 2.26, "learning_rate": 0.00017539788804087447, "loss": 0.0058, "step": 11084 }, { "epoch": 2.26, "learning_rate": 0.00017537878236170094, "loss": 0.0114, "step": 11085 }, { "epoch": 2.26, "learning_rate": 0.0001753596762586538, "loss": 0.0231, "step": 11086 }, { "epoch": 2.26, "learning_rate": 0.00017534056973205224, "loss": 0.0091, "step": 11087 }, { "epoch": 2.26, "learning_rate": 0.00017532146278221528, "loss": 0.01, "step": 11088 }, { "epoch": 2.26, "learning_rate": 0.0001753023554094621, "loss": 0.004, "step": 11089 }, { "epoch": 2.26, "learning_rate": 0.00017528324761411184, "loss": 0.0164, "step": 11090 }, { "epoch": 2.26, "learning_rate": 0.00017526413939648354, "loss": 0.0148, "step": 11091 }, { "epoch": 2.26, "learning_rate": 0.00017524503075689652, "loss": 0.0101, "step": 11092 }, { "epoch": 2.26, "learning_rate": 0.00017522592169566984, "loss": 0.0139, "step": 11093 }, { "epoch": 2.26, "learning_rate": 0.0001752068122131226, "loss": 0.0107, "step": 11094 }, { "epoch": 2.26, "learning_rate": 0.000175187702309574, "loss": 0.0063, "step": 11095 }, { "epoch": 2.26, "learning_rate": 0.00017516859198534327, "loss": 0.0107, "step": 11096 }, { "epoch": 2.26, "learning_rate": 0.00017514948124074955, "loss": 0.0116, "step": 11097 }, { "epoch": 2.26, "learning_rate": 0.000175130370076112, "loss": 0.02, "step": 11098 }, { "epoch": 2.26, "learning_rate": 0.00017511125849174985, "loss": 0.0111, "step": 11099 }, { "epoch": 2.26, "learning_rate": 0.00017509214648798226, "loss": 0.0158, "step": 11100 }, { "epoch": 2.26, "learning_rate": 0.00017507303406512847, "loss": 0.0039, "step": 11101 }, { "epoch": 2.26, "learning_rate": 0.00017505392122350768, "loss": 0.0005, "step": 11102 }, { "epoch": 2.26, "learning_rate": 0.0001750348079634391, "loss": 0.0031, "step": 11103 }, { "epoch": 2.26, "learning_rate": 0.000175015694285242, "loss": 0.0052, "step": 11104 }, { "epoch": 2.26, "learning_rate": 0.00017499658018923557, "loss": 0.0107, "step": 11105 }, { "epoch": 2.26, "learning_rate": 0.0001749774656757391, "loss": 0.0224, "step": 11106 }, { "epoch": 2.26, "learning_rate": 0.00017495835074507173, "loss": 0.0176, "step": 11107 }, { "epoch": 2.26, "learning_rate": 0.00017493923539755284, "loss": 0.0075, "step": 11108 }, { "epoch": 2.26, "learning_rate": 0.0001749201196335016, "loss": 0.0234, "step": 11109 }, { "epoch": 2.26, "learning_rate": 0.00017490100345323738, "loss": 0.0287, "step": 11110 }, { "epoch": 2.26, "learning_rate": 0.00017488188685707936, "loss": 0.009, "step": 11111 }, { "epoch": 2.26, "learning_rate": 0.00017486276984534686, "loss": 0.0103, "step": 11112 }, { "epoch": 2.26, "learning_rate": 0.0001748436524183592, "loss": 0.0014, "step": 11113 }, { "epoch": 2.26, "learning_rate": 0.00017482453457643563, "loss": 0.0085, "step": 11114 }, { "epoch": 2.26, "learning_rate": 0.0001748054163198955, "loss": 0.0061, "step": 11115 }, { "epoch": 2.26, "learning_rate": 0.00017478629764905806, "loss": 0.005, "step": 11116 }, { "epoch": 2.26, "learning_rate": 0.0001747671785642427, "loss": 0.0039, "step": 11117 }, { "epoch": 2.26, "learning_rate": 0.00017474805906576865, "loss": 0.0063, "step": 11118 }, { "epoch": 2.26, "learning_rate": 0.0001747289391539553, "loss": 0.0161, "step": 11119 }, { "epoch": 2.26, "learning_rate": 0.0001747098188291221, "loss": 0.0161, "step": 11120 }, { "epoch": 2.26, "learning_rate": 0.00017469069809158814, "loss": 0.0027, "step": 11121 }, { "epoch": 2.26, "learning_rate": 0.00017467157694167298, "loss": 0.0118, "step": 11122 }, { "epoch": 2.26, "learning_rate": 0.0001746524553796959, "loss": 0.0211, "step": 11123 }, { "epoch": 2.27, "learning_rate": 0.00017463333340597632, "loss": 0.0043, "step": 11124 }, { "epoch": 2.27, "learning_rate": 0.00017461421102083353, "loss": 0.0069, "step": 11125 }, { "epoch": 2.27, "learning_rate": 0.00017459508822458694, "loss": 0.007, "step": 11126 }, { "epoch": 2.27, "learning_rate": 0.00017457596501755597, "loss": 0.0122, "step": 11127 }, { "epoch": 2.27, "learning_rate": 0.00017455684140006, "loss": 0.0061, "step": 11128 }, { "epoch": 2.27, "learning_rate": 0.00017453771737241847, "loss": 0.0087, "step": 11129 }, { "epoch": 2.27, "learning_rate": 0.00017451859293495068, "loss": 0.0059, "step": 11130 }, { "epoch": 2.27, "learning_rate": 0.00017449946808797612, "loss": 0.0092, "step": 11131 }, { "epoch": 2.27, "learning_rate": 0.0001744803428318142, "loss": 0.0011, "step": 11132 }, { "epoch": 2.27, "learning_rate": 0.0001744612171667843, "loss": 0.0032, "step": 11133 }, { "epoch": 2.27, "learning_rate": 0.00017444209109320597, "loss": 0.0114, "step": 11134 }, { "epoch": 2.27, "learning_rate": 0.00017442296461139857, "loss": 0.0087, "step": 11135 }, { "epoch": 2.27, "learning_rate": 0.0001744038377216815, "loss": 0.0057, "step": 11136 }, { "epoch": 2.27, "learning_rate": 0.0001743847104243743, "loss": 0.0044, "step": 11137 }, { "epoch": 2.27, "learning_rate": 0.0001743655827197965, "loss": 0.0121, "step": 11138 }, { "epoch": 2.27, "learning_rate": 0.00017434645460826737, "loss": 0.0091, "step": 11139 }, { "epoch": 2.27, "learning_rate": 0.00017432732609010652, "loss": 0.0079, "step": 11140 }, { "epoch": 2.27, "learning_rate": 0.0001743081971656334, "loss": 0.0054, "step": 11141 }, { "epoch": 2.27, "learning_rate": 0.00017428906783516752, "loss": 0.0033, "step": 11142 }, { "epoch": 2.27, "learning_rate": 0.00017426993809902832, "loss": 0.0054, "step": 11143 }, { "epoch": 2.27, "learning_rate": 0.00017425080795753536, "loss": 0.0084, "step": 11144 }, { "epoch": 2.27, "learning_rate": 0.00017423167741100815, "loss": 0.0068, "step": 11145 }, { "epoch": 2.27, "learning_rate": 0.00017421254645976614, "loss": 0.0055, "step": 11146 }, { "epoch": 2.27, "learning_rate": 0.00017419341510412897, "loss": 0.0053, "step": 11147 }, { "epoch": 2.27, "learning_rate": 0.00017417428334441605, "loss": 0.0029, "step": 11148 }, { "epoch": 2.27, "learning_rate": 0.000174155151180947, "loss": 0.0018, "step": 11149 }, { "epoch": 2.27, "learning_rate": 0.00017413601861404127, "loss": 0.013, "step": 11150 }, { "epoch": 2.27, "learning_rate": 0.0001741168856440185, "loss": 0.0085, "step": 11151 }, { "epoch": 2.27, "learning_rate": 0.0001740977522711982, "loss": 0.0169, "step": 11152 }, { "epoch": 2.27, "learning_rate": 0.00017407861849589999, "loss": 0.0262, "step": 11153 }, { "epoch": 2.27, "learning_rate": 0.00017405948431844338, "loss": 0.0151, "step": 11154 }, { "epoch": 2.27, "learning_rate": 0.00017404034973914794, "loss": 0.0074, "step": 11155 }, { "epoch": 2.27, "learning_rate": 0.00017402121475833333, "loss": 0.0023, "step": 11156 }, { "epoch": 2.27, "learning_rate": 0.00017400207937631908, "loss": 0.0058, "step": 11157 }, { "epoch": 2.27, "learning_rate": 0.0001739829435934248, "loss": 0.0115, "step": 11158 }, { "epoch": 2.27, "learning_rate": 0.00017396380740997003, "loss": 0.0039, "step": 11159 }, { "epoch": 2.27, "learning_rate": 0.0001739446708262745, "loss": 0.0077, "step": 11160 }, { "epoch": 2.27, "learning_rate": 0.00017392553384265778, "loss": 0.0121, "step": 11161 }, { "epoch": 2.27, "learning_rate": 0.00017390639645943945, "loss": 0.0101, "step": 11162 }, { "epoch": 2.27, "learning_rate": 0.00017388725867693915, "loss": 0.01, "step": 11163 }, { "epoch": 2.27, "learning_rate": 0.00017386812049547656, "loss": 0.003, "step": 11164 }, { "epoch": 2.27, "learning_rate": 0.00017384898191537132, "loss": 0.0089, "step": 11165 }, { "epoch": 2.27, "learning_rate": 0.00017382984293694306, "loss": 0.0094, "step": 11166 }, { "epoch": 2.27, "learning_rate": 0.00017381070356051144, "loss": 0.0145, "step": 11167 }, { "epoch": 2.27, "learning_rate": 0.00017379156378639614, "loss": 0.0221, "step": 11168 }, { "epoch": 2.27, "learning_rate": 0.0001737724236149168, "loss": 0.007, "step": 11169 }, { "epoch": 2.27, "learning_rate": 0.0001737532830463931, "loss": 0.0111, "step": 11170 }, { "epoch": 2.27, "learning_rate": 0.00017373414208114477, "loss": 0.0033, "step": 11171 }, { "epoch": 2.27, "learning_rate": 0.00017371500071949143, "loss": 0.0118, "step": 11172 }, { "epoch": 2.28, "learning_rate": 0.0001736958589617528, "loss": 0.0147, "step": 11173 }, { "epoch": 2.28, "learning_rate": 0.0001736767168082486, "loss": 0.0048, "step": 11174 }, { "epoch": 2.28, "learning_rate": 0.00017365757425929858, "loss": 0.0101, "step": 11175 }, { "epoch": 2.28, "learning_rate": 0.00017363843131522238, "loss": 0.0155, "step": 11176 }, { "epoch": 2.28, "learning_rate": 0.00017361928797633976, "loss": 0.0168, "step": 11177 }, { "epoch": 2.28, "learning_rate": 0.00017360014424297045, "loss": 0.001, "step": 11178 }, { "epoch": 2.28, "learning_rate": 0.00017358100011543418, "loss": 0.0048, "step": 11179 }, { "epoch": 2.28, "learning_rate": 0.00017356185559405074, "loss": 0.0045, "step": 11180 }, { "epoch": 2.28, "learning_rate": 0.00017354271067913978, "loss": 0.0048, "step": 11181 }, { "epoch": 2.28, "learning_rate": 0.0001735235653710211, "loss": 0.0096, "step": 11182 }, { "epoch": 2.28, "learning_rate": 0.00017350441967001453, "loss": 0.0131, "step": 11183 }, { "epoch": 2.28, "learning_rate": 0.00017348527357643974, "loss": 0.0048, "step": 11184 }, { "epoch": 2.28, "learning_rate": 0.00017346612709061656, "loss": 0.0088, "step": 11185 }, { "epoch": 2.28, "learning_rate": 0.0001734469802128648, "loss": 0.0012, "step": 11186 }, { "epoch": 2.28, "learning_rate": 0.00017342783294350416, "loss": 0.0047, "step": 11187 }, { "epoch": 2.28, "learning_rate": 0.0001734086852828545, "loss": 0.001, "step": 11188 }, { "epoch": 2.28, "learning_rate": 0.00017338953723123563, "loss": 0.0169, "step": 11189 }, { "epoch": 2.28, "learning_rate": 0.0001733703887889673, "loss": 0.0035, "step": 11190 }, { "epoch": 2.28, "learning_rate": 0.0001733512399563694, "loss": 0.0038, "step": 11191 }, { "epoch": 2.28, "learning_rate": 0.00017333209073376168, "loss": 0.0006, "step": 11192 }, { "epoch": 2.28, "learning_rate": 0.00017331294112146403, "loss": 0.01, "step": 11193 }, { "epoch": 2.28, "learning_rate": 0.00017329379111979626, "loss": 0.0129, "step": 11194 }, { "epoch": 2.28, "learning_rate": 0.00017327464072907817, "loss": 0.0116, "step": 11195 }, { "epoch": 2.28, "learning_rate": 0.00017325548994962965, "loss": 0.0061, "step": 11196 }, { "epoch": 2.28, "learning_rate": 0.00017323633878177057, "loss": 0.003, "step": 11197 }, { "epoch": 2.28, "learning_rate": 0.0001732171872258208, "loss": 0.0155, "step": 11198 }, { "epoch": 2.28, "learning_rate": 0.00017319803528210016, "loss": 0.0143, "step": 11199 }, { "epoch": 2.28, "learning_rate": 0.00017317888295092853, "loss": 0.0039, "step": 11200 }, { "epoch": 2.28, "learning_rate": 0.0001731597302326258, "loss": 0.0305, "step": 11201 }, { "epoch": 2.28, "learning_rate": 0.00017314057712751184, "loss": 0.0087, "step": 11202 }, { "epoch": 2.28, "learning_rate": 0.00017312142363590659, "loss": 0.001, "step": 11203 }, { "epoch": 2.28, "learning_rate": 0.00017310226975812988, "loss": 0.0078, "step": 11204 }, { "epoch": 2.28, "learning_rate": 0.0001730831154945017, "loss": 0.0032, "step": 11205 }, { "epoch": 2.28, "learning_rate": 0.0001730639608453419, "loss": 0.0118, "step": 11206 }, { "epoch": 2.28, "learning_rate": 0.00017304480581097043, "loss": 0.0024, "step": 11207 }, { "epoch": 2.28, "learning_rate": 0.0001730256503917072, "loss": 0.0093, "step": 11208 }, { "epoch": 2.28, "learning_rate": 0.00017300649458787214, "loss": 0.0399, "step": 11209 }, { "epoch": 2.28, "learning_rate": 0.00017298733839978518, "loss": 0.0058, "step": 11210 }, { "epoch": 2.28, "learning_rate": 0.00017296818182776632, "loss": 0.0105, "step": 11211 }, { "epoch": 2.28, "learning_rate": 0.00017294902487213548, "loss": 0.0139, "step": 11212 }, { "epoch": 2.28, "learning_rate": 0.00017292986753321253, "loss": 0.0115, "step": 11213 }, { "epoch": 2.28, "learning_rate": 0.00017291070981131755, "loss": 0.0141, "step": 11214 }, { "epoch": 2.28, "learning_rate": 0.00017289155170677043, "loss": 0.005, "step": 11215 }, { "epoch": 2.28, "learning_rate": 0.00017287239321989119, "loss": 0.0062, "step": 11216 }, { "epoch": 2.28, "learning_rate": 0.0001728532343509999, "loss": 0.0039, "step": 11217 }, { "epoch": 2.28, "learning_rate": 0.00017283407510041638, "loss": 0.0046, "step": 11218 }, { "epoch": 2.28, "learning_rate": 0.0001728149154684607, "loss": 0.0103, "step": 11219 }, { "epoch": 2.28, "learning_rate": 0.00017279575545545286, "loss": 0.0069, "step": 11220 }, { "epoch": 2.28, "learning_rate": 0.00017277659506171296, "loss": 0.0022, "step": 11221 }, { "epoch": 2.29, "learning_rate": 0.00017275743428756083, "loss": 0.01, "step": 11222 }, { "epoch": 2.29, "learning_rate": 0.00017273827313331664, "loss": 0.0095, "step": 11223 }, { "epoch": 2.29, "learning_rate": 0.00017271911159930036, "loss": 0.0259, "step": 11224 }, { "epoch": 2.29, "learning_rate": 0.00017269994968583202, "loss": 0.0072, "step": 11225 }, { "epoch": 2.29, "learning_rate": 0.00017268078739323168, "loss": 0.0019, "step": 11226 }, { "epoch": 2.29, "learning_rate": 0.00017266162472181934, "loss": 0.0037, "step": 11227 }, { "epoch": 2.29, "learning_rate": 0.00017264246167191514, "loss": 0.0183, "step": 11228 }, { "epoch": 2.29, "learning_rate": 0.00017262329824383903, "loss": 0.0042, "step": 11229 }, { "epoch": 2.29, "learning_rate": 0.0001726041344379112, "loss": 0.0171, "step": 11230 }, { "epoch": 2.29, "learning_rate": 0.00017258497025445164, "loss": 0.0194, "step": 11231 }, { "epoch": 2.29, "learning_rate": 0.00017256580569378045, "loss": 0.0086, "step": 11232 }, { "epoch": 2.29, "learning_rate": 0.00017254664075621768, "loss": 0.0055, "step": 11233 }, { "epoch": 2.29, "learning_rate": 0.00017252747544208347, "loss": 0.0058, "step": 11234 }, { "epoch": 2.29, "learning_rate": 0.00017250830975169788, "loss": 0.0077, "step": 11235 }, { "epoch": 2.29, "learning_rate": 0.00017248914368538107, "loss": 0.0162, "step": 11236 }, { "epoch": 2.29, "learning_rate": 0.00017246997724345306, "loss": 0.0055, "step": 11237 }, { "epoch": 2.29, "learning_rate": 0.00017245081042623403, "loss": 0.0124, "step": 11238 }, { "epoch": 2.29, "learning_rate": 0.0001724316432340441, "loss": 0.0048, "step": 11239 }, { "epoch": 2.29, "learning_rate": 0.0001724124756672034, "loss": 0.0095, "step": 11240 }, { "epoch": 2.29, "learning_rate": 0.00017239330772603204, "loss": 0.0052, "step": 11241 }, { "epoch": 2.29, "learning_rate": 0.00017237413941085015, "loss": 0.0116, "step": 11242 }, { "epoch": 2.29, "learning_rate": 0.0001723549707219779, "loss": 0.0048, "step": 11243 }, { "epoch": 2.29, "learning_rate": 0.00017233580165973542, "loss": 0.0026, "step": 11244 }, { "epoch": 2.29, "learning_rate": 0.00017231663222444296, "loss": 0.0159, "step": 11245 }, { "epoch": 2.29, "learning_rate": 0.00017229746241642052, "loss": 0.0044, "step": 11246 }, { "epoch": 2.29, "learning_rate": 0.0001722782922359884, "loss": 0.012, "step": 11247 }, { "epoch": 2.29, "learning_rate": 0.0001722591216834668, "loss": 0.0047, "step": 11248 }, { "epoch": 2.29, "learning_rate": 0.00017223995075917584, "loss": 0.0059, "step": 11249 }, { "epoch": 2.29, "learning_rate": 0.0001722207794634357, "loss": 0.0101, "step": 11250 }, { "epoch": 2.29, "learning_rate": 0.00017220160779656658, "loss": 0.0139, "step": 11251 }, { "epoch": 2.29, "learning_rate": 0.00017218243575888872, "loss": 0.0038, "step": 11252 }, { "epoch": 2.29, "learning_rate": 0.00017216326335072233, "loss": 0.0174, "step": 11253 }, { "epoch": 2.29, "learning_rate": 0.00017214409057238764, "loss": 0.0028, "step": 11254 }, { "epoch": 2.29, "learning_rate": 0.00017212491742420475, "loss": 0.0084, "step": 11255 }, { "epoch": 2.29, "learning_rate": 0.00017210574390649403, "loss": 0.0099, "step": 11256 }, { "epoch": 2.29, "learning_rate": 0.0001720865700195756, "loss": 0.0332, "step": 11257 }, { "epoch": 2.29, "learning_rate": 0.00017206739576376982, "loss": 0.0085, "step": 11258 }, { "epoch": 2.29, "learning_rate": 0.00017204822113939684, "loss": 0.0116, "step": 11259 }, { "epoch": 2.29, "learning_rate": 0.00017202904614677694, "loss": 0.0041, "step": 11260 }, { "epoch": 2.29, "learning_rate": 0.0001720098707862304, "loss": 0.0079, "step": 11261 }, { "epoch": 2.29, "learning_rate": 0.00017199069505807748, "loss": 0.0097, "step": 11262 }, { "epoch": 2.29, "learning_rate": 0.0001719715189626385, "loss": 0.003, "step": 11263 }, { "epoch": 2.29, "learning_rate": 0.00017195234250023361, "loss": 0.0025, "step": 11264 }, { "epoch": 2.29, "learning_rate": 0.00017193316567118316, "loss": 0.0054, "step": 11265 }, { "epoch": 2.29, "learning_rate": 0.00017191398847580746, "loss": 0.0021, "step": 11266 }, { "epoch": 2.29, "learning_rate": 0.00017189481091442677, "loss": 0.0123, "step": 11267 }, { "epoch": 2.29, "learning_rate": 0.00017187563298736144, "loss": 0.0083, "step": 11268 }, { "epoch": 2.29, "learning_rate": 0.00017185645469493168, "loss": 0.0153, "step": 11269 }, { "epoch": 2.29, "learning_rate": 0.0001718372760374579, "loss": 0.0043, "step": 11270 }, { "epoch": 2.29, "learning_rate": 0.00017181809701526042, "loss": 0.0042, "step": 11271 }, { "epoch": 2.3, "learning_rate": 0.00017179891762865955, "loss": 0.0092, "step": 11272 }, { "epoch": 2.3, "learning_rate": 0.0001717797378779756, "loss": 0.0178, "step": 11273 }, { "epoch": 2.3, "learning_rate": 0.00017176055776352888, "loss": 0.0011, "step": 11274 }, { "epoch": 2.3, "learning_rate": 0.0001717413772856398, "loss": 0.0084, "step": 11275 }, { "epoch": 2.3, "learning_rate": 0.00017172219644462862, "loss": 0.0056, "step": 11276 }, { "epoch": 2.3, "learning_rate": 0.00017170301524081582, "loss": 0.0109, "step": 11277 }, { "epoch": 2.3, "learning_rate": 0.00017168383367452167, "loss": 0.0059, "step": 11278 }, { "epoch": 2.3, "learning_rate": 0.00017166465174606654, "loss": 0.0089, "step": 11279 }, { "epoch": 2.3, "learning_rate": 0.0001716454694557709, "loss": 0.0524, "step": 11280 }, { "epoch": 2.3, "learning_rate": 0.000171626286803955, "loss": 0.0093, "step": 11281 }, { "epoch": 2.3, "learning_rate": 0.00017160710379093933, "loss": 0.0055, "step": 11282 }, { "epoch": 2.3, "learning_rate": 0.00017158792041704424, "loss": 0.0014, "step": 11283 }, { "epoch": 2.3, "learning_rate": 0.0001715687366825901, "loss": 0.0131, "step": 11284 }, { "epoch": 2.3, "learning_rate": 0.00017154955258789735, "loss": 0.0024, "step": 11285 }, { "epoch": 2.3, "learning_rate": 0.00017153036813328642, "loss": 0.0046, "step": 11286 }, { "epoch": 2.3, "learning_rate": 0.00017151118331907767, "loss": 0.0088, "step": 11287 }, { "epoch": 2.3, "learning_rate": 0.00017149199814559153, "loss": 0.0157, "step": 11288 }, { "epoch": 2.3, "learning_rate": 0.0001714728126131485, "loss": 0.0037, "step": 11289 }, { "epoch": 2.3, "learning_rate": 0.00017145362672206895, "loss": 0.0065, "step": 11290 }, { "epoch": 2.3, "learning_rate": 0.00017143444047267335, "loss": 0.0203, "step": 11291 }, { "epoch": 2.3, "learning_rate": 0.00017141525386528213, "loss": 0.0148, "step": 11292 }, { "epoch": 2.3, "learning_rate": 0.00017139606690021574, "loss": 0.0052, "step": 11293 }, { "epoch": 2.3, "learning_rate": 0.00017137687957779463, "loss": 0.0099, "step": 11294 }, { "epoch": 2.3, "learning_rate": 0.00017135769189833934, "loss": 0.0128, "step": 11295 }, { "epoch": 2.3, "learning_rate": 0.0001713385038621702, "loss": 0.0027, "step": 11296 }, { "epoch": 2.3, "learning_rate": 0.0001713193154696078, "loss": 0.0187, "step": 11297 }, { "epoch": 2.3, "learning_rate": 0.0001713001267209726, "loss": 0.0022, "step": 11298 }, { "epoch": 2.3, "learning_rate": 0.000171280937616585, "loss": 0.0076, "step": 11299 }, { "epoch": 2.3, "learning_rate": 0.00017126174815676568, "loss": 0.0109, "step": 11300 }, { "epoch": 2.3, "learning_rate": 0.00017124255834183498, "loss": 0.0136, "step": 11301 }, { "epoch": 2.3, "learning_rate": 0.00017122336817211345, "loss": 0.0067, "step": 11302 }, { "epoch": 2.3, "learning_rate": 0.00017120417764792165, "loss": 0.0126, "step": 11303 }, { "epoch": 2.3, "learning_rate": 0.00017118498676958003, "loss": 0.003, "step": 11304 }, { "epoch": 2.3, "learning_rate": 0.00017116579553740917, "loss": 0.0041, "step": 11305 }, { "epoch": 2.3, "learning_rate": 0.00017114660395172953, "loss": 0.0116, "step": 11306 }, { "epoch": 2.3, "learning_rate": 0.0001711274120128617, "loss": 0.0085, "step": 11307 }, { "epoch": 2.3, "learning_rate": 0.0001711082197211262, "loss": 0.0036, "step": 11308 }, { "epoch": 2.3, "learning_rate": 0.0001710890270768436, "loss": 0.0084, "step": 11309 }, { "epoch": 2.3, "learning_rate": 0.00017106983408033443, "loss": 0.0017, "step": 11310 }, { "epoch": 2.3, "learning_rate": 0.00017105064073191925, "loss": 0.0248, "step": 11311 }, { "epoch": 2.3, "learning_rate": 0.00017103144703191865, "loss": 0.0037, "step": 11312 }, { "epoch": 2.3, "learning_rate": 0.00017101225298065317, "loss": 0.0097, "step": 11313 }, { "epoch": 2.3, "learning_rate": 0.00017099305857844345, "loss": 0.0094, "step": 11314 }, { "epoch": 2.3, "learning_rate": 0.00017097386382561, "loss": 0.0086, "step": 11315 }, { "epoch": 2.3, "learning_rate": 0.00017095466872247344, "loss": 0.002, "step": 11316 }, { "epoch": 2.3, "learning_rate": 0.0001709354732693543, "loss": 0.0192, "step": 11317 }, { "epoch": 2.3, "learning_rate": 0.0001709162774665733, "loss": 0.0153, "step": 11318 }, { "epoch": 2.3, "learning_rate": 0.00017089708131445093, "loss": 0.007, "step": 11319 }, { "epoch": 2.3, "learning_rate": 0.00017087788481330788, "loss": 0.0294, "step": 11320 }, { "epoch": 2.31, "learning_rate": 0.00017085868796346476, "loss": 0.0043, "step": 11321 }, { "epoch": 2.31, "learning_rate": 0.00017083949076524216, "loss": 0.0064, "step": 11322 }, { "epoch": 2.31, "learning_rate": 0.00017082029321896077, "loss": 0.0106, "step": 11323 }, { "epoch": 2.31, "learning_rate": 0.00017080109532494113, "loss": 0.0063, "step": 11324 }, { "epoch": 2.31, "learning_rate": 0.00017078189708350397, "loss": 0.0081, "step": 11325 }, { "epoch": 2.31, "learning_rate": 0.00017076269849496987, "loss": 0.0057, "step": 11326 }, { "epoch": 2.31, "learning_rate": 0.00017074349955965954, "loss": 0.0087, "step": 11327 }, { "epoch": 2.31, "learning_rate": 0.00017072430027789362, "loss": 0.0119, "step": 11328 }, { "epoch": 2.31, "learning_rate": 0.0001707051006499927, "loss": 0.0073, "step": 11329 }, { "epoch": 2.31, "learning_rate": 0.00017068590067627757, "loss": 0.0107, "step": 11330 }, { "epoch": 2.31, "learning_rate": 0.00017066670035706882, "loss": 0.02, "step": 11331 }, { "epoch": 2.31, "learning_rate": 0.00017064749969268722, "loss": 0.0142, "step": 11332 }, { "epoch": 2.31, "learning_rate": 0.00017062829868345333, "loss": 0.0017, "step": 11333 }, { "epoch": 2.31, "learning_rate": 0.00017060909732968796, "loss": 0.0061, "step": 11334 }, { "epoch": 2.31, "learning_rate": 0.00017058989563171174, "loss": 0.0102, "step": 11335 }, { "epoch": 2.31, "learning_rate": 0.0001705706935898454, "loss": 0.0012, "step": 11336 }, { "epoch": 2.31, "learning_rate": 0.00017055149120440968, "loss": 0.0071, "step": 11337 }, { "epoch": 2.31, "learning_rate": 0.00017053228847572525, "loss": 0.0191, "step": 11338 }, { "epoch": 2.31, "learning_rate": 0.0001705130854041128, "loss": 0.0179, "step": 11339 }, { "epoch": 2.31, "learning_rate": 0.00017049388198989314, "loss": 0.0223, "step": 11340 }, { "epoch": 2.31, "learning_rate": 0.0001704746782333869, "loss": 0.0092, "step": 11341 }, { "epoch": 2.31, "learning_rate": 0.000170455474134915, "loss": 0.0038, "step": 11342 }, { "epoch": 2.31, "learning_rate": 0.000170436269694798, "loss": 0.0073, "step": 11343 }, { "epoch": 2.31, "learning_rate": 0.00017041706491335672, "loss": 0.0089, "step": 11344 }, { "epoch": 2.31, "learning_rate": 0.00017039785979091192, "loss": 0.0109, "step": 11345 }, { "epoch": 2.31, "learning_rate": 0.00017037865432778442, "loss": 0.009, "step": 11346 }, { "epoch": 2.31, "learning_rate": 0.00017035944852429483, "loss": 0.0219, "step": 11347 }, { "epoch": 2.31, "learning_rate": 0.00017034024238076406, "loss": 0.0097, "step": 11348 }, { "epoch": 2.31, "learning_rate": 0.00017032103589751285, "loss": 0.0124, "step": 11349 }, { "epoch": 2.31, "learning_rate": 0.000170301829074862, "loss": 0.0066, "step": 11350 }, { "epoch": 2.31, "learning_rate": 0.00017028262191313222, "loss": 0.0123, "step": 11351 }, { "epoch": 2.31, "learning_rate": 0.0001702634144126444, "loss": 0.0114, "step": 11352 }, { "epoch": 2.31, "learning_rate": 0.00017024420657371934, "loss": 0.0086, "step": 11353 }, { "epoch": 2.31, "learning_rate": 0.0001702249983966778, "loss": 0.0078, "step": 11354 }, { "epoch": 2.31, "learning_rate": 0.00017020578988184059, "loss": 0.0079, "step": 11355 }, { "epoch": 2.31, "learning_rate": 0.0001701865810295286, "loss": 0.0073, "step": 11356 }, { "epoch": 2.31, "learning_rate": 0.00017016737184006255, "loss": 0.0113, "step": 11357 }, { "epoch": 2.31, "learning_rate": 0.00017014816231376333, "loss": 0.0035, "step": 11358 }, { "epoch": 2.31, "learning_rate": 0.00017012895245095176, "loss": 0.0038, "step": 11359 }, { "epoch": 2.31, "learning_rate": 0.0001701097422519487, "loss": 0.0068, "step": 11360 }, { "epoch": 2.31, "learning_rate": 0.00017009053171707498, "loss": 0.0048, "step": 11361 }, { "epoch": 2.31, "learning_rate": 0.00017007132084665146, "loss": 0.021, "step": 11362 }, { "epoch": 2.31, "learning_rate": 0.000170052109640999, "loss": 0.0068, "step": 11363 }, { "epoch": 2.31, "learning_rate": 0.00017003289810043845, "loss": 0.0063, "step": 11364 }, { "epoch": 2.31, "learning_rate": 0.0001700136862252907, "loss": 0.0048, "step": 11365 }, { "epoch": 2.31, "learning_rate": 0.0001699944740158766, "loss": 0.006, "step": 11366 }, { "epoch": 2.31, "learning_rate": 0.00016997526147251706, "loss": 0.0126, "step": 11367 }, { "epoch": 2.31, "learning_rate": 0.00016995604859553292, "loss": 0.0077, "step": 11368 }, { "epoch": 2.31, "learning_rate": 0.00016993683538524514, "loss": 0.0049, "step": 11369 }, { "epoch": 2.32, "learning_rate": 0.00016991762184197454, "loss": 0.0158, "step": 11370 }, { "epoch": 2.32, "learning_rate": 0.00016989840796604203, "loss": 0.0008, "step": 11371 }, { "epoch": 2.32, "learning_rate": 0.00016987919375776854, "loss": 0.0094, "step": 11372 }, { "epoch": 2.32, "learning_rate": 0.00016985997921747505, "loss": 0.0121, "step": 11373 }, { "epoch": 2.32, "learning_rate": 0.00016984076434548243, "loss": 0.0022, "step": 11374 }, { "epoch": 2.32, "learning_rate": 0.00016982154914211157, "loss": 0.0046, "step": 11375 }, { "epoch": 2.32, "learning_rate": 0.0001698023336076834, "loss": 0.0187, "step": 11376 }, { "epoch": 2.32, "learning_rate": 0.0001697831177425189, "loss": 0.0107, "step": 11377 }, { "epoch": 2.32, "learning_rate": 0.00016976390154693896, "loss": 0.0077, "step": 11378 }, { "epoch": 2.32, "learning_rate": 0.0001697446850212646, "loss": 0.0198, "step": 11379 }, { "epoch": 2.32, "learning_rate": 0.00016972546816581673, "loss": 0.0016, "step": 11380 }, { "epoch": 2.32, "learning_rate": 0.00016970625098091627, "loss": 0.0029, "step": 11381 }, { "epoch": 2.32, "learning_rate": 0.00016968703346688423, "loss": 0.0008, "step": 11382 }, { "epoch": 2.32, "learning_rate": 0.0001696678156240416, "loss": 0.0082, "step": 11383 }, { "epoch": 2.32, "learning_rate": 0.00016964859745270927, "loss": 0.0173, "step": 11384 }, { "epoch": 2.32, "learning_rate": 0.00016962937895320833, "loss": 0.0079, "step": 11385 }, { "epoch": 2.32, "learning_rate": 0.00016961016012585967, "loss": 0.0029, "step": 11386 }, { "epoch": 2.32, "learning_rate": 0.00016959094097098433, "loss": 0.0024, "step": 11387 }, { "epoch": 2.32, "learning_rate": 0.00016957172148890332, "loss": 0.0093, "step": 11388 }, { "epoch": 2.32, "learning_rate": 0.00016955250167993762, "loss": 0.0099, "step": 11389 }, { "epoch": 2.32, "learning_rate": 0.00016953328154440818, "loss": 0.003, "step": 11390 }, { "epoch": 2.32, "learning_rate": 0.00016951406108263608, "loss": 0.0063, "step": 11391 }, { "epoch": 2.32, "learning_rate": 0.00016949484029494237, "loss": 0.0055, "step": 11392 }, { "epoch": 2.32, "learning_rate": 0.00016947561918164797, "loss": 0.0029, "step": 11393 }, { "epoch": 2.32, "learning_rate": 0.000169456397743074, "loss": 0.0059, "step": 11394 }, { "epoch": 2.32, "learning_rate": 0.00016943717597954142, "loss": 0.0127, "step": 11395 }, { "epoch": 2.32, "learning_rate": 0.00016941795389137135, "loss": 0.0211, "step": 11396 }, { "epoch": 2.32, "learning_rate": 0.00016939873147888484, "loss": 0.0346, "step": 11397 }, { "epoch": 2.32, "learning_rate": 0.00016937950874240285, "loss": 0.01, "step": 11398 }, { "epoch": 2.32, "learning_rate": 0.0001693602856822465, "loss": 0.0025, "step": 11399 }, { "epoch": 2.32, "learning_rate": 0.00016934106229873677, "loss": 0.0052, "step": 11400 }, { "epoch": 2.32, "learning_rate": 0.00016932183859219484, "loss": 0.0026, "step": 11401 }, { "epoch": 2.32, "learning_rate": 0.00016930261456294174, "loss": 0.0023, "step": 11402 }, { "epoch": 2.32, "learning_rate": 0.00016928339021129852, "loss": 0.0053, "step": 11403 }, { "epoch": 2.32, "learning_rate": 0.00016926416553758627, "loss": 0.0115, "step": 11404 }, { "epoch": 2.32, "learning_rate": 0.0001692449405421261, "loss": 0.0024, "step": 11405 }, { "epoch": 2.32, "learning_rate": 0.00016922571522523918, "loss": 0.004, "step": 11406 }, { "epoch": 2.32, "learning_rate": 0.00016920648958724643, "loss": 0.0147, "step": 11407 }, { "epoch": 2.32, "learning_rate": 0.00016918726362846908, "loss": 0.0118, "step": 11408 }, { "epoch": 2.32, "learning_rate": 0.0001691680373492282, "loss": 0.0043, "step": 11409 }, { "epoch": 2.32, "learning_rate": 0.00016914881074984488, "loss": 0.0107, "step": 11410 }, { "epoch": 2.32, "learning_rate": 0.00016912958383064037, "loss": 0.0056, "step": 11411 }, { "epoch": 2.32, "learning_rate": 0.0001691103565919356, "loss": 0.007, "step": 11412 }, { "epoch": 2.32, "learning_rate": 0.00016909112903405182, "loss": 0.0211, "step": 11413 }, { "epoch": 2.32, "learning_rate": 0.0001690719011573102, "loss": 0.0081, "step": 11414 }, { "epoch": 2.32, "learning_rate": 0.0001690526729620318, "loss": 0.0038, "step": 11415 }, { "epoch": 2.32, "learning_rate": 0.0001690334444485378, "loss": 0.0134, "step": 11416 }, { "epoch": 2.32, "learning_rate": 0.00016901421561714934, "loss": 0.0103, "step": 11417 }, { "epoch": 2.32, "learning_rate": 0.0001689949864681876, "loss": 0.0043, "step": 11418 }, { "epoch": 2.33, "learning_rate": 0.00016897575700197372, "loss": 0.0065, "step": 11419 }, { "epoch": 2.33, "learning_rate": 0.00016895652721882892, "loss": 0.0153, "step": 11420 }, { "epoch": 2.33, "learning_rate": 0.0001689372971190743, "loss": 0.0146, "step": 11421 }, { "epoch": 2.33, "learning_rate": 0.00016891806670303106, "loss": 0.0072, "step": 11422 }, { "epoch": 2.33, "learning_rate": 0.0001688988359710204, "loss": 0.0081, "step": 11423 }, { "epoch": 2.33, "learning_rate": 0.00016887960492336347, "loss": 0.028, "step": 11424 }, { "epoch": 2.33, "learning_rate": 0.00016886037356038155, "loss": 0.0276, "step": 11425 }, { "epoch": 2.33, "learning_rate": 0.0001688411418823958, "loss": 0.0035, "step": 11426 }, { "epoch": 2.33, "learning_rate": 0.00016882190988972738, "loss": 0.0179, "step": 11427 }, { "epoch": 2.33, "learning_rate": 0.00016880267758269754, "loss": 0.0147, "step": 11428 }, { "epoch": 2.33, "learning_rate": 0.0001687834449616275, "loss": 0.0057, "step": 11429 }, { "epoch": 2.33, "learning_rate": 0.00016876421202683854, "loss": 0.0022, "step": 11430 }, { "epoch": 2.33, "learning_rate": 0.00016874497877865174, "loss": 0.001, "step": 11431 }, { "epoch": 2.33, "learning_rate": 0.00016872574521738842, "loss": 0.005, "step": 11432 }, { "epoch": 2.33, "learning_rate": 0.00016870651134336982, "loss": 0.0024, "step": 11433 }, { "epoch": 2.33, "learning_rate": 0.00016868727715691712, "loss": 0.0206, "step": 11434 }, { "epoch": 2.33, "learning_rate": 0.00016866804265835167, "loss": 0.0072, "step": 11435 }, { "epoch": 2.33, "learning_rate": 0.00016864880784799464, "loss": 0.0039, "step": 11436 }, { "epoch": 2.33, "learning_rate": 0.00016862957272616736, "loss": 0.0091, "step": 11437 }, { "epoch": 2.33, "learning_rate": 0.00016861033729319102, "loss": 0.0055, "step": 11438 }, { "epoch": 2.33, "learning_rate": 0.00016859110154938695, "loss": 0.0046, "step": 11439 }, { "epoch": 2.33, "learning_rate": 0.00016857186549507636, "loss": 0.0064, "step": 11440 }, { "epoch": 2.33, "learning_rate": 0.00016855262913058054, "loss": 0.0025, "step": 11441 }, { "epoch": 2.33, "learning_rate": 0.00016853339245622082, "loss": 0.0074, "step": 11442 }, { "epoch": 2.33, "learning_rate": 0.00016851415547231846, "loss": 0.0166, "step": 11443 }, { "epoch": 2.33, "learning_rate": 0.00016849491817919475, "loss": 0.0128, "step": 11444 }, { "epoch": 2.33, "learning_rate": 0.000168475680577171, "loss": 0.0193, "step": 11445 }, { "epoch": 2.33, "learning_rate": 0.00016845644266656848, "loss": 0.0057, "step": 11446 }, { "epoch": 2.33, "learning_rate": 0.00016843720444770856, "loss": 0.02, "step": 11447 }, { "epoch": 2.33, "learning_rate": 0.00016841796592091256, "loss": 0.0162, "step": 11448 }, { "epoch": 2.33, "learning_rate": 0.0001683987270865017, "loss": 0.0029, "step": 11449 }, { "epoch": 2.33, "learning_rate": 0.00016837948794479738, "loss": 0.0225, "step": 11450 }, { "epoch": 2.33, "learning_rate": 0.00016836024849612095, "loss": 0.0051, "step": 11451 }, { "epoch": 2.33, "learning_rate": 0.00016834100874079367, "loss": 0.0066, "step": 11452 }, { "epoch": 2.33, "learning_rate": 0.00016832176867913697, "loss": 0.0073, "step": 11453 }, { "epoch": 2.33, "learning_rate": 0.00016830252831147207, "loss": 0.003, "step": 11454 }, { "epoch": 2.33, "learning_rate": 0.00016828328763812044, "loss": 0.0358, "step": 11455 }, { "epoch": 2.33, "learning_rate": 0.00016826404665940342, "loss": 0.0106, "step": 11456 }, { "epoch": 2.33, "learning_rate": 0.00016824480537564235, "loss": 0.0098, "step": 11457 }, { "epoch": 2.33, "learning_rate": 0.00016822556378715857, "loss": 0.0094, "step": 11458 }, { "epoch": 2.33, "learning_rate": 0.00016820632189427345, "loss": 0.0079, "step": 11459 }, { "epoch": 2.33, "learning_rate": 0.0001681870796973084, "loss": 0.0106, "step": 11460 }, { "epoch": 2.33, "learning_rate": 0.0001681678371965848, "loss": 0.0059, "step": 11461 }, { "epoch": 2.33, "learning_rate": 0.00016814859439242405, "loss": 0.0012, "step": 11462 }, { "epoch": 2.33, "learning_rate": 0.00016812935128514747, "loss": 0.0059, "step": 11463 }, { "epoch": 2.33, "learning_rate": 0.00016811010787507656, "loss": 0.001, "step": 11464 }, { "epoch": 2.33, "learning_rate": 0.00016809086416253255, "loss": 0.0141, "step": 11465 }, { "epoch": 2.33, "learning_rate": 0.00016807162014783705, "loss": 0.009, "step": 11466 }, { "epoch": 2.33, "learning_rate": 0.00016805237583131138, "loss": 0.0047, "step": 11467 }, { "epoch": 2.34, "learning_rate": 0.00016803313121327697, "loss": 0.0244, "step": 11468 }, { "epoch": 2.34, "learning_rate": 0.00016801388629405516, "loss": 0.0022, "step": 11469 }, { "epoch": 2.34, "learning_rate": 0.00016799464107396752, "loss": 0.0093, "step": 11470 }, { "epoch": 2.34, "learning_rate": 0.0001679753955533354, "loss": 0.0004, "step": 11471 }, { "epoch": 2.34, "learning_rate": 0.0001679561497324802, "loss": 0.0061, "step": 11472 }, { "epoch": 2.34, "learning_rate": 0.00016793690361172338, "loss": 0.0227, "step": 11473 }, { "epoch": 2.34, "learning_rate": 0.00016791765719138647, "loss": 0.0255, "step": 11474 }, { "epoch": 2.34, "learning_rate": 0.00016789841047179082, "loss": 0.0017, "step": 11475 }, { "epoch": 2.34, "learning_rate": 0.00016787916345325796, "loss": 0.0054, "step": 11476 }, { "epoch": 2.34, "learning_rate": 0.00016785991613610932, "loss": 0.017, "step": 11477 }, { "epoch": 2.34, "learning_rate": 0.00016784066852066633, "loss": 0.0056, "step": 11478 }, { "epoch": 2.34, "learning_rate": 0.00016782142060725054, "loss": 0.0083, "step": 11479 }, { "epoch": 2.34, "learning_rate": 0.0001678021723961834, "loss": 0.0132, "step": 11480 }, { "epoch": 2.34, "learning_rate": 0.00016778292388778634, "loss": 0.0026, "step": 11481 }, { "epoch": 2.34, "learning_rate": 0.00016776367508238092, "loss": 0.0032, "step": 11482 }, { "epoch": 2.34, "learning_rate": 0.00016774442598028856, "loss": 0.0073, "step": 11483 }, { "epoch": 2.34, "learning_rate": 0.00016772517658183078, "loss": 0.0019, "step": 11484 }, { "epoch": 2.34, "learning_rate": 0.00016770592688732913, "loss": 0.0038, "step": 11485 }, { "epoch": 2.34, "learning_rate": 0.00016768667689710505, "loss": 0.0087, "step": 11486 }, { "epoch": 2.34, "learning_rate": 0.0001676674266114801, "loss": 0.0253, "step": 11487 }, { "epoch": 2.34, "learning_rate": 0.00016764817603077576, "loss": 0.0065, "step": 11488 }, { "epoch": 2.34, "learning_rate": 0.0001676289251553136, "loss": 0.0125, "step": 11489 }, { "epoch": 2.34, "learning_rate": 0.00016760967398541507, "loss": 0.0042, "step": 11490 }, { "epoch": 2.34, "learning_rate": 0.00016759042252140178, "loss": 0.0043, "step": 11491 }, { "epoch": 2.34, "learning_rate": 0.00016757117076359523, "loss": 0.0055, "step": 11492 }, { "epoch": 2.34, "learning_rate": 0.0001675519187123169, "loss": 0.0108, "step": 11493 }, { "epoch": 2.34, "learning_rate": 0.0001675326663678885, "loss": 0.0039, "step": 11494 }, { "epoch": 2.34, "learning_rate": 0.00016751341373063137, "loss": 0.0031, "step": 11495 }, { "epoch": 2.34, "learning_rate": 0.00016749416080086722, "loss": 0.023, "step": 11496 }, { "epoch": 2.34, "learning_rate": 0.00016747490757891754, "loss": 0.007, "step": 11497 }, { "epoch": 2.34, "learning_rate": 0.00016745565406510395, "loss": 0.0052, "step": 11498 }, { "epoch": 2.34, "learning_rate": 0.00016743640025974798, "loss": 0.0169, "step": 11499 }, { "epoch": 2.34, "learning_rate": 0.00016741714616317122, "loss": 0.0044, "step": 11500 }, { "epoch": 2.34, "learning_rate": 0.0001673978917756952, "loss": 0.0073, "step": 11501 }, { "epoch": 2.34, "learning_rate": 0.0001673786370976416, "loss": 0.0042, "step": 11502 }, { "epoch": 2.34, "learning_rate": 0.0001673593821293319, "loss": 0.0095, "step": 11503 }, { "epoch": 2.34, "learning_rate": 0.0001673401268710878, "loss": 0.005, "step": 11504 }, { "epoch": 2.34, "learning_rate": 0.00016732087132323084, "loss": 0.0097, "step": 11505 }, { "epoch": 2.34, "learning_rate": 0.0001673016154860826, "loss": 0.0153, "step": 11506 }, { "epoch": 2.34, "learning_rate": 0.00016728235935996473, "loss": 0.0134, "step": 11507 }, { "epoch": 2.34, "learning_rate": 0.0001672631029451989, "loss": 0.012, "step": 11508 }, { "epoch": 2.34, "learning_rate": 0.0001672438462421066, "loss": 0.0164, "step": 11509 }, { "epoch": 2.34, "learning_rate": 0.00016722458925100953, "loss": 0.0052, "step": 11510 }, { "epoch": 2.34, "learning_rate": 0.0001672053319722293, "loss": 0.0048, "step": 11511 }, { "epoch": 2.34, "learning_rate": 0.00016718607440608757, "loss": 0.0115, "step": 11512 }, { "epoch": 2.34, "learning_rate": 0.00016716681655290597, "loss": 0.006, "step": 11513 }, { "epoch": 2.34, "learning_rate": 0.00016714755841300608, "loss": 0.0094, "step": 11514 }, { "epoch": 2.34, "learning_rate": 0.00016712829998670963, "loss": 0.007, "step": 11515 }, { "epoch": 2.34, "learning_rate": 0.0001671090412743382, "loss": 0.0171, "step": 11516 }, { "epoch": 2.35, "learning_rate": 0.00016708978227621355, "loss": 0.0146, "step": 11517 }, { "epoch": 2.35, "learning_rate": 0.00016707052299265722, "loss": 0.0103, "step": 11518 }, { "epoch": 2.35, "learning_rate": 0.00016705126342399094, "loss": 0.0044, "step": 11519 }, { "epoch": 2.35, "learning_rate": 0.0001670320035705364, "loss": 0.0164, "step": 11520 }, { "epoch": 2.35, "learning_rate": 0.00016701274343261524, "loss": 0.0123, "step": 11521 }, { "epoch": 2.35, "learning_rate": 0.00016699348301054916, "loss": 0.0143, "step": 11522 }, { "epoch": 2.35, "learning_rate": 0.00016697422230465983, "loss": 0.0213, "step": 11523 }, { "epoch": 2.35, "learning_rate": 0.00016695496131526893, "loss": 0.0056, "step": 11524 }, { "epoch": 2.35, "learning_rate": 0.00016693570004269815, "loss": 0.0108, "step": 11525 }, { "epoch": 2.35, "learning_rate": 0.00016691643848726925, "loss": 0.0031, "step": 11526 }, { "epoch": 2.35, "learning_rate": 0.00016689717664930388, "loss": 0.013, "step": 11527 }, { "epoch": 2.35, "learning_rate": 0.0001668779145291238, "loss": 0.0161, "step": 11528 }, { "epoch": 2.35, "learning_rate": 0.00016685865212705064, "loss": 0.0252, "step": 11529 }, { "epoch": 2.35, "learning_rate": 0.0001668393894434062, "loss": 0.0064, "step": 11530 }, { "epoch": 2.35, "learning_rate": 0.00016682012647851216, "loss": 0.0192, "step": 11531 }, { "epoch": 2.35, "learning_rate": 0.00016680086323269026, "loss": 0.001, "step": 11532 }, { "epoch": 2.35, "learning_rate": 0.00016678159970626223, "loss": 0.0025, "step": 11533 }, { "epoch": 2.35, "learning_rate": 0.00016676233589954978, "loss": 0.0081, "step": 11534 }, { "epoch": 2.35, "learning_rate": 0.0001667430718128747, "loss": 0.0199, "step": 11535 }, { "epoch": 2.35, "learning_rate": 0.00016672380744655875, "loss": 0.003, "step": 11536 }, { "epoch": 2.35, "learning_rate": 0.0001667045428009236, "loss": 0.0019, "step": 11537 }, { "epoch": 2.35, "learning_rate": 0.00016668527787629106, "loss": 0.0078, "step": 11538 }, { "epoch": 2.35, "learning_rate": 0.00016666601267298285, "loss": 0.0121, "step": 11539 }, { "epoch": 2.35, "learning_rate": 0.00016664674719132084, "loss": 0.012, "step": 11540 }, { "epoch": 2.35, "learning_rate": 0.0001666274814316267, "loss": 0.008, "step": 11541 }, { "epoch": 2.35, "learning_rate": 0.00016660821539422223, "loss": 0.009, "step": 11542 }, { "epoch": 2.35, "learning_rate": 0.00016658894907942923, "loss": 0.0144, "step": 11543 }, { "epoch": 2.35, "learning_rate": 0.00016656968248756945, "loss": 0.004, "step": 11544 }, { "epoch": 2.35, "learning_rate": 0.0001665504156189647, "loss": 0.0049, "step": 11545 }, { "epoch": 2.35, "learning_rate": 0.0001665311484739368, "loss": 0.0063, "step": 11546 }, { "epoch": 2.35, "learning_rate": 0.00016651188105280744, "loss": 0.0201, "step": 11547 }, { "epoch": 2.35, "learning_rate": 0.00016649261335589856, "loss": 0.0117, "step": 11548 }, { "epoch": 2.35, "learning_rate": 0.00016647334538353182, "loss": 0.0036, "step": 11549 }, { "epoch": 2.35, "learning_rate": 0.00016645407713602924, "loss": 0.0202, "step": 11550 }, { "epoch": 2.35, "learning_rate": 0.00016643480861371242, "loss": 0.0052, "step": 11551 }, { "epoch": 2.35, "learning_rate": 0.0001664155398169033, "loss": 0.0083, "step": 11552 }, { "epoch": 2.35, "learning_rate": 0.0001663962707459237, "loss": 0.0022, "step": 11553 }, { "epoch": 2.35, "learning_rate": 0.00016637700140109544, "loss": 0.0083, "step": 11554 }, { "epoch": 2.35, "learning_rate": 0.0001663577317827403, "loss": 0.002, "step": 11555 }, { "epoch": 2.35, "learning_rate": 0.00016633846189118018, "loss": 0.011, "step": 11556 }, { "epoch": 2.35, "learning_rate": 0.0001663191917267369, "loss": 0.0084, "step": 11557 }, { "epoch": 2.35, "learning_rate": 0.00016629992128973232, "loss": 0.0041, "step": 11558 }, { "epoch": 2.35, "learning_rate": 0.00016628065058048829, "loss": 0.0084, "step": 11559 }, { "epoch": 2.35, "learning_rate": 0.00016626137959932665, "loss": 0.0102, "step": 11560 }, { "epoch": 2.35, "learning_rate": 0.00016624210834656925, "loss": 0.011, "step": 11561 }, { "epoch": 2.35, "learning_rate": 0.00016622283682253802, "loss": 0.0064, "step": 11562 }, { "epoch": 2.35, "learning_rate": 0.00016620356502755477, "loss": 0.0096, "step": 11563 }, { "epoch": 2.35, "learning_rate": 0.00016618429296194146, "loss": 0.0065, "step": 11564 }, { "epoch": 2.35, "learning_rate": 0.00016616502062601987, "loss": 0.0034, "step": 11565 }, { "epoch": 2.36, "learning_rate": 0.0001661457480201119, "loss": 0.0195, "step": 11566 }, { "epoch": 2.36, "learning_rate": 0.00016612647514453946, "loss": 0.0026, "step": 11567 }, { "epoch": 2.36, "learning_rate": 0.00016610720199962444, "loss": 0.0148, "step": 11568 }, { "epoch": 2.36, "learning_rate": 0.00016608792858568877, "loss": 0.0044, "step": 11569 }, { "epoch": 2.36, "learning_rate": 0.0001660686549030543, "loss": 0.0071, "step": 11570 }, { "epoch": 2.36, "learning_rate": 0.00016604938095204298, "loss": 0.015, "step": 11571 }, { "epoch": 2.36, "learning_rate": 0.00016603010673297669, "loss": 0.0143, "step": 11572 }, { "epoch": 2.36, "learning_rate": 0.0001660108322461774, "loss": 0.0082, "step": 11573 }, { "epoch": 2.36, "learning_rate": 0.00016599155749196694, "loss": 0.0088, "step": 11574 }, { "epoch": 2.36, "learning_rate": 0.0001659722824706673, "loss": 0.0044, "step": 11575 }, { "epoch": 2.36, "learning_rate": 0.0001659530071826004, "loss": 0.0351, "step": 11576 }, { "epoch": 2.36, "learning_rate": 0.00016593373162808814, "loss": 0.0089, "step": 11577 }, { "epoch": 2.36, "learning_rate": 0.00016591445580745254, "loss": 0.0154, "step": 11578 }, { "epoch": 2.36, "learning_rate": 0.0001658951797210154, "loss": 0.0201, "step": 11579 }, { "epoch": 2.36, "learning_rate": 0.0001658759033690988, "loss": 0.0054, "step": 11580 }, { "epoch": 2.36, "learning_rate": 0.00016585662675202466, "loss": 0.0059, "step": 11581 }, { "epoch": 2.36, "learning_rate": 0.00016583734987011493, "loss": 0.0043, "step": 11582 }, { "epoch": 2.36, "learning_rate": 0.00016581807272369152, "loss": 0.0106, "step": 11583 }, { "epoch": 2.36, "learning_rate": 0.0001657987953130765, "loss": 0.0019, "step": 11584 }, { "epoch": 2.36, "learning_rate": 0.00016577951763859173, "loss": 0.0046, "step": 11585 }, { "epoch": 2.36, "learning_rate": 0.00016576023970055922, "loss": 0.0073, "step": 11586 }, { "epoch": 2.36, "learning_rate": 0.000165740961499301, "loss": 0.0115, "step": 11587 }, { "epoch": 2.36, "learning_rate": 0.00016572168303513897, "loss": 0.0055, "step": 11588 }, { "epoch": 2.36, "learning_rate": 0.00016570240430839516, "loss": 0.0073, "step": 11589 }, { "epoch": 2.36, "learning_rate": 0.00016568312531939155, "loss": 0.0038, "step": 11590 }, { "epoch": 2.36, "learning_rate": 0.00016566384606845017, "loss": 0.0031, "step": 11591 }, { "epoch": 2.36, "learning_rate": 0.000165644566555893, "loss": 0.0211, "step": 11592 }, { "epoch": 2.36, "learning_rate": 0.00016562528678204202, "loss": 0.0132, "step": 11593 }, { "epoch": 2.36, "learning_rate": 0.00016560600674721927, "loss": 0.0061, "step": 11594 }, { "epoch": 2.36, "learning_rate": 0.0001655867264517467, "loss": 0.0038, "step": 11595 }, { "epoch": 2.36, "learning_rate": 0.00016556744589594645, "loss": 0.0043, "step": 11596 }, { "epoch": 2.36, "learning_rate": 0.00016554816508014043, "loss": 0.008, "step": 11597 }, { "epoch": 2.36, "learning_rate": 0.0001655288840046507, "loss": 0.013, "step": 11598 }, { "epoch": 2.36, "learning_rate": 0.0001655096026697993, "loss": 0.0045, "step": 11599 }, { "epoch": 2.36, "learning_rate": 0.00016549032107590823, "loss": 0.0092, "step": 11600 }, { "epoch": 2.36, "learning_rate": 0.0001654710392232996, "loss": 0.0087, "step": 11601 }, { "epoch": 2.36, "learning_rate": 0.0001654517571122954, "loss": 0.0043, "step": 11602 }, { "epoch": 2.36, "learning_rate": 0.00016543247474321766, "loss": 0.0071, "step": 11603 }, { "epoch": 2.36, "learning_rate": 0.0001654131921163885, "loss": 0.0027, "step": 11604 }, { "epoch": 2.36, "learning_rate": 0.00016539390923212997, "loss": 0.0111, "step": 11605 }, { "epoch": 2.36, "learning_rate": 0.000165374626090764, "loss": 0.0054, "step": 11606 }, { "epoch": 2.36, "learning_rate": 0.00016535534269261284, "loss": 0.0091, "step": 11607 }, { "epoch": 2.36, "learning_rate": 0.00016533605903799843, "loss": 0.0137, "step": 11608 }, { "epoch": 2.36, "learning_rate": 0.0001653167751272429, "loss": 0.0136, "step": 11609 }, { "epoch": 2.36, "learning_rate": 0.00016529749096066827, "loss": 0.0104, "step": 11610 }, { "epoch": 2.36, "learning_rate": 0.0001652782065385967, "loss": 0.0067, "step": 11611 }, { "epoch": 2.36, "learning_rate": 0.00016525892186135025, "loss": 0.005, "step": 11612 }, { "epoch": 2.36, "learning_rate": 0.00016523963692925098, "loss": 0.0051, "step": 11613 }, { "epoch": 2.36, "learning_rate": 0.000165220351742621, "loss": 0.0031, "step": 11614 }, { "epoch": 2.37, "learning_rate": 0.00016520106630178247, "loss": 0.0108, "step": 11615 }, { "epoch": 2.37, "learning_rate": 0.0001651817806070574, "loss": 0.0077, "step": 11616 }, { "epoch": 2.37, "learning_rate": 0.00016516249465876794, "loss": 0.0343, "step": 11617 }, { "epoch": 2.37, "learning_rate": 0.0001651432084572362, "loss": 0.0008, "step": 11618 }, { "epoch": 2.37, "learning_rate": 0.00016512392200278433, "loss": 0.0205, "step": 11619 }, { "epoch": 2.37, "learning_rate": 0.00016510463529573432, "loss": 0.0056, "step": 11620 }, { "epoch": 2.37, "learning_rate": 0.00016508534833640845, "loss": 0.0217, "step": 11621 }, { "epoch": 2.37, "learning_rate": 0.00016506606112512876, "loss": 0.006, "step": 11622 }, { "epoch": 2.37, "learning_rate": 0.00016504677366221743, "loss": 0.0119, "step": 11623 }, { "epoch": 2.37, "learning_rate": 0.00016502748594799662, "loss": 0.0011, "step": 11624 }, { "epoch": 2.37, "learning_rate": 0.00016500819798278838, "loss": 0.0099, "step": 11625 }, { "epoch": 2.37, "learning_rate": 0.00016498890976691488, "loss": 0.0169, "step": 11626 }, { "epoch": 2.37, "learning_rate": 0.00016496962130069836, "loss": 0.0129, "step": 11627 }, { "epoch": 2.37, "learning_rate": 0.00016495033258446086, "loss": 0.0013, "step": 11628 }, { "epoch": 2.37, "learning_rate": 0.00016493104361852461, "loss": 0.0143, "step": 11629 }, { "epoch": 2.37, "learning_rate": 0.00016491175440321173, "loss": 0.0073, "step": 11630 }, { "epoch": 2.37, "learning_rate": 0.0001648924649388444, "loss": 0.0097, "step": 11631 }, { "epoch": 2.37, "learning_rate": 0.00016487317522574475, "loss": 0.0107, "step": 11632 }, { "epoch": 2.37, "learning_rate": 0.0001648538852642351, "loss": 0.0036, "step": 11633 }, { "epoch": 2.37, "learning_rate": 0.00016483459505463747, "loss": 0.0124, "step": 11634 }, { "epoch": 2.37, "learning_rate": 0.0001648153045972741, "loss": 0.0068, "step": 11635 }, { "epoch": 2.37, "learning_rate": 0.00016479601389246716, "loss": 0.0052, "step": 11636 }, { "epoch": 2.37, "learning_rate": 0.0001647767229405389, "loss": 0.0055, "step": 11637 }, { "epoch": 2.37, "learning_rate": 0.00016475743174181149, "loss": 0.0054, "step": 11638 }, { "epoch": 2.37, "learning_rate": 0.0001647381402966071, "loss": 0.0082, "step": 11639 }, { "epoch": 2.37, "learning_rate": 0.0001647188486052479, "loss": 0.0039, "step": 11640 }, { "epoch": 2.37, "learning_rate": 0.00016469955666805614, "loss": 0.0104, "step": 11641 }, { "epoch": 2.37, "learning_rate": 0.00016468026448535408, "loss": 0.0102, "step": 11642 }, { "epoch": 2.37, "learning_rate": 0.00016466097205746386, "loss": 0.0141, "step": 11643 }, { "epoch": 2.37, "learning_rate": 0.00016464167938470776, "loss": 0.0107, "step": 11644 }, { "epoch": 2.37, "learning_rate": 0.00016462238646740797, "loss": 0.0028, "step": 11645 }, { "epoch": 2.37, "learning_rate": 0.0001646030933058867, "loss": 0.0154, "step": 11646 }, { "epoch": 2.37, "learning_rate": 0.00016458379990046625, "loss": 0.0071, "step": 11647 }, { "epoch": 2.37, "learning_rate": 0.00016456450625146882, "loss": 0.0099, "step": 11648 }, { "epoch": 2.37, "learning_rate": 0.0001645452123592166, "loss": 0.0077, "step": 11649 }, { "epoch": 2.37, "learning_rate": 0.00016452591822403189, "loss": 0.0014, "step": 11650 }, { "epoch": 2.37, "learning_rate": 0.00016450662384623693, "loss": 0.0132, "step": 11651 }, { "epoch": 2.37, "learning_rate": 0.00016448732922615393, "loss": 0.0092, "step": 11652 }, { "epoch": 2.37, "learning_rate": 0.00016446803436410523, "loss": 0.0044, "step": 11653 }, { "epoch": 2.37, "learning_rate": 0.00016444873926041304, "loss": 0.0045, "step": 11654 }, { "epoch": 2.37, "learning_rate": 0.00016442944391539962, "loss": 0.0039, "step": 11655 }, { "epoch": 2.37, "learning_rate": 0.0001644101483293873, "loss": 0.0052, "step": 11656 }, { "epoch": 2.37, "learning_rate": 0.00016439085250269823, "loss": 0.0087, "step": 11657 }, { "epoch": 2.37, "learning_rate": 0.00016437155643565478, "loss": 0.0048, "step": 11658 }, { "epoch": 2.37, "learning_rate": 0.00016435226012857923, "loss": 0.0088, "step": 11659 }, { "epoch": 2.37, "learning_rate": 0.0001643329635817938, "loss": 0.003, "step": 11660 }, { "epoch": 2.37, "learning_rate": 0.0001643136667956209, "loss": 0.0084, "step": 11661 }, { "epoch": 2.37, "learning_rate": 0.00016429436977038268, "loss": 0.0027, "step": 11662 }, { "epoch": 2.37, "learning_rate": 0.00016427507250640149, "loss": 0.0018, "step": 11663 }, { "epoch": 2.38, "learning_rate": 0.0001642557750039997, "loss": 0.0191, "step": 11664 }, { "epoch": 2.38, "learning_rate": 0.00016423647726349953, "loss": 0.0059, "step": 11665 }, { "epoch": 2.38, "learning_rate": 0.00016421717928522334, "loss": 0.0104, "step": 11666 }, { "epoch": 2.38, "learning_rate": 0.00016419788106949336, "loss": 0.0018, "step": 11667 }, { "epoch": 2.38, "learning_rate": 0.000164178582616632, "loss": 0.0057, "step": 11668 }, { "epoch": 2.38, "learning_rate": 0.00016415928392696157, "loss": 0.012, "step": 11669 }, { "epoch": 2.38, "learning_rate": 0.00016413998500080439, "loss": 0.0107, "step": 11670 }, { "epoch": 2.38, "learning_rate": 0.0001641206858384827, "loss": 0.0101, "step": 11671 }, { "epoch": 2.38, "learning_rate": 0.00016410138644031895, "loss": 0.0066, "step": 11672 }, { "epoch": 2.38, "learning_rate": 0.00016408208680663536, "loss": 0.0033, "step": 11673 }, { "epoch": 2.38, "learning_rate": 0.00016406278693775438, "loss": 0.0041, "step": 11674 }, { "epoch": 2.38, "learning_rate": 0.00016404348683399838, "loss": 0.0148, "step": 11675 }, { "epoch": 2.38, "learning_rate": 0.00016402418649568955, "loss": 0.0049, "step": 11676 }, { "epoch": 2.38, "learning_rate": 0.0001640048859231504, "loss": 0.0045, "step": 11677 }, { "epoch": 2.38, "learning_rate": 0.00016398558511670315, "loss": 0.0092, "step": 11678 }, { "epoch": 2.38, "learning_rate": 0.00016396628407667026, "loss": 0.0121, "step": 11679 }, { "epoch": 2.38, "learning_rate": 0.0001639469828033741, "loss": 0.018, "step": 11680 }, { "epoch": 2.38, "learning_rate": 0.00016392768129713694, "loss": 0.0047, "step": 11681 }, { "epoch": 2.38, "learning_rate": 0.00016390837955828125, "loss": 0.0115, "step": 11682 }, { "epoch": 2.38, "learning_rate": 0.00016388907758712934, "loss": 0.0076, "step": 11683 }, { "epoch": 2.38, "learning_rate": 0.0001638697753840036, "loss": 0.0064, "step": 11684 }, { "epoch": 2.38, "learning_rate": 0.00016385047294922652, "loss": 0.004, "step": 11685 }, { "epoch": 2.38, "learning_rate": 0.0001638311702831203, "loss": 0.0052, "step": 11686 }, { "epoch": 2.38, "learning_rate": 0.00016381186738600746, "loss": 0.0008, "step": 11687 }, { "epoch": 2.38, "learning_rate": 0.00016379256425821037, "loss": 0.0008, "step": 11688 }, { "epoch": 2.38, "learning_rate": 0.00016377326090005146, "loss": 0.0147, "step": 11689 }, { "epoch": 2.38, "learning_rate": 0.00016375395731185304, "loss": 0.0074, "step": 11690 }, { "epoch": 2.38, "learning_rate": 0.0001637346534939376, "loss": 0.0055, "step": 11691 }, { "epoch": 2.38, "learning_rate": 0.00016371534944662752, "loss": 0.0138, "step": 11692 }, { "epoch": 2.38, "learning_rate": 0.00016369604517024516, "loss": 0.0104, "step": 11693 }, { "epoch": 2.38, "learning_rate": 0.00016367674066511303, "loss": 0.0021, "step": 11694 }, { "epoch": 2.38, "learning_rate": 0.00016365743593155352, "loss": 0.0017, "step": 11695 }, { "epoch": 2.38, "learning_rate": 0.00016363813096988904, "loss": 0.0166, "step": 11696 }, { "epoch": 2.38, "learning_rate": 0.00016361882578044202, "loss": 0.0037, "step": 11697 }, { "epoch": 2.38, "learning_rate": 0.00016359952036353498, "loss": 0.0161, "step": 11698 }, { "epoch": 2.38, "learning_rate": 0.0001635802147194902, "loss": 0.0145, "step": 11699 }, { "epoch": 2.38, "learning_rate": 0.0001635609088486302, "loss": 0.0076, "step": 11700 }, { "epoch": 2.38, "learning_rate": 0.00016354160275127745, "loss": 0.0053, "step": 11701 }, { "epoch": 2.38, "learning_rate": 0.0001635222964277544, "loss": 0.0067, "step": 11702 }, { "epoch": 2.38, "learning_rate": 0.0001635029898783834, "loss": 0.0105, "step": 11703 }, { "epoch": 2.38, "learning_rate": 0.00016348368310348702, "loss": 0.0009, "step": 11704 }, { "epoch": 2.38, "learning_rate": 0.00016346437610338766, "loss": 0.0282, "step": 11705 }, { "epoch": 2.38, "learning_rate": 0.00016344506887840785, "loss": 0.0045, "step": 11706 }, { "epoch": 2.38, "learning_rate": 0.00016342576142887, "loss": 0.0046, "step": 11707 }, { "epoch": 2.38, "learning_rate": 0.00016340645375509657, "loss": 0.0094, "step": 11708 }, { "epoch": 2.38, "learning_rate": 0.00016338714585741005, "loss": 0.0268, "step": 11709 }, { "epoch": 2.38, "learning_rate": 0.00016336783773613291, "loss": 0.0059, "step": 11710 }, { "epoch": 2.38, "learning_rate": 0.0001633485293915877, "loss": 0.0044, "step": 11711 }, { "epoch": 2.38, "learning_rate": 0.00016332922082409686, "loss": 0.0114, "step": 11712 }, { "epoch": 2.38, "learning_rate": 0.0001633099120339828, "loss": 0.0059, "step": 11713 }, { "epoch": 2.39, "learning_rate": 0.00016329060302156814, "loss": 0.0064, "step": 11714 }, { "epoch": 2.39, "learning_rate": 0.00016327129378717524, "loss": 0.0056, "step": 11715 }, { "epoch": 2.39, "learning_rate": 0.00016325198433112678, "loss": 0.004, "step": 11716 }, { "epoch": 2.39, "learning_rate": 0.0001632326746537451, "loss": 0.0085, "step": 11717 }, { "epoch": 2.39, "learning_rate": 0.00016321336475535285, "loss": 0.0187, "step": 11718 }, { "epoch": 2.39, "learning_rate": 0.0001631940546362724, "loss": 0.0099, "step": 11719 }, { "epoch": 2.39, "learning_rate": 0.00016317474429682633, "loss": 0.0177, "step": 11720 }, { "epoch": 2.39, "learning_rate": 0.0001631554337373372, "loss": 0.0156, "step": 11721 }, { "epoch": 2.39, "learning_rate": 0.0001631361229581275, "loss": 0.017, "step": 11722 }, { "epoch": 2.39, "learning_rate": 0.00016311681195951974, "loss": 0.0083, "step": 11723 }, { "epoch": 2.39, "learning_rate": 0.0001630975007418364, "loss": 0.0051, "step": 11724 }, { "epoch": 2.39, "learning_rate": 0.00016307818930540014, "loss": 0.0125, "step": 11725 }, { "epoch": 2.39, "learning_rate": 0.0001630588776505334, "loss": 0.0079, "step": 11726 }, { "epoch": 2.39, "learning_rate": 0.00016303956577755878, "loss": 0.0062, "step": 11727 }, { "epoch": 2.39, "learning_rate": 0.00016302025368679878, "loss": 0.0028, "step": 11728 }, { "epoch": 2.39, "learning_rate": 0.00016300094137857598, "loss": 0.0269, "step": 11729 }, { "epoch": 2.39, "learning_rate": 0.00016298162885321294, "loss": 0.0104, "step": 11730 }, { "epoch": 2.39, "learning_rate": 0.00016296231611103216, "loss": 0.0225, "step": 11731 }, { "epoch": 2.39, "learning_rate": 0.00016294300315235623, "loss": 0.0019, "step": 11732 }, { "epoch": 2.39, "learning_rate": 0.0001629236899775077, "loss": 0.0067, "step": 11733 }, { "epoch": 2.39, "learning_rate": 0.0001629043765868092, "loss": 0.0133, "step": 11734 }, { "epoch": 2.39, "learning_rate": 0.00016288506298058322, "loss": 0.0175, "step": 11735 }, { "epoch": 2.39, "learning_rate": 0.00016286574915915235, "loss": 0.0045, "step": 11736 }, { "epoch": 2.39, "learning_rate": 0.0001628464351228392, "loss": 0.0191, "step": 11737 }, { "epoch": 2.39, "learning_rate": 0.00016282712087196634, "loss": 0.0057, "step": 11738 }, { "epoch": 2.39, "learning_rate": 0.00016280780640685639, "loss": 0.0093, "step": 11739 }, { "epoch": 2.39, "learning_rate": 0.00016278849172783185, "loss": 0.0185, "step": 11740 }, { "epoch": 2.39, "learning_rate": 0.00016276917683521533, "loss": 0.0092, "step": 11741 }, { "epoch": 2.39, "learning_rate": 0.0001627498617293295, "loss": 0.0155, "step": 11742 }, { "epoch": 2.39, "learning_rate": 0.0001627305464104969, "loss": 0.009, "step": 11743 }, { "epoch": 2.39, "learning_rate": 0.00016271123087904018, "loss": 0.0041, "step": 11744 }, { "epoch": 2.39, "learning_rate": 0.0001626919151352818, "loss": 0.0074, "step": 11745 }, { "epoch": 2.39, "learning_rate": 0.0001626725991795446, "loss": 0.0084, "step": 11746 }, { "epoch": 2.39, "learning_rate": 0.000162653283012151, "loss": 0.003, "step": 11747 }, { "epoch": 2.39, "learning_rate": 0.0001626339666334237, "loss": 0.0063, "step": 11748 }, { "epoch": 2.39, "learning_rate": 0.00016261465004368533, "loss": 0.0019, "step": 11749 }, { "epoch": 2.39, "learning_rate": 0.00016259533324325848, "loss": 0.014, "step": 11750 }, { "epoch": 2.39, "learning_rate": 0.0001625760162324658, "loss": 0.0064, "step": 11751 }, { "epoch": 2.39, "learning_rate": 0.00016255669901162992, "loss": 0.0076, "step": 11752 }, { "epoch": 2.39, "learning_rate": 0.00016253738158107347, "loss": 0.0013, "step": 11753 }, { "epoch": 2.39, "learning_rate": 0.00016251806394111906, "loss": 0.007, "step": 11754 }, { "epoch": 2.39, "learning_rate": 0.00016249874609208933, "loss": 0.0055, "step": 11755 }, { "epoch": 2.39, "learning_rate": 0.00016247942803430693, "loss": 0.0041, "step": 11756 }, { "epoch": 2.39, "learning_rate": 0.00016246010976809458, "loss": 0.0142, "step": 11757 }, { "epoch": 2.39, "learning_rate": 0.00016244079129377489, "loss": 0.0104, "step": 11758 }, { "epoch": 2.39, "learning_rate": 0.00016242147261167044, "loss": 0.0244, "step": 11759 }, { "epoch": 2.39, "learning_rate": 0.00016240215372210402, "loss": 0.0122, "step": 11760 }, { "epoch": 2.39, "learning_rate": 0.00016238283462539815, "loss": 0.0058, "step": 11761 }, { "epoch": 2.39, "learning_rate": 0.00016236351532187562, "loss": 0.0174, "step": 11762 }, { "epoch": 2.4, "learning_rate": 0.00016234419581185905, "loss": 0.0063, "step": 11763 }, { "epoch": 2.4, "learning_rate": 0.0001623248760956711, "loss": 0.0091, "step": 11764 }, { "epoch": 2.4, "learning_rate": 0.00016230555617363445, "loss": 0.0008, "step": 11765 }, { "epoch": 2.4, "learning_rate": 0.00016228623604607175, "loss": 0.0066, "step": 11766 }, { "epoch": 2.4, "learning_rate": 0.00016226691571330577, "loss": 0.0032, "step": 11767 }, { "epoch": 2.4, "learning_rate": 0.00016224759517565908, "loss": 0.0049, "step": 11768 }, { "epoch": 2.4, "learning_rate": 0.00016222827443345444, "loss": 0.0034, "step": 11769 }, { "epoch": 2.4, "learning_rate": 0.00016220895348701458, "loss": 0.0047, "step": 11770 }, { "epoch": 2.4, "learning_rate": 0.00016218963233666215, "loss": 0.0052, "step": 11771 }, { "epoch": 2.4, "learning_rate": 0.00016217031098271986, "loss": 0.0227, "step": 11772 }, { "epoch": 2.4, "learning_rate": 0.00016215098942551037, "loss": 0.0029, "step": 11773 }, { "epoch": 2.4, "learning_rate": 0.0001621316676653564, "loss": 0.0152, "step": 11774 }, { "epoch": 2.4, "learning_rate": 0.0001621123457025807, "loss": 0.0121, "step": 11775 }, { "epoch": 2.4, "learning_rate": 0.000162093023537506, "loss": 0.0047, "step": 11776 }, { "epoch": 2.4, "learning_rate": 0.00016207370117045491, "loss": 0.0326, "step": 11777 }, { "epoch": 2.4, "learning_rate": 0.00016205437860175026, "loss": 0.0054, "step": 11778 }, { "epoch": 2.4, "learning_rate": 0.0001620350558317147, "loss": 0.005, "step": 11779 }, { "epoch": 2.4, "learning_rate": 0.00016201573286067105, "loss": 0.0027, "step": 11780 }, { "epoch": 2.4, "learning_rate": 0.00016199640968894198, "loss": 0.0043, "step": 11781 }, { "epoch": 2.4, "learning_rate": 0.00016197708631685018, "loss": 0.0063, "step": 11782 }, { "epoch": 2.4, "learning_rate": 0.00016195776274471844, "loss": 0.0169, "step": 11783 }, { "epoch": 2.4, "learning_rate": 0.00016193843897286948, "loss": 0.006, "step": 11784 }, { "epoch": 2.4, "learning_rate": 0.0001619191150016261, "loss": 0.0115, "step": 11785 }, { "epoch": 2.4, "learning_rate": 0.00016189979083131096, "loss": 0.0255, "step": 11786 }, { "epoch": 2.4, "learning_rate": 0.00016188046646224683, "loss": 0.0116, "step": 11787 }, { "epoch": 2.4, "learning_rate": 0.00016186114189475648, "loss": 0.0156, "step": 11788 }, { "epoch": 2.4, "learning_rate": 0.00016184181712916273, "loss": 0.0074, "step": 11789 }, { "epoch": 2.4, "learning_rate": 0.0001618224921657883, "loss": 0.0011, "step": 11790 }, { "epoch": 2.4, "learning_rate": 0.00016180316700495587, "loss": 0.0067, "step": 11791 }, { "epoch": 2.4, "learning_rate": 0.00016178384164698827, "loss": 0.0084, "step": 11792 }, { "epoch": 2.4, "learning_rate": 0.0001617645160922083, "loss": 0.0171, "step": 11793 }, { "epoch": 2.4, "learning_rate": 0.0001617451903409387, "loss": 0.0157, "step": 11794 }, { "epoch": 2.4, "learning_rate": 0.00016172586439350227, "loss": 0.004, "step": 11795 }, { "epoch": 2.4, "learning_rate": 0.00016170653825022175, "loss": 0.0076, "step": 11796 }, { "epoch": 2.4, "learning_rate": 0.00016168721191141993, "loss": 0.0042, "step": 11797 }, { "epoch": 2.4, "learning_rate": 0.0001616678853774196, "loss": 0.0046, "step": 11798 }, { "epoch": 2.4, "learning_rate": 0.00016164855864854357, "loss": 0.007, "step": 11799 }, { "epoch": 2.4, "learning_rate": 0.00016162923172511465, "loss": 0.0011, "step": 11800 }, { "epoch": 2.4, "learning_rate": 0.00016160990460745557, "loss": 0.0028, "step": 11801 }, { "epoch": 2.4, "learning_rate": 0.0001615905772958892, "loss": 0.0086, "step": 11802 }, { "epoch": 2.4, "learning_rate": 0.0001615712497907383, "loss": 0.003, "step": 11803 }, { "epoch": 2.4, "learning_rate": 0.0001615519220923257, "loss": 0.0107, "step": 11804 }, { "epoch": 2.4, "learning_rate": 0.0001615325942009742, "loss": 0.0035, "step": 11805 }, { "epoch": 2.4, "learning_rate": 0.00016151326611700656, "loss": 0.0091, "step": 11806 }, { "epoch": 2.4, "learning_rate": 0.00016149393784074568, "loss": 0.0043, "step": 11807 }, { "epoch": 2.4, "learning_rate": 0.00016147460937251433, "loss": 0.0135, "step": 11808 }, { "epoch": 2.4, "learning_rate": 0.00016145528071263534, "loss": 0.0142, "step": 11809 }, { "epoch": 2.4, "learning_rate": 0.00016143595186143153, "loss": 0.0077, "step": 11810 }, { "epoch": 2.4, "learning_rate": 0.00016141662281922577, "loss": 0.0193, "step": 11811 }, { "epoch": 2.41, "learning_rate": 0.0001613972935863408, "loss": 0.0025, "step": 11812 }, { "epoch": 2.41, "learning_rate": 0.00016137796416309958, "loss": 0.0247, "step": 11813 }, { "epoch": 2.41, "learning_rate": 0.00016135863454982488, "loss": 0.0066, "step": 11814 }, { "epoch": 2.41, "learning_rate": 0.00016133930474683953, "loss": 0.0092, "step": 11815 }, { "epoch": 2.41, "learning_rate": 0.00016131997475446634, "loss": 0.0016, "step": 11816 }, { "epoch": 2.41, "learning_rate": 0.00016130064457302822, "loss": 0.0123, "step": 11817 }, { "epoch": 2.41, "learning_rate": 0.00016128131420284806, "loss": 0.0161, "step": 11818 }, { "epoch": 2.41, "learning_rate": 0.0001612619836442486, "loss": 0.0046, "step": 11819 }, { "epoch": 2.41, "learning_rate": 0.00016124265289755275, "loss": 0.0169, "step": 11820 }, { "epoch": 2.41, "learning_rate": 0.0001612233219630834, "loss": 0.015, "step": 11821 }, { "epoch": 2.41, "learning_rate": 0.00016120399084116338, "loss": 0.0063, "step": 11822 }, { "epoch": 2.41, "learning_rate": 0.0001611846595321156, "loss": 0.0193, "step": 11823 }, { "epoch": 2.41, "learning_rate": 0.00016116532803626287, "loss": 0.014, "step": 11824 }, { "epoch": 2.41, "learning_rate": 0.0001611459963539281, "loss": 0.0163, "step": 11825 }, { "epoch": 2.41, "learning_rate": 0.0001611266644854341, "loss": 0.0083, "step": 11826 }, { "epoch": 2.41, "learning_rate": 0.00016110733243110384, "loss": 0.0041, "step": 11827 }, { "epoch": 2.41, "learning_rate": 0.00016108800019126013, "loss": 0.0109, "step": 11828 }, { "epoch": 2.41, "learning_rate": 0.0001610686677662259, "loss": 0.0034, "step": 11829 }, { "epoch": 2.41, "learning_rate": 0.00016104933515632402, "loss": 0.0099, "step": 11830 }, { "epoch": 2.41, "learning_rate": 0.0001610300023618774, "loss": 0.0173, "step": 11831 }, { "epoch": 2.41, "learning_rate": 0.00016101066938320897, "loss": 0.0036, "step": 11832 }, { "epoch": 2.41, "learning_rate": 0.0001609913362206415, "loss": 0.0036, "step": 11833 }, { "epoch": 2.41, "learning_rate": 0.000160972002874498, "loss": 0.0124, "step": 11834 }, { "epoch": 2.41, "learning_rate": 0.00016095266934510133, "loss": 0.0052, "step": 11835 }, { "epoch": 2.41, "learning_rate": 0.0001609333356327744, "loss": 0.0157, "step": 11836 }, { "epoch": 2.41, "learning_rate": 0.0001609140017378402, "loss": 0.0112, "step": 11837 }, { "epoch": 2.41, "learning_rate": 0.00016089466766062147, "loss": 0.0136, "step": 11838 }, { "epoch": 2.41, "learning_rate": 0.00016087533340144127, "loss": 0.015, "step": 11839 }, { "epoch": 2.41, "learning_rate": 0.00016085599896062242, "loss": 0.0043, "step": 11840 }, { "epoch": 2.41, "learning_rate": 0.00016083666433848798, "loss": 0.0016, "step": 11841 }, { "epoch": 2.41, "learning_rate": 0.00016081732953536075, "loss": 0.0171, "step": 11842 }, { "epoch": 2.41, "learning_rate": 0.00016079799455156368, "loss": 0.0302, "step": 11843 }, { "epoch": 2.41, "learning_rate": 0.00016077865938741976, "loss": 0.0179, "step": 11844 }, { "epoch": 2.41, "learning_rate": 0.00016075932404325182, "loss": 0.0217, "step": 11845 }, { "epoch": 2.41, "learning_rate": 0.00016073998851938293, "loss": 0.0055, "step": 11846 }, { "epoch": 2.41, "learning_rate": 0.00016072065281613594, "loss": 0.0107, "step": 11847 }, { "epoch": 2.41, "learning_rate": 0.0001607013169338338, "loss": 0.0091, "step": 11848 }, { "epoch": 2.41, "learning_rate": 0.00016068198087279946, "loss": 0.0034, "step": 11849 }, { "epoch": 2.41, "learning_rate": 0.00016066264463335587, "loss": 0.0096, "step": 11850 }, { "epoch": 2.41, "learning_rate": 0.000160643308215826, "loss": 0.0029, "step": 11851 }, { "epoch": 2.41, "learning_rate": 0.00016062397162053277, "loss": 0.0103, "step": 11852 }, { "epoch": 2.41, "learning_rate": 0.00016060463484779918, "loss": 0.003, "step": 11853 }, { "epoch": 2.41, "learning_rate": 0.00016058529789794815, "loss": 0.0084, "step": 11854 }, { "epoch": 2.41, "learning_rate": 0.00016056596077130273, "loss": 0.0111, "step": 11855 }, { "epoch": 2.41, "learning_rate": 0.0001605466234681858, "loss": 0.006, "step": 11856 }, { "epoch": 2.41, "learning_rate": 0.00016052728598892028, "loss": 0.0053, "step": 11857 }, { "epoch": 2.41, "learning_rate": 0.00016050794833382927, "loss": 0.0181, "step": 11858 }, { "epoch": 2.41, "learning_rate": 0.0001604886105032357, "loss": 0.006, "step": 11859 }, { "epoch": 2.41, "learning_rate": 0.0001604692724974625, "loss": 0.008, "step": 11860 }, { "epoch": 2.42, "learning_rate": 0.00016044993431683265, "loss": 0.0057, "step": 11861 }, { "epoch": 2.42, "learning_rate": 0.00016043059596166926, "loss": 0.0092, "step": 11862 }, { "epoch": 2.42, "learning_rate": 0.00016041125743229516, "loss": 0.0052, "step": 11863 }, { "epoch": 2.42, "learning_rate": 0.00016039191872903346, "loss": 0.0081, "step": 11864 }, { "epoch": 2.42, "learning_rate": 0.00016037257985220706, "loss": 0.0023, "step": 11865 }, { "epoch": 2.42, "learning_rate": 0.00016035324080213904, "loss": 0.0061, "step": 11866 }, { "epoch": 2.42, "learning_rate": 0.0001603339015791523, "loss": 0.0184, "step": 11867 }, { "epoch": 2.42, "learning_rate": 0.00016031456218356993, "loss": 0.0034, "step": 11868 }, { "epoch": 2.42, "learning_rate": 0.00016029522261571495, "loss": 0.0126, "step": 11869 }, { "epoch": 2.42, "learning_rate": 0.0001602758828759102, "loss": 0.0143, "step": 11870 }, { "epoch": 2.42, "learning_rate": 0.00016025654296447888, "loss": 0.0031, "step": 11871 }, { "epoch": 2.42, "learning_rate": 0.0001602372028817439, "loss": 0.0064, "step": 11872 }, { "epoch": 2.42, "learning_rate": 0.00016021786262802835, "loss": 0.0168, "step": 11873 }, { "epoch": 2.42, "learning_rate": 0.00016019852220365522, "loss": 0.009, "step": 11874 }, { "epoch": 2.42, "learning_rate": 0.0001601791816089475, "loss": 0.0071, "step": 11875 }, { "epoch": 2.42, "learning_rate": 0.0001601598408442282, "loss": 0.0092, "step": 11876 }, { "epoch": 2.42, "learning_rate": 0.0001601404999098204, "loss": 0.0068, "step": 11877 }, { "epoch": 2.42, "learning_rate": 0.00016012115880604716, "loss": 0.0023, "step": 11878 }, { "epoch": 2.42, "learning_rate": 0.00016010181753323138, "loss": 0.0076, "step": 11879 }, { "epoch": 2.42, "learning_rate": 0.00016008247609169623, "loss": 0.0114, "step": 11880 }, { "epoch": 2.42, "learning_rate": 0.00016006313448176465, "loss": 0.0067, "step": 11881 }, { "epoch": 2.42, "learning_rate": 0.00016004379270375974, "loss": 0.0083, "step": 11882 }, { "epoch": 2.42, "learning_rate": 0.0001600244507580046, "loss": 0.011, "step": 11883 }, { "epoch": 2.42, "learning_rate": 0.00016000510864482215, "loss": 0.0069, "step": 11884 }, { "epoch": 2.42, "learning_rate": 0.00015998576636453552, "loss": 0.0238, "step": 11885 }, { "epoch": 2.42, "learning_rate": 0.00015996642391746772, "loss": 0.0259, "step": 11886 }, { "epoch": 2.42, "learning_rate": 0.00015994708130394184, "loss": 0.0121, "step": 11887 }, { "epoch": 2.42, "learning_rate": 0.00015992773852428093, "loss": 0.0039, "step": 11888 }, { "epoch": 2.42, "learning_rate": 0.00015990839557880805, "loss": 0.0106, "step": 11889 }, { "epoch": 2.42, "learning_rate": 0.00015988905246784626, "loss": 0.0069, "step": 11890 }, { "epoch": 2.42, "learning_rate": 0.0001598697091917186, "loss": 0.0036, "step": 11891 }, { "epoch": 2.42, "learning_rate": 0.0001598503657507482, "loss": 0.0017, "step": 11892 }, { "epoch": 2.42, "learning_rate": 0.00015983102214525807, "loss": 0.0104, "step": 11893 }, { "epoch": 2.42, "learning_rate": 0.00015981167837557134, "loss": 0.0056, "step": 11894 }, { "epoch": 2.42, "learning_rate": 0.00015979233444201105, "loss": 0.0053, "step": 11895 }, { "epoch": 2.42, "learning_rate": 0.00015977299034490027, "loss": 0.0133, "step": 11896 }, { "epoch": 2.42, "learning_rate": 0.00015975364608456215, "loss": 0.0053, "step": 11897 }, { "epoch": 2.42, "learning_rate": 0.0001597343016613197, "loss": 0.0015, "step": 11898 }, { "epoch": 2.42, "learning_rate": 0.00015971495707549604, "loss": 0.0108, "step": 11899 }, { "epoch": 2.42, "learning_rate": 0.00015969561232741426, "loss": 0.019, "step": 11900 }, { "epoch": 2.42, "learning_rate": 0.00015967626741739745, "loss": 0.0051, "step": 11901 }, { "epoch": 2.42, "learning_rate": 0.00015965692234576868, "loss": 0.0143, "step": 11902 }, { "epoch": 2.42, "learning_rate": 0.00015963757711285112, "loss": 0.0041, "step": 11903 }, { "epoch": 2.42, "learning_rate": 0.0001596182317189678, "loss": 0.0056, "step": 11904 }, { "epoch": 2.42, "learning_rate": 0.00015959888616444187, "loss": 0.0089, "step": 11905 }, { "epoch": 2.42, "learning_rate": 0.00015957954044959648, "loss": 0.0052, "step": 11906 }, { "epoch": 2.42, "learning_rate": 0.0001595601945747546, "loss": 0.0035, "step": 11907 }, { "epoch": 2.42, "learning_rate": 0.00015954084854023944, "loss": 0.0039, "step": 11908 }, { "epoch": 2.42, "learning_rate": 0.0001595215023463741, "loss": 0.0134, "step": 11909 }, { "epoch": 2.43, "learning_rate": 0.00015950215599348173, "loss": 0.0106, "step": 11910 }, { "epoch": 2.43, "learning_rate": 0.00015948280948188537, "loss": 0.0061, "step": 11911 }, { "epoch": 2.43, "learning_rate": 0.00015946346281190822, "loss": 0.0096, "step": 11912 }, { "epoch": 2.43, "learning_rate": 0.00015944411598387337, "loss": 0.0112, "step": 11913 }, { "epoch": 2.43, "learning_rate": 0.00015942476899810396, "loss": 0.0042, "step": 11914 }, { "epoch": 2.43, "learning_rate": 0.00015940542185492314, "loss": 0.0135, "step": 11915 }, { "epoch": 2.43, "learning_rate": 0.000159386074554654, "loss": 0.0086, "step": 11916 }, { "epoch": 2.43, "learning_rate": 0.0001593667270976197, "loss": 0.0054, "step": 11917 }, { "epoch": 2.43, "learning_rate": 0.00015934737948414333, "loss": 0.0105, "step": 11918 }, { "epoch": 2.43, "learning_rate": 0.00015932803171454812, "loss": 0.0335, "step": 11919 }, { "epoch": 2.43, "learning_rate": 0.00015930868378915725, "loss": 0.0144, "step": 11920 }, { "epoch": 2.43, "learning_rate": 0.0001592893357082937, "loss": 0.0025, "step": 11921 }, { "epoch": 2.43, "learning_rate": 0.0001592699874722807, "loss": 0.0018, "step": 11922 }, { "epoch": 2.43, "learning_rate": 0.0001592506390814414, "loss": 0.0023, "step": 11923 }, { "epoch": 2.43, "learning_rate": 0.000159231290536099, "loss": 0.0086, "step": 11924 }, { "epoch": 2.43, "learning_rate": 0.00015921194183657664, "loss": 0.0048, "step": 11925 }, { "epoch": 2.43, "learning_rate": 0.00015919259298319743, "loss": 0.0071, "step": 11926 }, { "epoch": 2.43, "learning_rate": 0.00015917324397628457, "loss": 0.0076, "step": 11927 }, { "epoch": 2.43, "learning_rate": 0.00015915389481616123, "loss": 0.004, "step": 11928 }, { "epoch": 2.43, "learning_rate": 0.00015913454550315058, "loss": 0.0047, "step": 11929 }, { "epoch": 2.43, "learning_rate": 0.00015911519603757578, "loss": 0.0073, "step": 11930 }, { "epoch": 2.43, "learning_rate": 0.00015909584641975999, "loss": 0.0015, "step": 11931 }, { "epoch": 2.43, "learning_rate": 0.00015907649665002635, "loss": 0.0041, "step": 11932 }, { "epoch": 2.43, "learning_rate": 0.00015905714672869817, "loss": 0.0107, "step": 11933 }, { "epoch": 2.43, "learning_rate": 0.00015903779665609846, "loss": 0.0183, "step": 11934 }, { "epoch": 2.43, "learning_rate": 0.00015901844643255051, "loss": 0.0059, "step": 11935 }, { "epoch": 2.43, "learning_rate": 0.0001589990960583775, "loss": 0.0057, "step": 11936 }, { "epoch": 2.43, "learning_rate": 0.00015897974553390258, "loss": 0.0017, "step": 11937 }, { "epoch": 2.43, "learning_rate": 0.000158960394859449, "loss": 0.0024, "step": 11938 }, { "epoch": 2.43, "learning_rate": 0.0001589410440353399, "loss": 0.0133, "step": 11939 }, { "epoch": 2.43, "learning_rate": 0.00015892169306189844, "loss": 0.0186, "step": 11940 }, { "epoch": 2.43, "learning_rate": 0.00015890234193944788, "loss": 0.0158, "step": 11941 }, { "epoch": 2.43, "learning_rate": 0.00015888299066831144, "loss": 0.0086, "step": 11942 }, { "epoch": 2.43, "learning_rate": 0.00015886363924881225, "loss": 0.0056, "step": 11943 }, { "epoch": 2.43, "learning_rate": 0.00015884428768127358, "loss": 0.0059, "step": 11944 }, { "epoch": 2.43, "learning_rate": 0.00015882493596601857, "loss": 0.0018, "step": 11945 }, { "epoch": 2.43, "learning_rate": 0.00015880558410337052, "loss": 0.0183, "step": 11946 }, { "epoch": 2.43, "learning_rate": 0.00015878623209365255, "loss": 0.016, "step": 11947 }, { "epoch": 2.43, "learning_rate": 0.00015876687993718796, "loss": 0.0221, "step": 11948 }, { "epoch": 2.43, "learning_rate": 0.00015874752763429993, "loss": 0.0391, "step": 11949 }, { "epoch": 2.43, "learning_rate": 0.00015872817518531164, "loss": 0.0026, "step": 11950 }, { "epoch": 2.43, "learning_rate": 0.00015870882259054635, "loss": 0.0049, "step": 11951 }, { "epoch": 2.43, "learning_rate": 0.00015868946985032734, "loss": 0.0061, "step": 11952 }, { "epoch": 2.43, "learning_rate": 0.0001586701169649777, "loss": 0.0047, "step": 11953 }, { "epoch": 2.43, "learning_rate": 0.0001586507639348208, "loss": 0.0044, "step": 11954 }, { "epoch": 2.43, "learning_rate": 0.00015863141076017978, "loss": 0.0062, "step": 11955 }, { "epoch": 2.43, "learning_rate": 0.0001586120574413779, "loss": 0.0013, "step": 11956 }, { "epoch": 2.43, "learning_rate": 0.00015859270397873846, "loss": 0.0081, "step": 11957 }, { "epoch": 2.43, "learning_rate": 0.0001585733503725846, "loss": 0.0027, "step": 11958 }, { "epoch": 2.44, "learning_rate": 0.00015855399662323964, "loss": 0.002, "step": 11959 }, { "epoch": 2.44, "learning_rate": 0.00015853464273102674, "loss": 0.0082, "step": 11960 }, { "epoch": 2.44, "learning_rate": 0.0001585152886962692, "loss": 0.0058, "step": 11961 }, { "epoch": 2.44, "learning_rate": 0.00015849593451929033, "loss": 0.0016, "step": 11962 }, { "epoch": 2.44, "learning_rate": 0.00015847658020041327, "loss": 0.0203, "step": 11963 }, { "epoch": 2.44, "learning_rate": 0.0001584572257399613, "loss": 0.0185, "step": 11964 }, { "epoch": 2.44, "learning_rate": 0.0001584378711382577, "loss": 0.0123, "step": 11965 }, { "epoch": 2.44, "learning_rate": 0.00015841851639562576, "loss": 0.0074, "step": 11966 }, { "epoch": 2.44, "learning_rate": 0.00015839916151238868, "loss": 0.0032, "step": 11967 }, { "epoch": 2.44, "learning_rate": 0.00015837980648886977, "loss": 0.0098, "step": 11968 }, { "epoch": 2.44, "learning_rate": 0.00015836045132539226, "loss": 0.0103, "step": 11969 }, { "epoch": 2.44, "learning_rate": 0.0001583410960222794, "loss": 0.007, "step": 11970 }, { "epoch": 2.44, "learning_rate": 0.00015832174057985455, "loss": 0.0148, "step": 11971 }, { "epoch": 2.44, "learning_rate": 0.0001583023849984409, "loss": 0.0083, "step": 11972 }, { "epoch": 2.44, "learning_rate": 0.00015828302927836177, "loss": 0.0124, "step": 11973 }, { "epoch": 2.44, "learning_rate": 0.00015826367341994038, "loss": 0.0059, "step": 11974 }, { "epoch": 2.44, "learning_rate": 0.0001582443174235, "loss": 0.0041, "step": 11975 }, { "epoch": 2.44, "learning_rate": 0.00015822496128936405, "loss": 0.0214, "step": 11976 }, { "epoch": 2.44, "learning_rate": 0.00015820560501785566, "loss": 0.0123, "step": 11977 }, { "epoch": 2.44, "learning_rate": 0.0001581862486092982, "loss": 0.0082, "step": 11978 }, { "epoch": 2.44, "learning_rate": 0.00015816689206401495, "loss": 0.021, "step": 11979 }, { "epoch": 2.44, "learning_rate": 0.0001581475353823292, "loss": 0.0151, "step": 11980 }, { "epoch": 2.44, "learning_rate": 0.00015812817856456418, "loss": 0.0119, "step": 11981 }, { "epoch": 2.44, "learning_rate": 0.00015810882161104324, "loss": 0.0048, "step": 11982 }, { "epoch": 2.44, "learning_rate": 0.00015808946452208972, "loss": 0.0101, "step": 11983 }, { "epoch": 2.44, "learning_rate": 0.00015807010729802684, "loss": 0.0057, "step": 11984 }, { "epoch": 2.44, "learning_rate": 0.00015805074993917792, "loss": 0.0102, "step": 11985 }, { "epoch": 2.44, "learning_rate": 0.00015803139244586627, "loss": 0.0084, "step": 11986 }, { "epoch": 2.44, "learning_rate": 0.00015801203481841523, "loss": 0.012, "step": 11987 }, { "epoch": 2.44, "learning_rate": 0.00015799267705714809, "loss": 0.0015, "step": 11988 }, { "epoch": 2.44, "learning_rate": 0.00015797331916238817, "loss": 0.0144, "step": 11989 }, { "epoch": 2.44, "learning_rate": 0.00015795396113445876, "loss": 0.0139, "step": 11990 }, { "epoch": 2.44, "learning_rate": 0.00015793460297368315, "loss": 0.0039, "step": 11991 }, { "epoch": 2.44, "learning_rate": 0.00015791524468038474, "loss": 0.0093, "step": 11992 }, { "epoch": 2.44, "learning_rate": 0.00015789588625488677, "loss": 0.0093, "step": 11993 }, { "epoch": 2.44, "learning_rate": 0.0001578765276975126, "loss": 0.0144, "step": 11994 }, { "epoch": 2.44, "learning_rate": 0.00015785716900858557, "loss": 0.0007, "step": 11995 }, { "epoch": 2.44, "learning_rate": 0.00015783781018842896, "loss": 0.0119, "step": 11996 }, { "epoch": 2.44, "learning_rate": 0.00015781845123736613, "loss": 0.0024, "step": 11997 }, { "epoch": 2.44, "learning_rate": 0.00015779909215572042, "loss": 0.0121, "step": 11998 }, { "epoch": 2.44, "learning_rate": 0.00015777973294381516, "loss": 0.0089, "step": 11999 }, { "epoch": 2.44, "learning_rate": 0.00015776037360197367, "loss": 0.0004, "step": 12000 }, { "epoch": 2.44, "learning_rate": 0.00015774101413051927, "loss": 0.0141, "step": 12001 }, { "epoch": 2.44, "learning_rate": 0.0001577216545297753, "loss": 0.0261, "step": 12002 }, { "epoch": 2.44, "learning_rate": 0.0001577022948000652, "loss": 0.0101, "step": 12003 }, { "epoch": 2.44, "learning_rate": 0.00015768293494171216, "loss": 0.0193, "step": 12004 }, { "epoch": 2.44, "learning_rate": 0.00015766357495503963, "loss": 0.0076, "step": 12005 }, { "epoch": 2.44, "learning_rate": 0.00015764421484037094, "loss": 0.0211, "step": 12006 }, { "epoch": 2.44, "learning_rate": 0.00015762485459802942, "loss": 0.0061, "step": 12007 }, { "epoch": 2.45, "learning_rate": 0.00015760549422833846, "loss": 0.0198, "step": 12008 }, { "epoch": 2.45, "learning_rate": 0.00015758613373162138, "loss": 0.0031, "step": 12009 }, { "epoch": 2.45, "learning_rate": 0.00015756677310820155, "loss": 0.0062, "step": 12010 }, { "epoch": 2.45, "learning_rate": 0.0001575474123584023, "loss": 0.0073, "step": 12011 }, { "epoch": 2.45, "learning_rate": 0.00015752805148254708, "loss": 0.0065, "step": 12012 }, { "epoch": 2.45, "learning_rate": 0.0001575086904809591, "loss": 0.0046, "step": 12013 }, { "epoch": 2.45, "learning_rate": 0.00015748932935396188, "loss": 0.0101, "step": 12014 }, { "epoch": 2.45, "learning_rate": 0.00015746996810187872, "loss": 0.0065, "step": 12015 }, { "epoch": 2.45, "learning_rate": 0.00015745060672503296, "loss": 0.0209, "step": 12016 }, { "epoch": 2.45, "learning_rate": 0.00015743124522374802, "loss": 0.0082, "step": 12017 }, { "epoch": 2.45, "learning_rate": 0.00015741188359834723, "loss": 0.0015, "step": 12018 }, { "epoch": 2.45, "learning_rate": 0.00015739252184915405, "loss": 0.0064, "step": 12019 }, { "epoch": 2.45, "learning_rate": 0.00015737315997649176, "loss": 0.0202, "step": 12020 }, { "epoch": 2.45, "learning_rate": 0.00015735379798068375, "loss": 0.0094, "step": 12021 }, { "epoch": 2.45, "learning_rate": 0.00015733443586205353, "loss": 0.0119, "step": 12022 }, { "epoch": 2.45, "learning_rate": 0.0001573150736209243, "loss": 0.0088, "step": 12023 }, { "epoch": 2.45, "learning_rate": 0.0001572957112576196, "loss": 0.02, "step": 12024 }, { "epoch": 2.45, "learning_rate": 0.0001572763487724627, "loss": 0.0116, "step": 12025 }, { "epoch": 2.45, "learning_rate": 0.00015725698616577704, "loss": 0.0058, "step": 12026 }, { "epoch": 2.45, "learning_rate": 0.00015723762343788602, "loss": 0.0129, "step": 12027 }, { "epoch": 2.45, "learning_rate": 0.00015721826058911304, "loss": 0.0153, "step": 12028 }, { "epoch": 2.45, "learning_rate": 0.00015719889761978145, "loss": 0.0112, "step": 12029 }, { "epoch": 2.45, "learning_rate": 0.0001571795345302147, "loss": 0.0039, "step": 12030 }, { "epoch": 2.45, "learning_rate": 0.00015716017132073618, "loss": 0.0107, "step": 12031 }, { "epoch": 2.45, "learning_rate": 0.00015714080799166932, "loss": 0.0217, "step": 12032 }, { "epoch": 2.45, "learning_rate": 0.00015712144454333742, "loss": 0.0029, "step": 12033 }, { "epoch": 2.45, "learning_rate": 0.00015710208097606396, "loss": 0.0088, "step": 12034 }, { "epoch": 2.45, "learning_rate": 0.00015708271729017237, "loss": 0.0125, "step": 12035 }, { "epoch": 2.45, "learning_rate": 0.00015706335348598604, "loss": 0.0148, "step": 12036 }, { "epoch": 2.45, "learning_rate": 0.00015704398956382833, "loss": 0.0113, "step": 12037 }, { "epoch": 2.45, "learning_rate": 0.00015702462552402276, "loss": 0.0064, "step": 12038 }, { "epoch": 2.45, "learning_rate": 0.0001570052613668926, "loss": 0.0128, "step": 12039 }, { "epoch": 2.45, "learning_rate": 0.00015698589709276146, "loss": 0.0072, "step": 12040 }, { "epoch": 2.45, "learning_rate": 0.00015696653270195256, "loss": 0.0195, "step": 12041 }, { "epoch": 2.45, "learning_rate": 0.00015694716819478948, "loss": 0.007, "step": 12042 }, { "epoch": 2.45, "learning_rate": 0.00015692780357159553, "loss": 0.0092, "step": 12043 }, { "epoch": 2.45, "learning_rate": 0.0001569084388326942, "loss": 0.0014, "step": 12044 }, { "epoch": 2.45, "learning_rate": 0.0001568890739784089, "loss": 0.0226, "step": 12045 }, { "epoch": 2.45, "learning_rate": 0.0001568697090090631, "loss": 0.0082, "step": 12046 }, { "epoch": 2.45, "learning_rate": 0.00015685034392498012, "loss": 0.0051, "step": 12047 }, { "epoch": 2.45, "learning_rate": 0.00015683097872648346, "loss": 0.0149, "step": 12048 }, { "epoch": 2.45, "learning_rate": 0.0001568116134138966, "loss": 0.0111, "step": 12049 }, { "epoch": 2.45, "learning_rate": 0.00015679224798754296, "loss": 0.0122, "step": 12050 }, { "epoch": 2.45, "learning_rate": 0.00015677288244774593, "loss": 0.0142, "step": 12051 }, { "epoch": 2.45, "learning_rate": 0.00015675351679482897, "loss": 0.006, "step": 12052 }, { "epoch": 2.45, "learning_rate": 0.00015673415102911552, "loss": 0.0059, "step": 12053 }, { "epoch": 2.45, "learning_rate": 0.0001567147851509291, "loss": 0.0148, "step": 12054 }, { "epoch": 2.45, "learning_rate": 0.00015669541916059305, "loss": 0.0148, "step": 12055 }, { "epoch": 2.45, "learning_rate": 0.00015667605305843085, "loss": 0.0063, "step": 12056 }, { "epoch": 2.46, "learning_rate": 0.00015665668684476598, "loss": 0.0039, "step": 12057 }, { "epoch": 2.46, "learning_rate": 0.00015663732051992188, "loss": 0.0069, "step": 12058 }, { "epoch": 2.46, "learning_rate": 0.00015661795408422195, "loss": 0.0149, "step": 12059 }, { "epoch": 2.46, "learning_rate": 0.00015659858753798973, "loss": 0.0034, "step": 12060 }, { "epoch": 2.46, "learning_rate": 0.00015657922088154863, "loss": 0.0065, "step": 12061 }, { "epoch": 2.46, "learning_rate": 0.00015655985411522214, "loss": 0.0021, "step": 12062 }, { "epoch": 2.46, "learning_rate": 0.00015654048723933375, "loss": 0.0116, "step": 12063 }, { "epoch": 2.46, "learning_rate": 0.00015652112025420683, "loss": 0.0018, "step": 12064 }, { "epoch": 2.46, "learning_rate": 0.00015650175316016488, "loss": 0.0162, "step": 12065 }, { "epoch": 2.46, "learning_rate": 0.0001564823859575314, "loss": 0.014, "step": 12066 }, { "epoch": 2.46, "learning_rate": 0.0001564630186466298, "loss": 0.0228, "step": 12067 }, { "epoch": 2.46, "learning_rate": 0.0001564436512277836, "loss": 0.0048, "step": 12068 }, { "epoch": 2.46, "learning_rate": 0.00015642428370131627, "loss": 0.0124, "step": 12069 }, { "epoch": 2.46, "learning_rate": 0.00015640491606755129, "loss": 0.0021, "step": 12070 }, { "epoch": 2.46, "learning_rate": 0.0001563855483268121, "loss": 0.0014, "step": 12071 }, { "epoch": 2.46, "learning_rate": 0.00015636618047942222, "loss": 0.0048, "step": 12072 }, { "epoch": 2.46, "learning_rate": 0.00015634681252570514, "loss": 0.0088, "step": 12073 }, { "epoch": 2.46, "learning_rate": 0.00015632744446598425, "loss": 0.0342, "step": 12074 }, { "epoch": 2.46, "learning_rate": 0.00015630807630058314, "loss": 0.0162, "step": 12075 }, { "epoch": 2.46, "learning_rate": 0.0001562887080298252, "loss": 0.0076, "step": 12076 }, { "epoch": 2.46, "learning_rate": 0.00015626933965403402, "loss": 0.0042, "step": 12077 }, { "epoch": 2.46, "learning_rate": 0.000156249971173533, "loss": 0.0354, "step": 12078 }, { "epoch": 2.46, "learning_rate": 0.00015623060258864563, "loss": 0.0059, "step": 12079 }, { "epoch": 2.46, "learning_rate": 0.0001562112338996955, "loss": 0.0068, "step": 12080 }, { "epoch": 2.46, "learning_rate": 0.00015619186510700597, "loss": 0.0004, "step": 12081 }, { "epoch": 2.46, "learning_rate": 0.00015617249621090068, "loss": 0.015, "step": 12082 }, { "epoch": 2.46, "learning_rate": 0.00015615312721170303, "loss": 0.0033, "step": 12083 }, { "epoch": 2.46, "learning_rate": 0.0001561337581097365, "loss": 0.0104, "step": 12084 }, { "epoch": 2.46, "learning_rate": 0.0001561143889053247, "loss": 0.0082, "step": 12085 }, { "epoch": 2.46, "learning_rate": 0.00015609501959879104, "loss": 0.0044, "step": 12086 }, { "epoch": 2.46, "learning_rate": 0.00015607565019045902, "loss": 0.009, "step": 12087 }, { "epoch": 2.46, "learning_rate": 0.00015605628068065218, "loss": 0.0107, "step": 12088 }, { "epoch": 2.46, "learning_rate": 0.000156036911069694, "loss": 0.0183, "step": 12089 }, { "epoch": 2.46, "learning_rate": 0.000156017541357908, "loss": 0.0265, "step": 12090 }, { "epoch": 2.46, "learning_rate": 0.0001559981715456178, "loss": 0.0096, "step": 12091 }, { "epoch": 2.46, "learning_rate": 0.00015597880163314672, "loss": 0.0157, "step": 12092 }, { "epoch": 2.46, "learning_rate": 0.0001559594316208184, "loss": 0.0086, "step": 12093 }, { "epoch": 2.46, "learning_rate": 0.0001559400615089563, "loss": 0.0071, "step": 12094 }, { "epoch": 2.46, "learning_rate": 0.00015592069129788397, "loss": 0.0018, "step": 12095 }, { "epoch": 2.46, "learning_rate": 0.00015590132098792497, "loss": 0.0021, "step": 12096 }, { "epoch": 2.46, "learning_rate": 0.00015588195057940273, "loss": 0.016, "step": 12097 }, { "epoch": 2.46, "learning_rate": 0.00015586258007264082, "loss": 0.0041, "step": 12098 }, { "epoch": 2.46, "learning_rate": 0.00015584320946796274, "loss": 0.0223, "step": 12099 }, { "epoch": 2.46, "learning_rate": 0.000155823838765692, "loss": 0.0028, "step": 12100 }, { "epoch": 2.46, "learning_rate": 0.0001558044679661522, "loss": 0.005, "step": 12101 }, { "epoch": 2.46, "learning_rate": 0.0001557850970696668, "loss": 0.0154, "step": 12102 }, { "epoch": 2.46, "learning_rate": 0.0001557657260765594, "loss": 0.0065, "step": 12103 }, { "epoch": 2.46, "learning_rate": 0.00015574635498715348, "loss": 0.0118, "step": 12104 }, { "epoch": 2.46, "learning_rate": 0.0001557269838017726, "loss": 0.0019, "step": 12105 }, { "epoch": 2.47, "learning_rate": 0.00015570761252074026, "loss": 0.0067, "step": 12106 }, { "epoch": 2.47, "learning_rate": 0.00015568824114438, "loss": 0.0067, "step": 12107 }, { "epoch": 2.47, "learning_rate": 0.0001556688696730154, "loss": 0.0094, "step": 12108 }, { "epoch": 2.47, "learning_rate": 0.00015564949810696995, "loss": 0.0101, "step": 12109 }, { "epoch": 2.47, "learning_rate": 0.00015563012644656725, "loss": 0.0058, "step": 12110 }, { "epoch": 2.47, "learning_rate": 0.0001556107546921308, "loss": 0.01, "step": 12111 }, { "epoch": 2.47, "learning_rate": 0.00015559138284398417, "loss": 0.04, "step": 12112 }, { "epoch": 2.47, "learning_rate": 0.00015557201090245085, "loss": 0.0106, "step": 12113 }, { "epoch": 2.47, "learning_rate": 0.00015555263886785447, "loss": 0.0025, "step": 12114 }, { "epoch": 2.47, "learning_rate": 0.00015553326674051852, "loss": 0.0035, "step": 12115 }, { "epoch": 2.47, "learning_rate": 0.0001555138945207666, "loss": 0.0074, "step": 12116 }, { "epoch": 2.47, "learning_rate": 0.00015549452220892218, "loss": 0.0067, "step": 12117 }, { "epoch": 2.47, "learning_rate": 0.00015547514980530892, "loss": 0.0023, "step": 12118 }, { "epoch": 2.47, "learning_rate": 0.00015545577731025027, "loss": 0.0163, "step": 12119 }, { "epoch": 2.47, "learning_rate": 0.00015543640472406986, "loss": 0.0168, "step": 12120 }, { "epoch": 2.47, "learning_rate": 0.00015541703204709125, "loss": 0.0068, "step": 12121 }, { "epoch": 2.47, "learning_rate": 0.00015539765927963795, "loss": 0.015, "step": 12122 }, { "epoch": 2.47, "learning_rate": 0.0001553782864220336, "loss": 0.0199, "step": 12123 }, { "epoch": 2.47, "learning_rate": 0.00015535891347460168, "loss": 0.0146, "step": 12124 }, { "epoch": 2.47, "learning_rate": 0.00015533954043766578, "loss": 0.0051, "step": 12125 }, { "epoch": 2.47, "learning_rate": 0.00015532016731154949, "loss": 0.0228, "step": 12126 }, { "epoch": 2.47, "learning_rate": 0.00015530079409657637, "loss": 0.0089, "step": 12127 }, { "epoch": 2.47, "learning_rate": 0.00015528142079307, "loss": 0.0038, "step": 12128 }, { "epoch": 2.47, "learning_rate": 0.0001552620474013539, "loss": 0.0028, "step": 12129 }, { "epoch": 2.47, "learning_rate": 0.0001552426739217517, "loss": 0.0056, "step": 12130 }, { "epoch": 2.47, "learning_rate": 0.00015522330035458687, "loss": 0.0042, "step": 12131 }, { "epoch": 2.47, "learning_rate": 0.00015520392670018311, "loss": 0.0103, "step": 12132 }, { "epoch": 2.47, "learning_rate": 0.000155184552958864, "loss": 0.0035, "step": 12133 }, { "epoch": 2.47, "learning_rate": 0.00015516517913095307, "loss": 0.0018, "step": 12134 }, { "epoch": 2.47, "learning_rate": 0.00015514580521677385, "loss": 0.0039, "step": 12135 }, { "epoch": 2.47, "learning_rate": 0.00015512643121664999, "loss": 0.0014, "step": 12136 }, { "epoch": 2.47, "learning_rate": 0.00015510705713090505, "loss": 0.0095, "step": 12137 }, { "epoch": 2.47, "learning_rate": 0.00015508768295986261, "loss": 0.0172, "step": 12138 }, { "epoch": 2.47, "learning_rate": 0.00015506830870384627, "loss": 0.0222, "step": 12139 }, { "epoch": 2.47, "learning_rate": 0.00015504893436317957, "loss": 0.0047, "step": 12140 }, { "epoch": 2.47, "learning_rate": 0.00015502955993818617, "loss": 0.0048, "step": 12141 }, { "epoch": 2.47, "learning_rate": 0.00015501018542918963, "loss": 0.0047, "step": 12142 }, { "epoch": 2.47, "learning_rate": 0.00015499081083651352, "loss": 0.0004, "step": 12143 }, { "epoch": 2.47, "learning_rate": 0.00015497143616048143, "loss": 0.0105, "step": 12144 }, { "epoch": 2.47, "learning_rate": 0.000154952061401417, "loss": 0.0111, "step": 12145 }, { "epoch": 2.47, "learning_rate": 0.00015493268655964379, "loss": 0.0071, "step": 12146 }, { "epoch": 2.47, "learning_rate": 0.00015491331163548544, "loss": 0.0077, "step": 12147 }, { "epoch": 2.47, "learning_rate": 0.0001548939366292655, "loss": 0.0076, "step": 12148 }, { "epoch": 2.47, "learning_rate": 0.00015487456154130753, "loss": 0.0135, "step": 12149 }, { "epoch": 2.47, "learning_rate": 0.00015485518637193524, "loss": 0.0215, "step": 12150 }, { "epoch": 2.47, "learning_rate": 0.0001548358111214721, "loss": 0.0008, "step": 12151 }, { "epoch": 2.47, "learning_rate": 0.00015481643579024187, "loss": 0.0046, "step": 12152 }, { "epoch": 2.47, "learning_rate": 0.00015479706037856798, "loss": 0.0074, "step": 12153 }, { "epoch": 2.47, "learning_rate": 0.0001547776848867742, "loss": 0.0065, "step": 12154 }, { "epoch": 2.47, "learning_rate": 0.00015475830931518402, "loss": 0.0038, "step": 12155 }, { "epoch": 2.48, "learning_rate": 0.00015473893366412114, "loss": 0.0065, "step": 12156 }, { "epoch": 2.48, "learning_rate": 0.0001547195579339091, "loss": 0.0048, "step": 12157 }, { "epoch": 2.48, "learning_rate": 0.00015470018212487152, "loss": 0.0005, "step": 12158 }, { "epoch": 2.48, "learning_rate": 0.00015468080623733203, "loss": 0.0068, "step": 12159 }, { "epoch": 2.48, "learning_rate": 0.0001546614302716143, "loss": 0.0175, "step": 12160 }, { "epoch": 2.48, "learning_rate": 0.0001546420542280418, "loss": 0.0103, "step": 12161 }, { "epoch": 2.48, "learning_rate": 0.00015462267810693823, "loss": 0.0157, "step": 12162 }, { "epoch": 2.48, "learning_rate": 0.00015460330190862723, "loss": 0.013, "step": 12163 }, { "epoch": 2.48, "learning_rate": 0.0001545839256334324, "loss": 0.0075, "step": 12164 }, { "epoch": 2.48, "learning_rate": 0.00015456454928167743, "loss": 0.007, "step": 12165 }, { "epoch": 2.48, "learning_rate": 0.00015454517285368578, "loss": 0.0028, "step": 12166 }, { "epoch": 2.48, "learning_rate": 0.0001545257963497812, "loss": 0.0217, "step": 12167 }, { "epoch": 2.48, "learning_rate": 0.00015450641977028727, "loss": 0.0035, "step": 12168 }, { "epoch": 2.48, "learning_rate": 0.00015448704311552761, "loss": 0.0096, "step": 12169 }, { "epoch": 2.48, "learning_rate": 0.00015446766638582593, "loss": 0.004, "step": 12170 }, { "epoch": 2.48, "learning_rate": 0.00015444828958150573, "loss": 0.0113, "step": 12171 }, { "epoch": 2.48, "learning_rate": 0.00015442891270289066, "loss": 0.0106, "step": 12172 }, { "epoch": 2.48, "learning_rate": 0.0001544095357503044, "loss": 0.0139, "step": 12173 }, { "epoch": 2.48, "learning_rate": 0.00015439015872407066, "loss": 0.0302, "step": 12174 }, { "epoch": 2.48, "learning_rate": 0.0001543707816245129, "loss": 0.0024, "step": 12175 }, { "epoch": 2.48, "learning_rate": 0.00015435140445195484, "loss": 0.0072, "step": 12176 }, { "epoch": 2.48, "learning_rate": 0.00015433202720672014, "loss": 0.0022, "step": 12177 }, { "epoch": 2.48, "learning_rate": 0.0001543126498891324, "loss": 0.0099, "step": 12178 }, { "epoch": 2.48, "learning_rate": 0.00015429327249951528, "loss": 0.0156, "step": 12179 }, { "epoch": 2.48, "learning_rate": 0.0001542738950381924, "loss": 0.0014, "step": 12180 }, { "epoch": 2.48, "learning_rate": 0.00015425451750548737, "loss": 0.0076, "step": 12181 }, { "epoch": 2.48, "learning_rate": 0.0001542351399017239, "loss": 0.0182, "step": 12182 }, { "epoch": 2.48, "learning_rate": 0.0001542157622272256, "loss": 0.0116, "step": 12183 }, { "epoch": 2.48, "learning_rate": 0.00015419638448231607, "loss": 0.0034, "step": 12184 }, { "epoch": 2.48, "learning_rate": 0.00015417700666731904, "loss": 0.0026, "step": 12185 }, { "epoch": 2.48, "learning_rate": 0.0001541576287825581, "loss": 0.0049, "step": 12186 }, { "epoch": 2.48, "learning_rate": 0.0001541382508283569, "loss": 0.0126, "step": 12187 }, { "epoch": 2.48, "learning_rate": 0.00015411887280503917, "loss": 0.0058, "step": 12188 }, { "epoch": 2.48, "learning_rate": 0.0001540994947129284, "loss": 0.0036, "step": 12189 }, { "epoch": 2.48, "learning_rate": 0.00015408011655234838, "loss": 0.0035, "step": 12190 }, { "epoch": 2.48, "learning_rate": 0.00015406073832362267, "loss": 0.0081, "step": 12191 }, { "epoch": 2.48, "learning_rate": 0.000154041360027075, "loss": 0.0046, "step": 12192 }, { "epoch": 2.48, "learning_rate": 0.00015402198166302898, "loss": 0.0156, "step": 12193 }, { "epoch": 2.48, "learning_rate": 0.00015400260323180826, "loss": 0.0137, "step": 12194 }, { "epoch": 2.48, "learning_rate": 0.0001539832247337365, "loss": 0.017, "step": 12195 }, { "epoch": 2.48, "learning_rate": 0.00015396384616913743, "loss": 0.0057, "step": 12196 }, { "epoch": 2.48, "learning_rate": 0.00015394446753833461, "loss": 0.0097, "step": 12197 }, { "epoch": 2.48, "learning_rate": 0.00015392508884165177, "loss": 0.0032, "step": 12198 }, { "epoch": 2.48, "learning_rate": 0.0001539057100794125, "loss": 0.0091, "step": 12199 }, { "epoch": 2.48, "learning_rate": 0.00015388633125194048, "loss": 0.0123, "step": 12200 }, { "epoch": 2.48, "learning_rate": 0.0001538669523595594, "loss": 0.0056, "step": 12201 }, { "epoch": 2.48, "learning_rate": 0.00015384757340259294, "loss": 0.01, "step": 12202 }, { "epoch": 2.48, "learning_rate": 0.00015382819438136471, "loss": 0.0051, "step": 12203 }, { "epoch": 2.48, "learning_rate": 0.00015380881529619843, "loss": 0.0012, "step": 12204 }, { "epoch": 2.49, "learning_rate": 0.00015378943614741776, "loss": 0.0108, "step": 12205 }, { "epoch": 2.49, "learning_rate": 0.00015377005693534634, "loss": 0.0063, "step": 12206 }, { "epoch": 2.49, "learning_rate": 0.00015375067766030788, "loss": 0.0201, "step": 12207 }, { "epoch": 2.49, "learning_rate": 0.00015373129832262598, "loss": 0.0198, "step": 12208 }, { "epoch": 2.49, "learning_rate": 0.0001537119189226244, "loss": 0.0011, "step": 12209 }, { "epoch": 2.49, "learning_rate": 0.0001536925394606267, "loss": 0.0166, "step": 12210 }, { "epoch": 2.49, "learning_rate": 0.00015367315993695667, "loss": 0.0072, "step": 12211 }, { "epoch": 2.49, "learning_rate": 0.00015365378035193795, "loss": 0.0027, "step": 12212 }, { "epoch": 2.49, "learning_rate": 0.00015363440070589415, "loss": 0.0122, "step": 12213 }, { "epoch": 2.49, "learning_rate": 0.00015361502099914897, "loss": 0.008, "step": 12214 }, { "epoch": 2.49, "learning_rate": 0.00015359564123202616, "loss": 0.0144, "step": 12215 }, { "epoch": 2.49, "learning_rate": 0.0001535762614048494, "loss": 0.0087, "step": 12216 }, { "epoch": 2.49, "learning_rate": 0.00015355688151794228, "loss": 0.0007, "step": 12217 }, { "epoch": 2.49, "learning_rate": 0.00015353750157162853, "loss": 0.0072, "step": 12218 }, { "epoch": 2.49, "learning_rate": 0.00015351812156623183, "loss": 0.0035, "step": 12219 }, { "epoch": 2.49, "learning_rate": 0.00015349874150207582, "loss": 0.0031, "step": 12220 }, { "epoch": 2.49, "learning_rate": 0.0001534793613794843, "loss": 0.0051, "step": 12221 }, { "epoch": 2.49, "learning_rate": 0.00015345998119878083, "loss": 0.0063, "step": 12222 }, { "epoch": 2.49, "learning_rate": 0.00015344060096028915, "loss": 0.0088, "step": 12223 }, { "epoch": 2.49, "learning_rate": 0.0001534212206643329, "loss": 0.0038, "step": 12224 }, { "epoch": 2.49, "learning_rate": 0.00015340184031123588, "loss": 0.0084, "step": 12225 }, { "epoch": 2.49, "learning_rate": 0.00015338245990132165, "loss": 0.0029, "step": 12226 }, { "epoch": 2.49, "learning_rate": 0.00015336307943491397, "loss": 0.0185, "step": 12227 }, { "epoch": 2.49, "learning_rate": 0.00015334369891233652, "loss": 0.0108, "step": 12228 }, { "epoch": 2.49, "learning_rate": 0.00015332431833391298, "loss": 0.019, "step": 12229 }, { "epoch": 2.49, "learning_rate": 0.0001533049376999671, "loss": 0.0222, "step": 12230 }, { "epoch": 2.49, "learning_rate": 0.00015328555701082247, "loss": 0.0024, "step": 12231 }, { "epoch": 2.49, "learning_rate": 0.00015326617626680282, "loss": 0.0009, "step": 12232 }, { "epoch": 2.49, "learning_rate": 0.0001532467954682319, "loss": 0.0035, "step": 12233 }, { "epoch": 2.49, "learning_rate": 0.00015322741461543332, "loss": 0.022, "step": 12234 }, { "epoch": 2.49, "learning_rate": 0.00015320803370873085, "loss": 0.0138, "step": 12235 }, { "epoch": 2.49, "learning_rate": 0.00015318865274844816, "loss": 0.001, "step": 12236 }, { "epoch": 2.49, "learning_rate": 0.00015316927173490897, "loss": 0.0078, "step": 12237 }, { "epoch": 2.49, "learning_rate": 0.00015314989066843695, "loss": 0.0132, "step": 12238 }, { "epoch": 2.49, "learning_rate": 0.00015313050954935583, "loss": 0.0029, "step": 12239 }, { "epoch": 2.49, "learning_rate": 0.00015311112837798925, "loss": 0.0207, "step": 12240 }, { "epoch": 2.49, "learning_rate": 0.00015309174715466095, "loss": 0.0133, "step": 12241 }, { "epoch": 2.49, "learning_rate": 0.00015307236587969468, "loss": 0.0278, "step": 12242 }, { "epoch": 2.49, "learning_rate": 0.00015305298455341407, "loss": 0.0079, "step": 12243 }, { "epoch": 2.49, "learning_rate": 0.00015303360317614283, "loss": 0.0097, "step": 12244 }, { "epoch": 2.49, "learning_rate": 0.00015301422174820471, "loss": 0.0148, "step": 12245 }, { "epoch": 2.49, "learning_rate": 0.00015299484026992343, "loss": 0.007, "step": 12246 }, { "epoch": 2.49, "learning_rate": 0.00015297545874162262, "loss": 0.0036, "step": 12247 }, { "epoch": 2.49, "learning_rate": 0.0001529560771636261, "loss": 0.0183, "step": 12248 }, { "epoch": 2.49, "learning_rate": 0.00015293669553625747, "loss": 0.0034, "step": 12249 }, { "epoch": 2.49, "learning_rate": 0.00015291731385984046, "loss": 0.0088, "step": 12250 }, { "epoch": 2.49, "learning_rate": 0.0001528979321346988, "loss": 0.0113, "step": 12251 }, { "epoch": 2.49, "learning_rate": 0.00015287855036115623, "loss": 0.0021, "step": 12252 }, { "epoch": 2.49, "learning_rate": 0.00015285916853953645, "loss": 0.0038, "step": 12253 }, { "epoch": 2.5, "learning_rate": 0.00015283978667016314, "loss": 0.0139, "step": 12254 }, { "epoch": 2.5, "learning_rate": 0.00015282040475336, "loss": 0.0031, "step": 12255 }, { "epoch": 2.5, "learning_rate": 0.00015280102278945082, "loss": 0.0015, "step": 12256 }, { "epoch": 2.5, "learning_rate": 0.00015278164077875924, "loss": 0.005, "step": 12257 }, { "epoch": 2.5, "learning_rate": 0.00015276225872160902, "loss": 0.0099, "step": 12258 }, { "epoch": 2.5, "learning_rate": 0.0001527428766183239, "loss": 0.0131, "step": 12259 }, { "epoch": 2.5, "learning_rate": 0.0001527234944692275, "loss": 0.0047, "step": 12260 }, { "epoch": 2.5, "learning_rate": 0.00015270411227464366, "loss": 0.0019, "step": 12261 }, { "epoch": 2.5, "learning_rate": 0.00015268473003489602, "loss": 0.0125, "step": 12262 }, { "epoch": 2.5, "learning_rate": 0.00015266534775030833, "loss": 0.0065, "step": 12263 }, { "epoch": 2.5, "learning_rate": 0.00015264596542120427, "loss": 0.0074, "step": 12264 }, { "epoch": 2.5, "learning_rate": 0.00015262658304790761, "loss": 0.0069, "step": 12265 }, { "epoch": 2.5, "learning_rate": 0.00015260720063074208, "loss": 0.0043, "step": 12266 }, { "epoch": 2.5, "learning_rate": 0.00015258781817003135, "loss": 0.0075, "step": 12267 }, { "epoch": 2.5, "learning_rate": 0.00015256843566609915, "loss": 0.0047, "step": 12268 }, { "epoch": 2.5, "learning_rate": 0.00015254905311926924, "loss": 0.0361, "step": 12269 }, { "epoch": 2.5, "learning_rate": 0.00015252967052986535, "loss": 0.0183, "step": 12270 }, { "epoch": 2.5, "learning_rate": 0.00015251028789821123, "loss": 0.0054, "step": 12271 }, { "epoch": 2.5, "learning_rate": 0.0001524909052246305, "loss": 0.0033, "step": 12272 }, { "epoch": 2.5, "learning_rate": 0.00015247152250944692, "loss": 0.0201, "step": 12273 }, { "epoch": 2.5, "learning_rate": 0.00015245213975298433, "loss": 0.0072, "step": 12274 }, { "epoch": 2.5, "learning_rate": 0.00015243275695556632, "loss": 0.0009, "step": 12275 }, { "epoch": 2.5, "learning_rate": 0.0001524133741175167, "loss": 0.0025, "step": 12276 }, { "epoch": 2.5, "learning_rate": 0.00015239399123915916, "loss": 0.005, "step": 12277 }, { "epoch": 2.5, "learning_rate": 0.00015237460832081748, "loss": 0.011, "step": 12278 }, { "epoch": 2.5, "learning_rate": 0.0001523552253628153, "loss": 0.0076, "step": 12279 }, { "epoch": 2.5, "learning_rate": 0.00015233584236547647, "loss": 0.0024, "step": 12280 }, { "epoch": 2.5, "learning_rate": 0.00015231645932912467, "loss": 0.0027, "step": 12281 }, { "epoch": 2.5, "learning_rate": 0.00015229707625408358, "loss": 0.0048, "step": 12282 }, { "epoch": 2.5, "learning_rate": 0.000152277693140677, "loss": 0.0156, "step": 12283 }, { "epoch": 2.5, "learning_rate": 0.00015225830998922865, "loss": 0.0137, "step": 12284 }, { "epoch": 2.5, "learning_rate": 0.0001522389268000623, "loss": 0.0091, "step": 12285 }, { "epoch": 2.5, "learning_rate": 0.00015221954357350155, "loss": 0.0143, "step": 12286 }, { "epoch": 2.5, "learning_rate": 0.0001522001603098703, "loss": 0.0178, "step": 12287 }, { "epoch": 2.5, "learning_rate": 0.0001521807770094922, "loss": 0.007, "step": 12288 }, { "epoch": 2.5, "learning_rate": 0.000152161393672691, "loss": 0.0056, "step": 12289 }, { "epoch": 2.5, "learning_rate": 0.00015214201029979047, "loss": 0.0046, "step": 12290 }, { "epoch": 2.5, "learning_rate": 0.00015212262689111433, "loss": 0.0015, "step": 12291 }, { "epoch": 2.5, "learning_rate": 0.0001521032434469863, "loss": 0.0109, "step": 12292 }, { "epoch": 2.5, "learning_rate": 0.0001520838599677301, "loss": 0.0105, "step": 12293 }, { "epoch": 2.5, "learning_rate": 0.00015206447645366953, "loss": 0.012, "step": 12294 }, { "epoch": 2.5, "learning_rate": 0.00015204509290512835, "loss": 0.0024, "step": 12295 }, { "epoch": 2.5, "learning_rate": 0.00015202570932243021, "loss": 0.0043, "step": 12296 }, { "epoch": 2.5, "learning_rate": 0.00015200632570589888, "loss": 0.01, "step": 12297 }, { "epoch": 2.5, "learning_rate": 0.00015198694205585816, "loss": 0.0039, "step": 12298 }, { "epoch": 2.5, "learning_rate": 0.00015196755837263177, "loss": 0.0018, "step": 12299 }, { "epoch": 2.5, "learning_rate": 0.0001519481746565434, "loss": 0.0055, "step": 12300 }, { "epoch": 2.5, "learning_rate": 0.0001519287909079169, "loss": 0.0031, "step": 12301 }, { "epoch": 2.5, "learning_rate": 0.00015190940712707588, "loss": 0.0267, "step": 12302 }, { "epoch": 2.51, "learning_rate": 0.00015189002331434417, "loss": 0.0223, "step": 12303 }, { "epoch": 2.51, "learning_rate": 0.00015187063947004557, "loss": 0.0115, "step": 12304 }, { "epoch": 2.51, "learning_rate": 0.00015185125559450367, "loss": 0.0039, "step": 12305 }, { "epoch": 2.51, "learning_rate": 0.00015183187168804236, "loss": 0.0066, "step": 12306 }, { "epoch": 2.51, "learning_rate": 0.00015181248775098533, "loss": 0.0061, "step": 12307 }, { "epoch": 2.51, "learning_rate": 0.0001517931037836563, "loss": 0.0097, "step": 12308 }, { "epoch": 2.51, "learning_rate": 0.00015177371978637908, "loss": 0.0078, "step": 12309 }, { "epoch": 2.51, "learning_rate": 0.00015175433575947736, "loss": 0.0117, "step": 12310 }, { "epoch": 2.51, "learning_rate": 0.00015173495170327497, "loss": 0.0083, "step": 12311 }, { "epoch": 2.51, "learning_rate": 0.00015171556761809559, "loss": 0.0102, "step": 12312 }, { "epoch": 2.51, "learning_rate": 0.00015169618350426302, "loss": 0.0103, "step": 12313 }, { "epoch": 2.51, "learning_rate": 0.00015167679936210096, "loss": 0.0081, "step": 12314 }, { "epoch": 2.51, "learning_rate": 0.0001516574151919332, "loss": 0.0042, "step": 12315 }, { "epoch": 2.51, "learning_rate": 0.0001516380309940834, "loss": 0.0098, "step": 12316 }, { "epoch": 2.51, "learning_rate": 0.00015161864676887547, "loss": 0.0083, "step": 12317 }, { "epoch": 2.51, "learning_rate": 0.00015159926251663306, "loss": 0.0069, "step": 12318 }, { "epoch": 2.51, "learning_rate": 0.00015157987823767995, "loss": 0.0187, "step": 12319 }, { "epoch": 2.51, "learning_rate": 0.00015156049393233987, "loss": 0.0208, "step": 12320 }, { "epoch": 2.51, "learning_rate": 0.0001515411096009366, "loss": 0.0114, "step": 12321 }, { "epoch": 2.51, "learning_rate": 0.00015152172524379398, "loss": 0.0099, "step": 12322 }, { "epoch": 2.51, "learning_rate": 0.0001515023408612356, "loss": 0.0017, "step": 12323 }, { "epoch": 2.51, "learning_rate": 0.00015148295645358526, "loss": 0.0067, "step": 12324 }, { "epoch": 2.51, "learning_rate": 0.00015146357202116683, "loss": 0.0112, "step": 12325 }, { "epoch": 2.51, "learning_rate": 0.00015144418756430391, "loss": 0.0098, "step": 12326 }, { "epoch": 2.51, "learning_rate": 0.00015142480308332038, "loss": 0.0068, "step": 12327 }, { "epoch": 2.51, "learning_rate": 0.0001514054185785399, "loss": 0.0181, "step": 12328 }, { "epoch": 2.51, "learning_rate": 0.0001513860340502863, "loss": 0.0199, "step": 12329 }, { "epoch": 2.51, "learning_rate": 0.0001513666494988833, "loss": 0.0046, "step": 12330 }, { "epoch": 2.51, "learning_rate": 0.0001513472649246547, "loss": 0.0092, "step": 12331 }, { "epoch": 2.51, "learning_rate": 0.00015132788032792428, "loss": 0.0022, "step": 12332 }, { "epoch": 2.51, "learning_rate": 0.00015130849570901567, "loss": 0.0071, "step": 12333 }, { "epoch": 2.51, "learning_rate": 0.00015128911106825272, "loss": 0.0057, "step": 12334 }, { "epoch": 2.51, "learning_rate": 0.00015126972640595922, "loss": 0.0061, "step": 12335 }, { "epoch": 2.51, "learning_rate": 0.00015125034172245891, "loss": 0.0033, "step": 12336 }, { "epoch": 2.51, "learning_rate": 0.0001512309570180755, "loss": 0.0031, "step": 12337 }, { "epoch": 2.51, "learning_rate": 0.00015121157229313278, "loss": 0.0061, "step": 12338 }, { "epoch": 2.51, "learning_rate": 0.00015119218754795446, "loss": 0.0073, "step": 12339 }, { "epoch": 2.51, "learning_rate": 0.00015117280278286442, "loss": 0.0098, "step": 12340 }, { "epoch": 2.51, "learning_rate": 0.00015115341799818636, "loss": 0.0236, "step": 12341 }, { "epoch": 2.51, "learning_rate": 0.00015113403319424405, "loss": 0.0058, "step": 12342 }, { "epoch": 2.51, "learning_rate": 0.00015111464837136123, "loss": 0.0026, "step": 12343 }, { "epoch": 2.51, "learning_rate": 0.00015109526352986169, "loss": 0.009, "step": 12344 }, { "epoch": 2.51, "learning_rate": 0.0001510758786700692, "loss": 0.0034, "step": 12345 }, { "epoch": 2.51, "learning_rate": 0.00015105649379230744, "loss": 0.0055, "step": 12346 }, { "epoch": 2.51, "learning_rate": 0.0001510371088969003, "loss": 0.0213, "step": 12347 }, { "epoch": 2.51, "learning_rate": 0.00015101772398417148, "loss": 0.0065, "step": 12348 }, { "epoch": 2.51, "learning_rate": 0.0001509983390544447, "loss": 0.0077, "step": 12349 }, { "epoch": 2.51, "learning_rate": 0.0001509789541080438, "loss": 0.0101, "step": 12350 }, { "epoch": 2.51, "learning_rate": 0.00015095956914529252, "loss": 0.0055, "step": 12351 }, { "epoch": 2.52, "learning_rate": 0.00015094018416651463, "loss": 0.0105, "step": 12352 }, { "epoch": 2.52, "learning_rate": 0.00015092079917203386, "loss": 0.0176, "step": 12353 }, { "epoch": 2.52, "learning_rate": 0.00015090141416217406, "loss": 0.0111, "step": 12354 }, { "epoch": 2.52, "learning_rate": 0.0001508820291372589, "loss": 0.0303, "step": 12355 }, { "epoch": 2.52, "learning_rate": 0.00015086264409761222, "loss": 0.0103, "step": 12356 }, { "epoch": 2.52, "learning_rate": 0.00015084325904355771, "loss": 0.004, "step": 12357 }, { "epoch": 2.52, "learning_rate": 0.0001508238739754192, "loss": 0.014, "step": 12358 }, { "epoch": 2.52, "learning_rate": 0.00015080448889352046, "loss": 0.004, "step": 12359 }, { "epoch": 2.52, "learning_rate": 0.0001507851037981852, "loss": 0.0046, "step": 12360 }, { "epoch": 2.52, "learning_rate": 0.00015076571868973725, "loss": 0.0104, "step": 12361 }, { "epoch": 2.52, "learning_rate": 0.00015074633356850037, "loss": 0.0055, "step": 12362 }, { "epoch": 2.52, "learning_rate": 0.0001507269484347983, "loss": 0.0092, "step": 12363 }, { "epoch": 2.52, "learning_rate": 0.00015070756328895485, "loss": 0.0227, "step": 12364 }, { "epoch": 2.52, "learning_rate": 0.00015068817813129368, "loss": 0.0047, "step": 12365 }, { "epoch": 2.52, "learning_rate": 0.00015066879296213867, "loss": 0.0393, "step": 12366 }, { "epoch": 2.52, "learning_rate": 0.00015064940778181357, "loss": 0.0071, "step": 12367 }, { "epoch": 2.52, "learning_rate": 0.0001506300225906421, "loss": 0.0138, "step": 12368 }, { "epoch": 2.52, "learning_rate": 0.0001506106373889481, "loss": 0.0123, "step": 12369 }, { "epoch": 2.52, "learning_rate": 0.00015059125217705527, "loss": 0.0634, "step": 12370 }, { "epoch": 2.52, "learning_rate": 0.00015057186695528743, "loss": 0.0043, "step": 12371 }, { "epoch": 2.52, "learning_rate": 0.00015055248172396836, "loss": 0.0019, "step": 12372 }, { "epoch": 2.52, "learning_rate": 0.0001505330964834218, "loss": 0.0169, "step": 12373 }, { "epoch": 2.52, "learning_rate": 0.00015051371123397147, "loss": 0.018, "step": 12374 }, { "epoch": 2.52, "learning_rate": 0.00015049432597594124, "loss": 0.0047, "step": 12375 }, { "epoch": 2.52, "learning_rate": 0.0001504749407096548, "loss": 0.0122, "step": 12376 }, { "epoch": 2.52, "learning_rate": 0.00015045555543543598, "loss": 0.0079, "step": 12377 }, { "epoch": 2.52, "learning_rate": 0.0001504361701536085, "loss": 0.0019, "step": 12378 }, { "epoch": 2.52, "learning_rate": 0.0001504167848644962, "loss": 0.0107, "step": 12379 }, { "epoch": 2.52, "learning_rate": 0.00015039739956842273, "loss": 0.0076, "step": 12380 }, { "epoch": 2.52, "learning_rate": 0.000150378014265712, "loss": 0.0082, "step": 12381 }, { "epoch": 2.52, "learning_rate": 0.0001503586289566877, "loss": 0.0404, "step": 12382 }, { "epoch": 2.52, "learning_rate": 0.0001503392436416736, "loss": 0.0034, "step": 12383 }, { "epoch": 2.52, "learning_rate": 0.0001503198583209935, "loss": 0.0087, "step": 12384 }, { "epoch": 2.52, "learning_rate": 0.0001503004729949712, "loss": 0.0091, "step": 12385 }, { "epoch": 2.52, "learning_rate": 0.00015028108766393042, "loss": 0.002, "step": 12386 }, { "epoch": 2.52, "learning_rate": 0.00015026170232819493, "loss": 0.0129, "step": 12387 }, { "epoch": 2.52, "learning_rate": 0.00015024231698808853, "loss": 0.0103, "step": 12388 }, { "epoch": 2.52, "learning_rate": 0.00015022293164393497, "loss": 0.0076, "step": 12389 }, { "epoch": 2.52, "learning_rate": 0.00015020354629605802, "loss": 0.0423, "step": 12390 }, { "epoch": 2.52, "learning_rate": 0.00015018416094478147, "loss": 0.017, "step": 12391 }, { "epoch": 2.52, "learning_rate": 0.0001501647755904291, "loss": 0.0025, "step": 12392 }, { "epoch": 2.52, "learning_rate": 0.00015014539023332462, "loss": 0.0138, "step": 12393 }, { "epoch": 2.52, "learning_rate": 0.00015012600487379187, "loss": 0.0031, "step": 12394 }, { "epoch": 2.52, "learning_rate": 0.00015010661951215463, "loss": 0.0175, "step": 12395 }, { "epoch": 2.52, "learning_rate": 0.00015008723414873667, "loss": 0.0148, "step": 12396 }, { "epoch": 2.52, "learning_rate": 0.00015006784878386165, "loss": 0.0064, "step": 12397 }, { "epoch": 2.52, "learning_rate": 0.00015004846341785347, "loss": 0.0055, "step": 12398 }, { "epoch": 2.52, "learning_rate": 0.00015002907805103583, "loss": 0.0038, "step": 12399 }, { "epoch": 2.52, "learning_rate": 0.00015000969268373258, "loss": 0.0069, "step": 12400 }, { "epoch": 2.53, "learning_rate": 0.00014999030731626742, "loss": 0.0065, "step": 12401 }, { "epoch": 2.53, "learning_rate": 0.00014997092194896414, "loss": 0.017, "step": 12402 }, { "epoch": 2.53, "learning_rate": 0.00014995153658214656, "loss": 0.0155, "step": 12403 }, { "epoch": 2.53, "learning_rate": 0.00014993215121613833, "loss": 0.0088, "step": 12404 }, { "epoch": 2.53, "learning_rate": 0.00014991276585126339, "loss": 0.0102, "step": 12405 }, { "epoch": 2.53, "learning_rate": 0.00014989338048784534, "loss": 0.0016, "step": 12406 }, { "epoch": 2.53, "learning_rate": 0.0001498739951262081, "loss": 0.0039, "step": 12407 }, { "epoch": 2.53, "learning_rate": 0.0001498546097666754, "loss": 0.0138, "step": 12408 }, { "epoch": 2.53, "learning_rate": 0.00014983522440957091, "loss": 0.0385, "step": 12409 }, { "epoch": 2.53, "learning_rate": 0.00014981583905521853, "loss": 0.0078, "step": 12410 }, { "epoch": 2.53, "learning_rate": 0.00014979645370394198, "loss": 0.0171, "step": 12411 }, { "epoch": 2.53, "learning_rate": 0.00014977706835606503, "loss": 0.0012, "step": 12412 }, { "epoch": 2.53, "learning_rate": 0.0001497576830119115, "loss": 0.0044, "step": 12413 }, { "epoch": 2.53, "learning_rate": 0.00014973829767180505, "loss": 0.0238, "step": 12414 }, { "epoch": 2.53, "learning_rate": 0.00014971891233606959, "loss": 0.0122, "step": 12415 }, { "epoch": 2.53, "learning_rate": 0.00014969952700502877, "loss": 0.0031, "step": 12416 }, { "epoch": 2.53, "learning_rate": 0.00014968014167900646, "loss": 0.0036, "step": 12417 }, { "epoch": 2.53, "learning_rate": 0.0001496607563583264, "loss": 0.0069, "step": 12418 }, { "epoch": 2.53, "learning_rate": 0.00014964137104331229, "loss": 0.0065, "step": 12419 }, { "epoch": 2.53, "learning_rate": 0.00014962198573428801, "loss": 0.0061, "step": 12420 }, { "epoch": 2.53, "learning_rate": 0.00014960260043157722, "loss": 0.0083, "step": 12421 }, { "epoch": 2.53, "learning_rate": 0.0001495832151355038, "loss": 0.0045, "step": 12422 }, { "epoch": 2.53, "learning_rate": 0.0001495638298463915, "loss": 0.0015, "step": 12423 }, { "epoch": 2.53, "learning_rate": 0.000149544444564564, "loss": 0.0043, "step": 12424 }, { "epoch": 2.53, "learning_rate": 0.0001495250592903452, "loss": 0.0101, "step": 12425 }, { "epoch": 2.53, "learning_rate": 0.0001495056740240588, "loss": 0.011, "step": 12426 }, { "epoch": 2.53, "learning_rate": 0.0001494862887660285, "loss": 0.0024, "step": 12427 }, { "epoch": 2.53, "learning_rate": 0.00014946690351657824, "loss": 0.0101, "step": 12428 }, { "epoch": 2.53, "learning_rate": 0.0001494475182760316, "loss": 0.0015, "step": 12429 }, { "epoch": 2.53, "learning_rate": 0.00014942813304471254, "loss": 0.0057, "step": 12430 }, { "epoch": 2.53, "learning_rate": 0.0001494087478229447, "loss": 0.0299, "step": 12431 }, { "epoch": 2.53, "learning_rate": 0.0001493893626110519, "loss": 0.0123, "step": 12432 }, { "epoch": 2.53, "learning_rate": 0.00014936997740935788, "loss": 0.007, "step": 12433 }, { "epoch": 2.53, "learning_rate": 0.0001493505922181864, "loss": 0.0099, "step": 12434 }, { "epoch": 2.53, "learning_rate": 0.00014933120703786133, "loss": 0.0088, "step": 12435 }, { "epoch": 2.53, "learning_rate": 0.00014931182186870635, "loss": 0.0103, "step": 12436 }, { "epoch": 2.53, "learning_rate": 0.00014929243671104518, "loss": 0.003, "step": 12437 }, { "epoch": 2.53, "learning_rate": 0.0001492730515652017, "loss": 0.0112, "step": 12438 }, { "epoch": 2.53, "learning_rate": 0.0001492536664314996, "loss": 0.0081, "step": 12439 }, { "epoch": 2.53, "learning_rate": 0.00014923428131026272, "loss": 0.0178, "step": 12440 }, { "epoch": 2.53, "learning_rate": 0.00014921489620181477, "loss": 0.0051, "step": 12441 }, { "epoch": 2.53, "learning_rate": 0.00014919551110647954, "loss": 0.0052, "step": 12442 }, { "epoch": 2.53, "learning_rate": 0.00014917612602458077, "loss": 0.0239, "step": 12443 }, { "epoch": 2.53, "learning_rate": 0.00014915674095644226, "loss": 0.01, "step": 12444 }, { "epoch": 2.53, "learning_rate": 0.00014913735590238778, "loss": 0.0114, "step": 12445 }, { "epoch": 2.53, "learning_rate": 0.00014911797086274113, "loss": 0.0179, "step": 12446 }, { "epoch": 2.53, "learning_rate": 0.0001490985858378259, "loss": 0.0038, "step": 12447 }, { "epoch": 2.53, "learning_rate": 0.00014907920082796611, "loss": 0.0157, "step": 12448 }, { "epoch": 2.53, "learning_rate": 0.00014905981583348535, "loss": 0.0076, "step": 12449 }, { "epoch": 2.54, "learning_rate": 0.00014904043085470746, "loss": 0.0043, "step": 12450 }, { "epoch": 2.54, "learning_rate": 0.00014902104589195622, "loss": 0.0081, "step": 12451 }, { "epoch": 2.54, "learning_rate": 0.0001490016609455553, "loss": 0.0082, "step": 12452 }, { "epoch": 2.54, "learning_rate": 0.00014898227601582855, "loss": 0.0015, "step": 12453 }, { "epoch": 2.54, "learning_rate": 0.00014896289110309972, "loss": 0.0064, "step": 12454 }, { "epoch": 2.54, "learning_rate": 0.00014894350620769253, "loss": 0.0036, "step": 12455 }, { "epoch": 2.54, "learning_rate": 0.00014892412132993084, "loss": 0.0047, "step": 12456 }, { "epoch": 2.54, "learning_rate": 0.0001489047364701383, "loss": 0.015, "step": 12457 }, { "epoch": 2.54, "learning_rate": 0.00014888535162863874, "loss": 0.0082, "step": 12458 }, { "epoch": 2.54, "learning_rate": 0.00014886596680575596, "loss": 0.0099, "step": 12459 }, { "epoch": 2.54, "learning_rate": 0.0001488465820018136, "loss": 0.0029, "step": 12460 }, { "epoch": 2.54, "learning_rate": 0.00014882719721713556, "loss": 0.0092, "step": 12461 }, { "epoch": 2.54, "learning_rate": 0.0001488078124520455, "loss": 0.0022, "step": 12462 }, { "epoch": 2.54, "learning_rate": 0.00014878842770686722, "loss": 0.0204, "step": 12463 }, { "epoch": 2.54, "learning_rate": 0.00014876904298192454, "loss": 0.0024, "step": 12464 }, { "epoch": 2.54, "learning_rate": 0.0001487496582775411, "loss": 0.0023, "step": 12465 }, { "epoch": 2.54, "learning_rate": 0.00014873027359404075, "loss": 0.0041, "step": 12466 }, { "epoch": 2.54, "learning_rate": 0.0001487108889317472, "loss": 0.0029, "step": 12467 }, { "epoch": 2.54, "learning_rate": 0.0001486915042909843, "loss": 0.0106, "step": 12468 }, { "epoch": 2.54, "learning_rate": 0.00014867211967207577, "loss": 0.0046, "step": 12469 }, { "epoch": 2.54, "learning_rate": 0.00014865273507534525, "loss": 0.0168, "step": 12470 }, { "epoch": 2.54, "learning_rate": 0.00014863335050111667, "loss": 0.0082, "step": 12471 }, { "epoch": 2.54, "learning_rate": 0.00014861396594971366, "loss": 0.0063, "step": 12472 }, { "epoch": 2.54, "learning_rate": 0.0001485945814214601, "loss": 0.0008, "step": 12473 }, { "epoch": 2.54, "learning_rate": 0.00014857519691667965, "loss": 0.0049, "step": 12474 }, { "epoch": 2.54, "learning_rate": 0.00014855581243569606, "loss": 0.0051, "step": 12475 }, { "epoch": 2.54, "learning_rate": 0.0001485364279788332, "loss": 0.0059, "step": 12476 }, { "epoch": 2.54, "learning_rate": 0.00014851704354641474, "loss": 0.0055, "step": 12477 }, { "epoch": 2.54, "learning_rate": 0.00014849765913876441, "loss": 0.0035, "step": 12478 }, { "epoch": 2.54, "learning_rate": 0.00014847827475620605, "loss": 0.0109, "step": 12479 }, { "epoch": 2.54, "learning_rate": 0.0001484588903990633, "loss": 0.0029, "step": 12480 }, { "epoch": 2.54, "learning_rate": 0.0001484395060676601, "loss": 0.0064, "step": 12481 }, { "epoch": 2.54, "learning_rate": 0.00014842012176232003, "loss": 0.0029, "step": 12482 }, { "epoch": 2.54, "learning_rate": 0.00014840073748336694, "loss": 0.011, "step": 12483 }, { "epoch": 2.54, "learning_rate": 0.00014838135323112453, "loss": 0.0129, "step": 12484 }, { "epoch": 2.54, "learning_rate": 0.00014836196900591656, "loss": 0.0099, "step": 12485 }, { "epoch": 2.54, "learning_rate": 0.0001483425848080668, "loss": 0.0079, "step": 12486 }, { "epoch": 2.54, "learning_rate": 0.00014832320063789907, "loss": 0.0117, "step": 12487 }, { "epoch": 2.54, "learning_rate": 0.00014830381649573695, "loss": 0.0113, "step": 12488 }, { "epoch": 2.54, "learning_rate": 0.0001482844323819044, "loss": 0.0037, "step": 12489 }, { "epoch": 2.54, "learning_rate": 0.00014826504829672498, "loss": 0.0008, "step": 12490 }, { "epoch": 2.54, "learning_rate": 0.0001482456642405226, "loss": 0.0264, "step": 12491 }, { "epoch": 2.54, "learning_rate": 0.00014822628021362094, "loss": 0.0048, "step": 12492 }, { "epoch": 2.54, "learning_rate": 0.0001482068962163437, "loss": 0.0047, "step": 12493 }, { "epoch": 2.54, "learning_rate": 0.00014818751224901467, "loss": 0.0035, "step": 12494 }, { "epoch": 2.54, "learning_rate": 0.00014816812831195764, "loss": 0.0063, "step": 12495 }, { "epoch": 2.54, "learning_rate": 0.0001481487444054963, "loss": 0.0167, "step": 12496 }, { "epoch": 2.54, "learning_rate": 0.00014812936052995446, "loss": 0.0215, "step": 12497 }, { "epoch": 2.54, "learning_rate": 0.00014810997668565577, "loss": 0.0082, "step": 12498 }, { "epoch": 2.55, "learning_rate": 0.00014809059287292412, "loss": 0.0032, "step": 12499 }, { "epoch": 2.55, "learning_rate": 0.00014807120909208316, "loss": 0.0147, "step": 12500 }, { "epoch": 2.55, "learning_rate": 0.00014805182534345657, "loss": 0.0076, "step": 12501 }, { "epoch": 2.55, "learning_rate": 0.00014803244162736826, "loss": 0.0174, "step": 12502 }, { "epoch": 2.55, "learning_rate": 0.00014801305794414182, "loss": 0.0143, "step": 12503 }, { "epoch": 2.55, "learning_rate": 0.00014799367429410112, "loss": 0.0077, "step": 12504 }, { "epoch": 2.55, "learning_rate": 0.0001479742906775698, "loss": 0.005, "step": 12505 }, { "epoch": 2.55, "learning_rate": 0.00014795490709487163, "loss": 0.0126, "step": 12506 }, { "epoch": 2.55, "learning_rate": 0.00014793552354633045, "loss": 0.0066, "step": 12507 }, { "epoch": 2.55, "learning_rate": 0.00014791614003226985, "loss": 0.0118, "step": 12508 }, { "epoch": 2.55, "learning_rate": 0.0001478967565530137, "loss": 0.0035, "step": 12509 }, { "epoch": 2.55, "learning_rate": 0.0001478773731088857, "loss": 0.0138, "step": 12510 }, { "epoch": 2.55, "learning_rate": 0.00014785798970020953, "loss": 0.0164, "step": 12511 }, { "epoch": 2.55, "learning_rate": 0.00014783860632730902, "loss": 0.0079, "step": 12512 }, { "epoch": 2.55, "learning_rate": 0.00014781922299050777, "loss": 0.0011, "step": 12513 }, { "epoch": 2.55, "learning_rate": 0.0001477998396901297, "loss": 0.0038, "step": 12514 }, { "epoch": 2.55, "learning_rate": 0.00014778045642649846, "loss": 0.0181, "step": 12515 }, { "epoch": 2.55, "learning_rate": 0.0001477610731999377, "loss": 0.003, "step": 12516 }, { "epoch": 2.55, "learning_rate": 0.00014774169001077135, "loss": 0.0223, "step": 12517 }, { "epoch": 2.55, "learning_rate": 0.00014772230685932295, "loss": 0.0092, "step": 12518 }, { "epoch": 2.55, "learning_rate": 0.0001477029237459164, "loss": 0.0042, "step": 12519 }, { "epoch": 2.55, "learning_rate": 0.00014768354067087536, "loss": 0.0074, "step": 12520 }, { "epoch": 2.55, "learning_rate": 0.00014766415763452348, "loss": 0.0106, "step": 12521 }, { "epoch": 2.55, "learning_rate": 0.00014764477463718466, "loss": 0.0144, "step": 12522 }, { "epoch": 2.55, "learning_rate": 0.0001476253916791825, "loss": 0.0088, "step": 12523 }, { "epoch": 2.55, "learning_rate": 0.00014760600876084082, "loss": 0.0015, "step": 12524 }, { "epoch": 2.55, "learning_rate": 0.0001475866258824833, "loss": 0.0091, "step": 12525 }, { "epoch": 2.55, "learning_rate": 0.00014756724304443365, "loss": 0.0072, "step": 12526 }, { "epoch": 2.55, "learning_rate": 0.00014754786024701567, "loss": 0.0089, "step": 12527 }, { "epoch": 2.55, "learning_rate": 0.00014752847749055308, "loss": 0.0029, "step": 12528 }, { "epoch": 2.55, "learning_rate": 0.0001475090947753695, "loss": 0.0041, "step": 12529 }, { "epoch": 2.55, "learning_rate": 0.00014748971210178883, "loss": 0.0144, "step": 12530 }, { "epoch": 2.55, "learning_rate": 0.0001474703294701346, "loss": 0.0132, "step": 12531 }, { "epoch": 2.55, "learning_rate": 0.00014745094688073073, "loss": 0.0034, "step": 12532 }, { "epoch": 2.55, "learning_rate": 0.00014743156433390088, "loss": 0.0102, "step": 12533 }, { "epoch": 2.55, "learning_rate": 0.00014741218182996867, "loss": 0.0236, "step": 12534 }, { "epoch": 2.55, "learning_rate": 0.00014739279936925792, "loss": 0.0019, "step": 12535 }, { "epoch": 2.55, "learning_rate": 0.00014737341695209239, "loss": 0.0152, "step": 12536 }, { "epoch": 2.55, "learning_rate": 0.0001473540345787957, "loss": 0.0168, "step": 12537 }, { "epoch": 2.55, "learning_rate": 0.0001473346522496917, "loss": 0.0078, "step": 12538 }, { "epoch": 2.55, "learning_rate": 0.00014731526996510395, "loss": 0.0059, "step": 12539 }, { "epoch": 2.55, "learning_rate": 0.00014729588772535634, "loss": 0.0173, "step": 12540 }, { "epoch": 2.55, "learning_rate": 0.00014727650553077244, "loss": 0.0053, "step": 12541 }, { "epoch": 2.55, "learning_rate": 0.0001472571233816761, "loss": 0.0095, "step": 12542 }, { "epoch": 2.55, "learning_rate": 0.00014723774127839098, "loss": 0.0163, "step": 12543 }, { "epoch": 2.55, "learning_rate": 0.00014721835922124074, "loss": 0.0062, "step": 12544 }, { "epoch": 2.55, "learning_rate": 0.00014719897721054918, "loss": 0.008, "step": 12545 }, { "epoch": 2.55, "learning_rate": 0.00014717959524663998, "loss": 0.0011, "step": 12546 }, { "epoch": 2.55, "learning_rate": 0.00014716021332983684, "loss": 0.0031, "step": 12547 }, { "epoch": 2.56, "learning_rate": 0.00014714083146046355, "loss": 0.0031, "step": 12548 }, { "epoch": 2.56, "learning_rate": 0.0001471214496388437, "loss": 0.0121, "step": 12549 }, { "epoch": 2.56, "learning_rate": 0.0001471020678653012, "loss": 0.0108, "step": 12550 }, { "epoch": 2.56, "learning_rate": 0.00014708268614015957, "loss": 0.0053, "step": 12551 }, { "epoch": 2.56, "learning_rate": 0.00014706330446374253, "loss": 0.0164, "step": 12552 }, { "epoch": 2.56, "learning_rate": 0.00014704392283637394, "loss": 0.0026, "step": 12553 }, { "epoch": 2.56, "learning_rate": 0.00014702454125837733, "loss": 0.0073, "step": 12554 }, { "epoch": 2.56, "learning_rate": 0.00014700515973007657, "loss": 0.0033, "step": 12555 }, { "epoch": 2.56, "learning_rate": 0.00014698577825179526, "loss": 0.0098, "step": 12556 }, { "epoch": 2.56, "learning_rate": 0.00014696639682385714, "loss": 0.0312, "step": 12557 }, { "epoch": 2.56, "learning_rate": 0.00014694701544658596, "loss": 0.0066, "step": 12558 }, { "epoch": 2.56, "learning_rate": 0.0001469276341203053, "loss": 0.002, "step": 12559 }, { "epoch": 2.56, "learning_rate": 0.00014690825284533902, "loss": 0.0018, "step": 12560 }, { "epoch": 2.56, "learning_rate": 0.00014688887162201078, "loss": 0.017, "step": 12561 }, { "epoch": 2.56, "learning_rate": 0.0001468694904506442, "loss": 0.0034, "step": 12562 }, { "epoch": 2.56, "learning_rate": 0.00014685010933156308, "loss": 0.013, "step": 12563 }, { "epoch": 2.56, "learning_rate": 0.000146830728265091, "loss": 0.0037, "step": 12564 }, { "epoch": 2.56, "learning_rate": 0.00014681134725155181, "loss": 0.0053, "step": 12565 }, { "epoch": 2.56, "learning_rate": 0.00014679196629126912, "loss": 0.005, "step": 12566 }, { "epoch": 2.56, "learning_rate": 0.00014677258538456665, "loss": 0.0111, "step": 12567 }, { "epoch": 2.56, "learning_rate": 0.00014675320453176813, "loss": 0.0103, "step": 12568 }, { "epoch": 2.56, "learning_rate": 0.00014673382373319712, "loss": 0.0052, "step": 12569 }, { "epoch": 2.56, "learning_rate": 0.00014671444298917753, "loss": 0.0052, "step": 12570 }, { "epoch": 2.56, "learning_rate": 0.00014669506230003296, "loss": 0.0085, "step": 12571 }, { "epoch": 2.56, "learning_rate": 0.00014667568166608697, "loss": 0.0084, "step": 12572 }, { "epoch": 2.56, "learning_rate": 0.00014665630108766348, "loss": 0.0009, "step": 12573 }, { "epoch": 2.56, "learning_rate": 0.00014663692056508606, "loss": 0.0169, "step": 12574 }, { "epoch": 2.56, "learning_rate": 0.00014661754009867833, "loss": 0.0092, "step": 12575 }, { "epoch": 2.56, "learning_rate": 0.00014659815968876417, "loss": 0.0412, "step": 12576 }, { "epoch": 2.56, "learning_rate": 0.00014657877933566706, "loss": 0.0076, "step": 12577 }, { "epoch": 2.56, "learning_rate": 0.00014655939903971085, "loss": 0.0021, "step": 12578 }, { "epoch": 2.56, "learning_rate": 0.00014654001880121917, "loss": 0.0017, "step": 12579 }, { "epoch": 2.56, "learning_rate": 0.00014652063862051568, "loss": 0.0071, "step": 12580 }, { "epoch": 2.56, "learning_rate": 0.00014650125849792416, "loss": 0.0051, "step": 12581 }, { "epoch": 2.56, "learning_rate": 0.00014648187843376814, "loss": 0.0065, "step": 12582 }, { "epoch": 2.56, "learning_rate": 0.00014646249842837147, "loss": 0.0147, "step": 12583 }, { "epoch": 2.56, "learning_rate": 0.00014644311848205775, "loss": 0.0065, "step": 12584 }, { "epoch": 2.56, "learning_rate": 0.00014642373859515058, "loss": 0.0086, "step": 12585 }, { "epoch": 2.56, "learning_rate": 0.00014640435876797381, "loss": 0.0049, "step": 12586 }, { "epoch": 2.56, "learning_rate": 0.00014638497900085098, "loss": 0.0081, "step": 12587 }, { "epoch": 2.56, "learning_rate": 0.00014636559929410585, "loss": 0.0026, "step": 12588 }, { "epoch": 2.56, "learning_rate": 0.0001463462196480621, "loss": 0.0009, "step": 12589 }, { "epoch": 2.56, "learning_rate": 0.0001463268400630433, "loss": 0.0038, "step": 12590 }, { "epoch": 2.56, "learning_rate": 0.0001463074605393733, "loss": 0.0017, "step": 12591 }, { "epoch": 2.56, "learning_rate": 0.0001462880810773756, "loss": 0.0191, "step": 12592 }, { "epoch": 2.56, "learning_rate": 0.00014626870167737402, "loss": 0.0073, "step": 12593 }, { "epoch": 2.56, "learning_rate": 0.00014624932233969217, "loss": 0.0042, "step": 12594 }, { "epoch": 2.56, "learning_rate": 0.00014622994306465363, "loss": 0.0115, "step": 12595 }, { "epoch": 2.56, "learning_rate": 0.00014621056385258224, "loss": 0.0035, "step": 12596 }, { "epoch": 2.56, "learning_rate": 0.0001461911847038015, "loss": 0.0313, "step": 12597 }, { "epoch": 2.57, "learning_rate": 0.00014617180561863526, "loss": 0.0171, "step": 12598 }, { "epoch": 2.57, "learning_rate": 0.00014615242659740706, "loss": 0.0004, "step": 12599 }, { "epoch": 2.57, "learning_rate": 0.00014613304764044053, "loss": 0.0162, "step": 12600 }, { "epoch": 2.57, "learning_rate": 0.00014611366874805952, "loss": 0.0064, "step": 12601 }, { "epoch": 2.57, "learning_rate": 0.00014609428992058755, "loss": 0.0135, "step": 12602 }, { "epoch": 2.57, "learning_rate": 0.00014607491115834823, "loss": 0.0164, "step": 12603 }, { "epoch": 2.57, "learning_rate": 0.00014605553246166539, "loss": 0.0046, "step": 12604 }, { "epoch": 2.57, "learning_rate": 0.00014603615383086254, "loss": 0.0073, "step": 12605 }, { "epoch": 2.57, "learning_rate": 0.00014601677526626346, "loss": 0.0031, "step": 12606 }, { "epoch": 2.57, "learning_rate": 0.00014599739676819174, "loss": 0.0084, "step": 12607 }, { "epoch": 2.57, "learning_rate": 0.000145978018336971, "loss": 0.0095, "step": 12608 }, { "epoch": 2.57, "learning_rate": 0.00014595863997292498, "loss": 0.0068, "step": 12609 }, { "epoch": 2.57, "learning_rate": 0.0001459392616763773, "loss": 0.0089, "step": 12610 }, { "epoch": 2.57, "learning_rate": 0.00014591988344765162, "loss": 0.0014, "step": 12611 }, { "epoch": 2.57, "learning_rate": 0.00014590050528707162, "loss": 0.0014, "step": 12612 }, { "epoch": 2.57, "learning_rate": 0.00014588112719496086, "loss": 0.0051, "step": 12613 }, { "epoch": 2.57, "learning_rate": 0.00014586174917164308, "loss": 0.0084, "step": 12614 }, { "epoch": 2.57, "learning_rate": 0.00014584237121744185, "loss": 0.0062, "step": 12615 }, { "epoch": 2.57, "learning_rate": 0.00014582299333268096, "loss": 0.0207, "step": 12616 }, { "epoch": 2.57, "learning_rate": 0.00014580361551768395, "loss": 0.0006, "step": 12617 }, { "epoch": 2.57, "learning_rate": 0.0001457842377727744, "loss": 0.01, "step": 12618 }, { "epoch": 2.57, "learning_rate": 0.0001457648600982761, "loss": 0.0053, "step": 12619 }, { "epoch": 2.57, "learning_rate": 0.00014574548249451263, "loss": 0.0042, "step": 12620 }, { "epoch": 2.57, "learning_rate": 0.0001457261049618076, "loss": 0.0126, "step": 12621 }, { "epoch": 2.57, "learning_rate": 0.00014570672750048474, "loss": 0.0045, "step": 12622 }, { "epoch": 2.57, "learning_rate": 0.00014568735011086757, "loss": 0.0085, "step": 12623 }, { "epoch": 2.57, "learning_rate": 0.00014566797279327986, "loss": 0.0026, "step": 12624 }, { "epoch": 2.57, "learning_rate": 0.00014564859554804516, "loss": 0.002, "step": 12625 }, { "epoch": 2.57, "learning_rate": 0.00014562921837548708, "loss": 0.0196, "step": 12626 }, { "epoch": 2.57, "learning_rate": 0.0001456098412759294, "loss": 0.0059, "step": 12627 }, { "epoch": 2.57, "learning_rate": 0.00014559046424969554, "loss": 0.0027, "step": 12628 }, { "epoch": 2.57, "learning_rate": 0.00014557108729710934, "loss": 0.0069, "step": 12629 }, { "epoch": 2.57, "learning_rate": 0.0001455517104184943, "loss": 0.022, "step": 12630 }, { "epoch": 2.57, "learning_rate": 0.00014553233361417408, "loss": 0.012, "step": 12631 }, { "epoch": 2.57, "learning_rate": 0.00014551295688447236, "loss": 0.0109, "step": 12632 }, { "epoch": 2.57, "learning_rate": 0.00014549358022971268, "loss": 0.0053, "step": 12633 }, { "epoch": 2.57, "learning_rate": 0.0001454742036502188, "loss": 0.0072, "step": 12634 }, { "epoch": 2.57, "learning_rate": 0.00014545482714631424, "loss": 0.006, "step": 12635 }, { "epoch": 2.57, "learning_rate": 0.00014543545071832257, "loss": 0.0019, "step": 12636 }, { "epoch": 2.57, "learning_rate": 0.00014541607436656758, "loss": 0.0036, "step": 12637 }, { "epoch": 2.57, "learning_rate": 0.00014539669809137271, "loss": 0.0029, "step": 12638 }, { "epoch": 2.57, "learning_rate": 0.00014537732189306177, "loss": 0.0034, "step": 12639 }, { "epoch": 2.57, "learning_rate": 0.0001453579457719582, "loss": 0.0161, "step": 12640 }, { "epoch": 2.57, "learning_rate": 0.0001453385697283857, "loss": 0.0093, "step": 12641 }, { "epoch": 2.57, "learning_rate": 0.00014531919376266795, "loss": 0.0138, "step": 12642 }, { "epoch": 2.57, "learning_rate": 0.00014529981787512843, "loss": 0.0025, "step": 12643 }, { "epoch": 2.57, "learning_rate": 0.0001452804420660909, "loss": 0.0009, "step": 12644 }, { "epoch": 2.57, "learning_rate": 0.00014526106633587886, "loss": 0.0034, "step": 12645 }, { "epoch": 2.57, "learning_rate": 0.00014524169068481593, "loss": 0.0022, "step": 12646 }, { "epoch": 2.58, "learning_rate": 0.0001452223151132258, "loss": 0.0099, "step": 12647 }, { "epoch": 2.58, "learning_rate": 0.000145202939621432, "loss": 0.0131, "step": 12648 }, { "epoch": 2.58, "learning_rate": 0.00014518356420975816, "loss": 0.0046, "step": 12649 }, { "epoch": 2.58, "learning_rate": 0.00014516418887852787, "loss": 0.0069, "step": 12650 }, { "epoch": 2.58, "learning_rate": 0.00014514481362806476, "loss": 0.0106, "step": 12651 }, { "epoch": 2.58, "learning_rate": 0.00014512543845869244, "loss": 0.0027, "step": 12652 }, { "epoch": 2.58, "learning_rate": 0.00014510606337073454, "loss": 0.0032, "step": 12653 }, { "epoch": 2.58, "learning_rate": 0.00014508668836451453, "loss": 0.0028, "step": 12654 }, { "epoch": 2.58, "learning_rate": 0.0001450673134403562, "loss": 0.007, "step": 12655 }, { "epoch": 2.58, "learning_rate": 0.00014504793859858293, "loss": 0.0151, "step": 12656 }, { "epoch": 2.58, "learning_rate": 0.00014502856383951854, "loss": 0.006, "step": 12657 }, { "epoch": 2.58, "learning_rate": 0.0001450091891634865, "loss": 0.0036, "step": 12658 }, { "epoch": 2.58, "learning_rate": 0.00014498981457081037, "loss": 0.0135, "step": 12659 }, { "epoch": 2.58, "learning_rate": 0.0001449704400618138, "loss": 0.0079, "step": 12660 }, { "epoch": 2.58, "learning_rate": 0.0001449510656368204, "loss": 0.0033, "step": 12661 }, { "epoch": 2.58, "learning_rate": 0.00014493169129615373, "loss": 0.0435, "step": 12662 }, { "epoch": 2.58, "learning_rate": 0.0001449123170401374, "loss": 0.0177, "step": 12663 }, { "epoch": 2.58, "learning_rate": 0.00014489294286909493, "loss": 0.0134, "step": 12664 }, { "epoch": 2.58, "learning_rate": 0.00014487356878335002, "loss": 0.0087, "step": 12665 }, { "epoch": 2.58, "learning_rate": 0.00014485419478322612, "loss": 0.0085, "step": 12666 }, { "epoch": 2.58, "learning_rate": 0.00014483482086904696, "loss": 0.0033, "step": 12667 }, { "epoch": 2.58, "learning_rate": 0.00014481544704113603, "loss": 0.0017, "step": 12668 }, { "epoch": 2.58, "learning_rate": 0.00014479607329981683, "loss": 0.0041, "step": 12669 }, { "epoch": 2.58, "learning_rate": 0.00014477669964541314, "loss": 0.016, "step": 12670 }, { "epoch": 2.58, "learning_rate": 0.0001447573260782483, "loss": 0.0047, "step": 12671 }, { "epoch": 2.58, "learning_rate": 0.0001447379525986461, "loss": 0.0097, "step": 12672 }, { "epoch": 2.58, "learning_rate": 0.00014471857920693004, "loss": 0.0019, "step": 12673 }, { "epoch": 2.58, "learning_rate": 0.0001446992059034236, "loss": 0.0228, "step": 12674 }, { "epoch": 2.58, "learning_rate": 0.0001446798326884505, "loss": 0.0046, "step": 12675 }, { "epoch": 2.58, "learning_rate": 0.00014466045956233422, "loss": 0.01, "step": 12676 }, { "epoch": 2.58, "learning_rate": 0.00014464108652539832, "loss": 0.0201, "step": 12677 }, { "epoch": 2.58, "learning_rate": 0.0001446217135779664, "loss": 0.004, "step": 12678 }, { "epoch": 2.58, "learning_rate": 0.000144602340720362, "loss": 0.0101, "step": 12679 }, { "epoch": 2.58, "learning_rate": 0.00014458296795290875, "loss": 0.0023, "step": 12680 }, { "epoch": 2.58, "learning_rate": 0.00014456359527593012, "loss": 0.0086, "step": 12681 }, { "epoch": 2.58, "learning_rate": 0.00014454422268974973, "loss": 0.0204, "step": 12682 }, { "epoch": 2.58, "learning_rate": 0.0001445248501946911, "loss": 0.012, "step": 12683 }, { "epoch": 2.58, "learning_rate": 0.00014450547779107777, "loss": 0.0037, "step": 12684 }, { "epoch": 2.58, "learning_rate": 0.0001444861054792334, "loss": 0.0046, "step": 12685 }, { "epoch": 2.58, "learning_rate": 0.00014446673325948148, "loss": 0.0061, "step": 12686 }, { "epoch": 2.58, "learning_rate": 0.0001444473611321455, "loss": 0.0062, "step": 12687 }, { "epoch": 2.58, "learning_rate": 0.00014442798909754915, "loss": 0.0045, "step": 12688 }, { "epoch": 2.58, "learning_rate": 0.0001444086171560158, "loss": 0.0125, "step": 12689 }, { "epoch": 2.58, "learning_rate": 0.0001443892453078692, "loss": 0.0164, "step": 12690 }, { "epoch": 2.58, "learning_rate": 0.00014436987355343273, "loss": 0.0043, "step": 12691 }, { "epoch": 2.58, "learning_rate": 0.00014435050189303002, "loss": 0.0035, "step": 12692 }, { "epoch": 2.58, "learning_rate": 0.0001443311303269846, "loss": 0.0145, "step": 12693 }, { "epoch": 2.58, "learning_rate": 0.00014431175885561994, "loss": 0.014, "step": 12694 }, { "epoch": 2.58, "learning_rate": 0.00014429238747925972, "loss": 0.0127, "step": 12695 }, { "epoch": 2.59, "learning_rate": 0.0001442730161982274, "loss": 0.0032, "step": 12696 }, { "epoch": 2.59, "learning_rate": 0.00014425364501284647, "loss": 0.0108, "step": 12697 }, { "epoch": 2.59, "learning_rate": 0.00014423427392344057, "loss": 0.0111, "step": 12698 }, { "epoch": 2.59, "learning_rate": 0.0001442149029303332, "loss": 0.0078, "step": 12699 }, { "epoch": 2.59, "learning_rate": 0.0001441955320338478, "loss": 0.008, "step": 12700 }, { "epoch": 2.59, "learning_rate": 0.00014417616123430798, "loss": 0.0093, "step": 12701 }, { "epoch": 2.59, "learning_rate": 0.00014415679053203726, "loss": 0.0042, "step": 12702 }, { "epoch": 2.59, "learning_rate": 0.0001441374199273592, "loss": 0.0059, "step": 12703 }, { "epoch": 2.59, "learning_rate": 0.0001441180494205973, "loss": 0.0048, "step": 12704 }, { "epoch": 2.59, "learning_rate": 0.00014409867901207503, "loss": 0.016, "step": 12705 }, { "epoch": 2.59, "learning_rate": 0.000144079308702116, "loss": 0.0034, "step": 12706 }, { "epoch": 2.59, "learning_rate": 0.00014405993849104365, "loss": 0.0076, "step": 12707 }, { "epoch": 2.59, "learning_rate": 0.0001440405683791816, "loss": 0.0024, "step": 12708 }, { "epoch": 2.59, "learning_rate": 0.0001440211983668533, "loss": 0.0057, "step": 12709 }, { "epoch": 2.59, "learning_rate": 0.0001440018284543822, "loss": 0.0119, "step": 12710 }, { "epoch": 2.59, "learning_rate": 0.000143982458642092, "loss": 0.0113, "step": 12711 }, { "epoch": 2.59, "learning_rate": 0.00014396308893030598, "loss": 0.0102, "step": 12712 }, { "epoch": 2.59, "learning_rate": 0.00014394371931934782, "loss": 0.0052, "step": 12713 }, { "epoch": 2.59, "learning_rate": 0.000143924349809541, "loss": 0.0044, "step": 12714 }, { "epoch": 2.59, "learning_rate": 0.00014390498040120896, "loss": 0.009, "step": 12715 }, { "epoch": 2.59, "learning_rate": 0.00014388561109467533, "loss": 0.0013, "step": 12716 }, { "epoch": 2.59, "learning_rate": 0.00014386624189026344, "loss": 0.0027, "step": 12717 }, { "epoch": 2.59, "learning_rate": 0.00014384687278829698, "loss": 0.0083, "step": 12718 }, { "epoch": 2.59, "learning_rate": 0.00014382750378909932, "loss": 0.0135, "step": 12719 }, { "epoch": 2.59, "learning_rate": 0.00014380813489299398, "loss": 0.0224, "step": 12720 }, { "epoch": 2.59, "learning_rate": 0.00014378876610030453, "loss": 0.0067, "step": 12721 }, { "epoch": 2.59, "learning_rate": 0.00014376939741135437, "loss": 0.021, "step": 12722 }, { "epoch": 2.59, "learning_rate": 0.00014375002882646704, "loss": 0.0072, "step": 12723 }, { "epoch": 2.59, "learning_rate": 0.000143730660345966, "loss": 0.0089, "step": 12724 }, { "epoch": 2.59, "learning_rate": 0.00014371129197017477, "loss": 0.0028, "step": 12725 }, { "epoch": 2.59, "learning_rate": 0.00014369192369941686, "loss": 0.005, "step": 12726 }, { "epoch": 2.59, "learning_rate": 0.00014367255553401578, "loss": 0.0034, "step": 12727 }, { "epoch": 2.59, "learning_rate": 0.00014365318747429487, "loss": 0.0018, "step": 12728 }, { "epoch": 2.59, "learning_rate": 0.00014363381952057778, "loss": 0.0031, "step": 12729 }, { "epoch": 2.59, "learning_rate": 0.00014361445167318786, "loss": 0.0072, "step": 12730 }, { "epoch": 2.59, "learning_rate": 0.0001435950839324487, "loss": 0.0053, "step": 12731 }, { "epoch": 2.59, "learning_rate": 0.0001435757162986837, "loss": 0.0104, "step": 12732 }, { "epoch": 2.59, "learning_rate": 0.00014355634877221638, "loss": 0.0066, "step": 12733 }, { "epoch": 2.59, "learning_rate": 0.0001435369813533702, "loss": 0.0106, "step": 12734 }, { "epoch": 2.59, "learning_rate": 0.00014351761404246863, "loss": 0.0275, "step": 12735 }, { "epoch": 2.59, "learning_rate": 0.00014349824683983513, "loss": 0.0036, "step": 12736 }, { "epoch": 2.59, "learning_rate": 0.00014347887974579322, "loss": 0.0169, "step": 12737 }, { "epoch": 2.59, "learning_rate": 0.00014345951276066625, "loss": 0.0029, "step": 12738 }, { "epoch": 2.59, "learning_rate": 0.00014344014588477783, "loss": 0.0134, "step": 12739 }, { "epoch": 2.59, "learning_rate": 0.0001434207791184513, "loss": 0.0128, "step": 12740 }, { "epoch": 2.59, "learning_rate": 0.00014340141246201024, "loss": 0.0351, "step": 12741 }, { "epoch": 2.59, "learning_rate": 0.00014338204591577805, "loss": 0.0034, "step": 12742 }, { "epoch": 2.59, "learning_rate": 0.00014336267948007815, "loss": 0.0049, "step": 12743 }, { "epoch": 2.59, "learning_rate": 0.00014334331315523402, "loss": 0.0028, "step": 12744 }, { "epoch": 2.6, "learning_rate": 0.00014332394694156913, "loss": 0.0127, "step": 12745 }, { "epoch": 2.6, "learning_rate": 0.00014330458083940695, "loss": 0.0072, "step": 12746 }, { "epoch": 2.6, "learning_rate": 0.00014328521484907093, "loss": 0.0126, "step": 12747 }, { "epoch": 2.6, "learning_rate": 0.00014326584897088443, "loss": 0.0259, "step": 12748 }, { "epoch": 2.6, "learning_rate": 0.00014324648320517103, "loss": 0.0086, "step": 12749 }, { "epoch": 2.6, "learning_rate": 0.00014322711755225412, "loss": 0.0228, "step": 12750 }, { "epoch": 2.6, "learning_rate": 0.00014320775201245704, "loss": 0.0052, "step": 12751 }, { "epoch": 2.6, "learning_rate": 0.0001431883865861034, "loss": 0.011, "step": 12752 }, { "epoch": 2.6, "learning_rate": 0.0001431690212735165, "loss": 0.0078, "step": 12753 }, { "epoch": 2.6, "learning_rate": 0.00014314965607501988, "loss": 0.0123, "step": 12754 }, { "epoch": 2.6, "learning_rate": 0.00014313029099093696, "loss": 0.0035, "step": 12755 }, { "epoch": 2.6, "learning_rate": 0.00014311092602159106, "loss": 0.004, "step": 12756 }, { "epoch": 2.6, "learning_rate": 0.00014309156116730582, "loss": 0.0116, "step": 12757 }, { "epoch": 2.6, "learning_rate": 0.00014307219642840444, "loss": 0.0108, "step": 12758 }, { "epoch": 2.6, "learning_rate": 0.00014305283180521052, "loss": 0.0201, "step": 12759 }, { "epoch": 2.6, "learning_rate": 0.00014303346729804744, "loss": 0.0352, "step": 12760 }, { "epoch": 2.6, "learning_rate": 0.00014301410290723854, "loss": 0.0092, "step": 12761 }, { "epoch": 2.6, "learning_rate": 0.00014299473863310736, "loss": 0.0146, "step": 12762 }, { "epoch": 2.6, "learning_rate": 0.0001429753744759772, "loss": 0.0105, "step": 12763 }, { "epoch": 2.6, "learning_rate": 0.00014295601043617164, "loss": 0.0148, "step": 12764 }, { "epoch": 2.6, "learning_rate": 0.00014293664651401396, "loss": 0.0063, "step": 12765 }, { "epoch": 2.6, "learning_rate": 0.00014291728270982758, "loss": 0.0016, "step": 12766 }, { "epoch": 2.6, "learning_rate": 0.000142897919023936, "loss": 0.002, "step": 12767 }, { "epoch": 2.6, "learning_rate": 0.00014287855545666253, "loss": 0.0059, "step": 12768 }, { "epoch": 2.6, "learning_rate": 0.00014285919200833068, "loss": 0.0117, "step": 12769 }, { "epoch": 2.6, "learning_rate": 0.00014283982867926382, "loss": 0.0118, "step": 12770 }, { "epoch": 2.6, "learning_rate": 0.00014282046546978527, "loss": 0.0012, "step": 12771 }, { "epoch": 2.6, "learning_rate": 0.00014280110238021855, "loss": 0.0176, "step": 12772 }, { "epoch": 2.6, "learning_rate": 0.00014278173941088698, "loss": 0.0245, "step": 12773 }, { "epoch": 2.6, "learning_rate": 0.00014276237656211398, "loss": 0.0093, "step": 12774 }, { "epoch": 2.6, "learning_rate": 0.00014274301383422296, "loss": 0.0093, "step": 12775 }, { "epoch": 2.6, "learning_rate": 0.00014272365122753732, "loss": 0.003, "step": 12776 }, { "epoch": 2.6, "learning_rate": 0.00014270428874238044, "loss": 0.019, "step": 12777 }, { "epoch": 2.6, "learning_rate": 0.0001426849263790757, "loss": 0.0279, "step": 12778 }, { "epoch": 2.6, "learning_rate": 0.00014266556413794647, "loss": 0.0133, "step": 12779 }, { "epoch": 2.6, "learning_rate": 0.00014264620201931622, "loss": 0.0064, "step": 12780 }, { "epoch": 2.6, "learning_rate": 0.00014262684002350822, "loss": 0.0161, "step": 12781 }, { "epoch": 2.6, "learning_rate": 0.00014260747815084596, "loss": 0.0038, "step": 12782 }, { "epoch": 2.6, "learning_rate": 0.00014258811640165277, "loss": 0.0089, "step": 12783 }, { "epoch": 2.6, "learning_rate": 0.00014256875477625198, "loss": 0.0205, "step": 12784 }, { "epoch": 2.6, "learning_rate": 0.00014254939327496704, "loss": 0.0075, "step": 12785 }, { "epoch": 2.6, "learning_rate": 0.00014253003189812128, "loss": 0.0069, "step": 12786 }, { "epoch": 2.6, "learning_rate": 0.00014251067064603812, "loss": 0.0008, "step": 12787 }, { "epoch": 2.6, "learning_rate": 0.0001424913095190409, "loss": 0.0073, "step": 12788 }, { "epoch": 2.6, "learning_rate": 0.00014247194851745292, "loss": 0.0118, "step": 12789 }, { "epoch": 2.6, "learning_rate": 0.0001424525876415977, "loss": 0.0051, "step": 12790 }, { "epoch": 2.6, "learning_rate": 0.00014243322689179842, "loss": 0.0115, "step": 12791 }, { "epoch": 2.6, "learning_rate": 0.0001424138662683786, "loss": 0.0091, "step": 12792 }, { "epoch": 2.6, "learning_rate": 0.00014239450577166156, "loss": 0.0085, "step": 12793 }, { "epoch": 2.61, "learning_rate": 0.00014237514540197055, "loss": 0.0098, "step": 12794 }, { "epoch": 2.61, "learning_rate": 0.0001423557851596291, "loss": 0.01, "step": 12795 }, { "epoch": 2.61, "learning_rate": 0.00014233642504496034, "loss": 0.0091, "step": 12796 }, { "epoch": 2.61, "learning_rate": 0.00014231706505828782, "loss": 0.012, "step": 12797 }, { "epoch": 2.61, "learning_rate": 0.00014229770519993482, "loss": 0.0095, "step": 12798 }, { "epoch": 2.61, "learning_rate": 0.00014227834547022466, "loss": 0.0096, "step": 12799 }, { "epoch": 2.61, "learning_rate": 0.00014225898586948076, "loss": 0.0045, "step": 12800 }, { "epoch": 2.61, "learning_rate": 0.00014223962639802636, "loss": 0.0046, "step": 12801 }, { "epoch": 2.61, "learning_rate": 0.00014222026705618484, "loss": 0.005, "step": 12802 }, { "epoch": 2.61, "learning_rate": 0.00014220090784427958, "loss": 0.013, "step": 12803 }, { "epoch": 2.61, "learning_rate": 0.00014218154876263382, "loss": 0.0116, "step": 12804 }, { "epoch": 2.61, "learning_rate": 0.00014216218981157104, "loss": 0.0025, "step": 12805 }, { "epoch": 2.61, "learning_rate": 0.00014214283099141443, "loss": 0.0128, "step": 12806 }, { "epoch": 2.61, "learning_rate": 0.00014212347230248737, "loss": 0.0167, "step": 12807 }, { "epoch": 2.61, "learning_rate": 0.0001421041137451132, "loss": 0.0033, "step": 12808 }, { "epoch": 2.61, "learning_rate": 0.00014208475531961523, "loss": 0.0044, "step": 12809 }, { "epoch": 2.61, "learning_rate": 0.00014206539702631683, "loss": 0.0028, "step": 12810 }, { "epoch": 2.61, "learning_rate": 0.00014204603886554127, "loss": 0.0037, "step": 12811 }, { "epoch": 2.61, "learning_rate": 0.0001420266808376118, "loss": 0.0051, "step": 12812 }, { "epoch": 2.61, "learning_rate": 0.00014200732294285191, "loss": 0.0118, "step": 12813 }, { "epoch": 2.61, "learning_rate": 0.00014198796518158471, "loss": 0.0044, "step": 12814 }, { "epoch": 2.61, "learning_rate": 0.0001419686075541337, "loss": 0.0159, "step": 12815 }, { "epoch": 2.61, "learning_rate": 0.00014194925006082208, "loss": 0.007, "step": 12816 }, { "epoch": 2.61, "learning_rate": 0.0001419298927019732, "loss": 0.0039, "step": 12817 }, { "epoch": 2.61, "learning_rate": 0.0001419105354779103, "loss": 0.0106, "step": 12818 }, { "epoch": 2.61, "learning_rate": 0.00014189117838895668, "loss": 0.022, "step": 12819 }, { "epoch": 2.61, "learning_rate": 0.00014187182143543582, "loss": 0.0254, "step": 12820 }, { "epoch": 2.61, "learning_rate": 0.00014185246461767084, "loss": 0.0076, "step": 12821 }, { "epoch": 2.61, "learning_rate": 0.00014183310793598503, "loss": 0.0005, "step": 12822 }, { "epoch": 2.61, "learning_rate": 0.0001418137513907018, "loss": 0.0064, "step": 12823 }, { "epoch": 2.61, "learning_rate": 0.00014179439498214437, "loss": 0.0177, "step": 12824 }, { "epoch": 2.61, "learning_rate": 0.00014177503871063595, "loss": 0.0074, "step": 12825 }, { "epoch": 2.61, "learning_rate": 0.00014175568257649996, "loss": 0.0102, "step": 12826 }, { "epoch": 2.61, "learning_rate": 0.00014173632658005963, "loss": 0.0052, "step": 12827 }, { "epoch": 2.61, "learning_rate": 0.00014171697072163825, "loss": 0.0104, "step": 12828 }, { "epoch": 2.61, "learning_rate": 0.0001416976150015591, "loss": 0.0033, "step": 12829 }, { "epoch": 2.61, "learning_rate": 0.00014167825942014542, "loss": 0.0142, "step": 12830 }, { "epoch": 2.61, "learning_rate": 0.00014165890397772058, "loss": 0.0029, "step": 12831 }, { "epoch": 2.61, "learning_rate": 0.00014163954867460772, "loss": 0.0045, "step": 12832 }, { "epoch": 2.61, "learning_rate": 0.00014162019351113023, "loss": 0.0044, "step": 12833 }, { "epoch": 2.61, "learning_rate": 0.00014160083848761135, "loss": 0.0188, "step": 12834 }, { "epoch": 2.61, "learning_rate": 0.0001415814836043742, "loss": 0.0213, "step": 12835 }, { "epoch": 2.61, "learning_rate": 0.0001415621288617423, "loss": 0.0066, "step": 12836 }, { "epoch": 2.61, "learning_rate": 0.00014154277426003866, "loss": 0.0267, "step": 12837 }, { "epoch": 2.61, "learning_rate": 0.00014152341979958673, "loss": 0.009, "step": 12838 }, { "epoch": 2.61, "learning_rate": 0.0001415040654807097, "loss": 0.0099, "step": 12839 }, { "epoch": 2.61, "learning_rate": 0.00014148471130373075, "loss": 0.0022, "step": 12840 }, { "epoch": 2.61, "learning_rate": 0.00014146535726897326, "loss": 0.0082, "step": 12841 }, { "epoch": 2.61, "learning_rate": 0.00014144600337676034, "loss": 0.0071, "step": 12842 }, { "epoch": 2.62, "learning_rate": 0.0001414266496274154, "loss": 0.0046, "step": 12843 }, { "epoch": 2.62, "learning_rate": 0.00014140729602126156, "loss": 0.0017, "step": 12844 }, { "epoch": 2.62, "learning_rate": 0.00014138794255862206, "loss": 0.0093, "step": 12845 }, { "epoch": 2.62, "learning_rate": 0.00014136858923982022, "loss": 0.0136, "step": 12846 }, { "epoch": 2.62, "learning_rate": 0.0001413492360651792, "loss": 0.0053, "step": 12847 }, { "epoch": 2.62, "learning_rate": 0.0001413298830350223, "loss": 0.0105, "step": 12848 }, { "epoch": 2.62, "learning_rate": 0.00014131053014967268, "loss": 0.0089, "step": 12849 }, { "epoch": 2.62, "learning_rate": 0.00014129117740945357, "loss": 0.0005, "step": 12850 }, { "epoch": 2.62, "learning_rate": 0.00014127182481468833, "loss": 0.0059, "step": 12851 }, { "epoch": 2.62, "learning_rate": 0.0001412524723657001, "loss": 0.0086, "step": 12852 }, { "epoch": 2.62, "learning_rate": 0.000141233120062812, "loss": 0.0071, "step": 12853 }, { "epoch": 2.62, "learning_rate": 0.00014121376790634743, "loss": 0.0059, "step": 12854 }, { "epoch": 2.62, "learning_rate": 0.00014119441589662945, "loss": 0.0099, "step": 12855 }, { "epoch": 2.62, "learning_rate": 0.0001411750640339814, "loss": 0.009, "step": 12856 }, { "epoch": 2.62, "learning_rate": 0.00014115571231872642, "loss": 0.0019, "step": 12857 }, { "epoch": 2.62, "learning_rate": 0.00014113636075118775, "loss": 0.0187, "step": 12858 }, { "epoch": 2.62, "learning_rate": 0.00014111700933168856, "loss": 0.0118, "step": 12859 }, { "epoch": 2.62, "learning_rate": 0.0001410976580605521, "loss": 0.0108, "step": 12860 }, { "epoch": 2.62, "learning_rate": 0.00014107830693810156, "loss": 0.0251, "step": 12861 }, { "epoch": 2.62, "learning_rate": 0.00014105895596466014, "loss": 0.0079, "step": 12862 }, { "epoch": 2.62, "learning_rate": 0.00014103960514055098, "loss": 0.007, "step": 12863 }, { "epoch": 2.62, "learning_rate": 0.0001410202544660974, "loss": 0.0081, "step": 12864 }, { "epoch": 2.62, "learning_rate": 0.00014100090394162247, "loss": 0.0075, "step": 12865 }, { "epoch": 2.62, "learning_rate": 0.00014098155356744946, "loss": 0.0014, "step": 12866 }, { "epoch": 2.62, "learning_rate": 0.00014096220334390157, "loss": 0.011, "step": 12867 }, { "epoch": 2.62, "learning_rate": 0.00014094285327130183, "loss": 0.0183, "step": 12868 }, { "epoch": 2.62, "learning_rate": 0.00014092350334997362, "loss": 0.0186, "step": 12869 }, { "epoch": 2.62, "learning_rate": 0.00014090415358024002, "loss": 0.0081, "step": 12870 }, { "epoch": 2.62, "learning_rate": 0.0001408848039624242, "loss": 0.0009, "step": 12871 }, { "epoch": 2.62, "learning_rate": 0.00014086545449684942, "loss": 0.0017, "step": 12872 }, { "epoch": 2.62, "learning_rate": 0.00014084610518383872, "loss": 0.0059, "step": 12873 }, { "epoch": 2.62, "learning_rate": 0.0001408267560237154, "loss": 0.0127, "step": 12874 }, { "epoch": 2.62, "learning_rate": 0.00014080740701680257, "loss": 0.0115, "step": 12875 }, { "epoch": 2.62, "learning_rate": 0.00014078805816342336, "loss": 0.0107, "step": 12876 }, { "epoch": 2.62, "learning_rate": 0.000140768709463901, "loss": 0.0166, "step": 12877 }, { "epoch": 2.62, "learning_rate": 0.00014074936091855857, "loss": 0.0045, "step": 12878 }, { "epoch": 2.62, "learning_rate": 0.00014073001252771928, "loss": 0.0042, "step": 12879 }, { "epoch": 2.62, "learning_rate": 0.00014071066429170633, "loss": 0.0071, "step": 12880 }, { "epoch": 2.62, "learning_rate": 0.00014069131621084277, "loss": 0.0223, "step": 12881 }, { "epoch": 2.62, "learning_rate": 0.00014067196828545185, "loss": 0.0159, "step": 12882 }, { "epoch": 2.62, "learning_rate": 0.0001406526205158566, "loss": 0.0071, "step": 12883 }, { "epoch": 2.62, "learning_rate": 0.0001406332729023803, "loss": 0.0059, "step": 12884 }, { "epoch": 2.62, "learning_rate": 0.00014061392544534602, "loss": 0.0032, "step": 12885 }, { "epoch": 2.62, "learning_rate": 0.00014059457814507686, "loss": 0.0129, "step": 12886 }, { "epoch": 2.62, "learning_rate": 0.00014057523100189604, "loss": 0.0014, "step": 12887 }, { "epoch": 2.62, "learning_rate": 0.0001405558840161266, "loss": 0.006, "step": 12888 }, { "epoch": 2.62, "learning_rate": 0.00014053653718809178, "loss": 0.0047, "step": 12889 }, { "epoch": 2.62, "learning_rate": 0.00014051719051811463, "loss": 0.0051, "step": 12890 }, { "epoch": 2.62, "learning_rate": 0.00014049784400651825, "loss": 0.0142, "step": 12891 }, { "epoch": 2.63, "learning_rate": 0.0001404784976536259, "loss": 0.0093, "step": 12892 }, { "epoch": 2.63, "learning_rate": 0.0001404591514597605, "loss": 0.0043, "step": 12893 }, { "epoch": 2.63, "learning_rate": 0.0001404398054252454, "loss": 0.0071, "step": 12894 }, { "epoch": 2.63, "learning_rate": 0.00014042045955040358, "loss": 0.0085, "step": 12895 }, { "epoch": 2.63, "learning_rate": 0.00014040111383555807, "loss": 0.0112, "step": 12896 }, { "epoch": 2.63, "learning_rate": 0.0001403817682810322, "loss": 0.0121, "step": 12897 }, { "epoch": 2.63, "learning_rate": 0.00014036242288714888, "loss": 0.0207, "step": 12898 }, { "epoch": 2.63, "learning_rate": 0.0001403430776542313, "loss": 0.0082, "step": 12899 }, { "epoch": 2.63, "learning_rate": 0.00014032373258260255, "loss": 0.0033, "step": 12900 }, { "epoch": 2.63, "learning_rate": 0.00014030438767258574, "loss": 0.0045, "step": 12901 }, { "epoch": 2.63, "learning_rate": 0.00014028504292450396, "loss": 0.0072, "step": 12902 }, { "epoch": 2.63, "learning_rate": 0.00014026569833868033, "loss": 0.005, "step": 12903 }, { "epoch": 2.63, "learning_rate": 0.00014024635391543785, "loss": 0.0071, "step": 12904 }, { "epoch": 2.63, "learning_rate": 0.0001402270096550997, "loss": 0.0017, "step": 12905 }, { "epoch": 2.63, "learning_rate": 0.00014020766555798892, "loss": 0.0175, "step": 12906 }, { "epoch": 2.63, "learning_rate": 0.00014018832162442866, "loss": 0.0126, "step": 12907 }, { "epoch": 2.63, "learning_rate": 0.00014016897785474193, "loss": 0.0149, "step": 12908 }, { "epoch": 2.63, "learning_rate": 0.00014014963424925178, "loss": 0.0115, "step": 12909 }, { "epoch": 2.63, "learning_rate": 0.00014013029080828137, "loss": 0.0096, "step": 12910 }, { "epoch": 2.63, "learning_rate": 0.00014011094753215374, "loss": 0.0055, "step": 12911 }, { "epoch": 2.63, "learning_rate": 0.00014009160442119193, "loss": 0.0005, "step": 12912 }, { "epoch": 2.63, "learning_rate": 0.00014007226147571907, "loss": 0.0072, "step": 12913 }, { "epoch": 2.63, "learning_rate": 0.00014005291869605813, "loss": 0.0059, "step": 12914 }, { "epoch": 2.63, "learning_rate": 0.00014003357608253228, "loss": 0.0088, "step": 12915 }, { "epoch": 2.63, "learning_rate": 0.00014001423363546445, "loss": 0.0026, "step": 12916 }, { "epoch": 2.63, "learning_rate": 0.00013999489135517785, "loss": 0.0185, "step": 12917 }, { "epoch": 2.63, "learning_rate": 0.00013997554924199545, "loss": 0.0178, "step": 12918 }, { "epoch": 2.63, "learning_rate": 0.0001399562072962402, "loss": 0.0068, "step": 12919 }, { "epoch": 2.63, "learning_rate": 0.00013993686551823535, "loss": 0.0171, "step": 12920 }, { "epoch": 2.63, "learning_rate": 0.0001399175239083038, "loss": 0.0055, "step": 12921 }, { "epoch": 2.63, "learning_rate": 0.0001398981824667686, "loss": 0.0064, "step": 12922 }, { "epoch": 2.63, "learning_rate": 0.0001398788411939529, "loss": 0.0216, "step": 12923 }, { "epoch": 2.63, "learning_rate": 0.00013985950009017954, "loss": 0.0086, "step": 12924 }, { "epoch": 2.63, "learning_rate": 0.00013984015915577178, "loss": 0.0911, "step": 12925 }, { "epoch": 2.63, "learning_rate": 0.00013982081839105254, "loss": 0.0027, "step": 12926 }, { "epoch": 2.63, "learning_rate": 0.00013980147779634478, "loss": 0.0064, "step": 12927 }, { "epoch": 2.63, "learning_rate": 0.00013978213737197165, "loss": 0.0064, "step": 12928 }, { "epoch": 2.63, "learning_rate": 0.00013976279711825604, "loss": 0.0081, "step": 12929 }, { "epoch": 2.63, "learning_rate": 0.00013974345703552112, "loss": 0.0068, "step": 12930 }, { "epoch": 2.63, "learning_rate": 0.00013972411712408978, "loss": 0.0059, "step": 12931 }, { "epoch": 2.63, "learning_rate": 0.00013970477738428505, "loss": 0.0089, "step": 12932 }, { "epoch": 2.63, "learning_rate": 0.00013968543781643004, "loss": 0.0359, "step": 12933 }, { "epoch": 2.63, "learning_rate": 0.00013966609842084763, "loss": 0.0136, "step": 12934 }, { "epoch": 2.63, "learning_rate": 0.00013964675919786096, "loss": 0.0103, "step": 12935 }, { "epoch": 2.63, "learning_rate": 0.00013962742014779296, "loss": 0.0111, "step": 12936 }, { "epoch": 2.63, "learning_rate": 0.00013960808127096651, "loss": 0.0091, "step": 12937 }, { "epoch": 2.63, "learning_rate": 0.00013958874256770484, "loss": 0.002, "step": 12938 }, { "epoch": 2.63, "learning_rate": 0.0001395694040383307, "loss": 0.0052, "step": 12939 }, { "epoch": 2.63, "learning_rate": 0.00013955006568316732, "loss": 0.0033, "step": 12940 }, { "epoch": 2.64, "learning_rate": 0.00013953072750253753, "loss": 0.0067, "step": 12941 }, { "epoch": 2.64, "learning_rate": 0.00013951138949676434, "loss": 0.0137, "step": 12942 }, { "epoch": 2.64, "learning_rate": 0.00013949205166617073, "loss": 0.0151, "step": 12943 }, { "epoch": 2.64, "learning_rate": 0.00013947271401107967, "loss": 0.0178, "step": 12944 }, { "epoch": 2.64, "learning_rate": 0.0001394533765318142, "loss": 0.0067, "step": 12945 }, { "epoch": 2.64, "learning_rate": 0.0001394340392286973, "loss": 0.0086, "step": 12946 }, { "epoch": 2.64, "learning_rate": 0.00013941470210205177, "loss": 0.0259, "step": 12947 }, { "epoch": 2.64, "learning_rate": 0.0001393953651522008, "loss": 0.0065, "step": 12948 }, { "epoch": 2.64, "learning_rate": 0.00013937602837946724, "loss": 0.0115, "step": 12949 }, { "epoch": 2.64, "learning_rate": 0.00013935669178417398, "loss": 0.0103, "step": 12950 }, { "epoch": 2.64, "learning_rate": 0.0001393373553666441, "loss": 0.0107, "step": 12951 }, { "epoch": 2.64, "learning_rate": 0.00013931801912720054, "loss": 0.0055, "step": 12952 }, { "epoch": 2.64, "learning_rate": 0.0001392986830661662, "loss": 0.003, "step": 12953 }, { "epoch": 2.64, "learning_rate": 0.0001392793471838641, "loss": 0.0017, "step": 12954 }, { "epoch": 2.64, "learning_rate": 0.00013926001148061704, "loss": 0.0211, "step": 12955 }, { "epoch": 2.64, "learning_rate": 0.00013924067595674815, "loss": 0.0073, "step": 12956 }, { "epoch": 2.64, "learning_rate": 0.00013922134061258022, "loss": 0.0094, "step": 12957 }, { "epoch": 2.64, "learning_rate": 0.0001392020054484363, "loss": 0.0086, "step": 12958 }, { "epoch": 2.64, "learning_rate": 0.00013918267046463928, "loss": 0.0102, "step": 12959 }, { "epoch": 2.64, "learning_rate": 0.00013916333566151202, "loss": 0.0023, "step": 12960 }, { "epoch": 2.64, "learning_rate": 0.00013914400103937755, "loss": 0.0076, "step": 12961 }, { "epoch": 2.64, "learning_rate": 0.00013912466659855873, "loss": 0.0084, "step": 12962 }, { "epoch": 2.64, "learning_rate": 0.00013910533233937853, "loss": 0.0019, "step": 12963 }, { "epoch": 2.64, "learning_rate": 0.00013908599826215987, "loss": 0.0029, "step": 12964 }, { "epoch": 2.64, "learning_rate": 0.00013906666436722554, "loss": 0.0017, "step": 12965 }, { "epoch": 2.64, "learning_rate": 0.00013904733065489867, "loss": 0.0116, "step": 12966 }, { "epoch": 2.64, "learning_rate": 0.00013902799712550197, "loss": 0.0081, "step": 12967 }, { "epoch": 2.64, "learning_rate": 0.00013900866377935847, "loss": 0.0048, "step": 12968 }, { "epoch": 2.64, "learning_rate": 0.00013898933061679109, "loss": 0.0182, "step": 12969 }, { "epoch": 2.64, "learning_rate": 0.00013896999763812255, "loss": 0.013, "step": 12970 }, { "epoch": 2.64, "learning_rate": 0.00013895066484367595, "loss": 0.0099, "step": 12971 }, { "epoch": 2.64, "learning_rate": 0.0001389313322337741, "loss": 0.0039, "step": 12972 }, { "epoch": 2.64, "learning_rate": 0.00013891199980873987, "loss": 0.0049, "step": 12973 }, { "epoch": 2.64, "learning_rate": 0.00013889266756889618, "loss": 0.0125, "step": 12974 }, { "epoch": 2.64, "learning_rate": 0.00013887333551456586, "loss": 0.0045, "step": 12975 }, { "epoch": 2.64, "learning_rate": 0.0001388540036460719, "loss": 0.0065, "step": 12976 }, { "epoch": 2.64, "learning_rate": 0.00013883467196373715, "loss": 0.0031, "step": 12977 }, { "epoch": 2.64, "learning_rate": 0.00013881534046788439, "loss": 0.0115, "step": 12978 }, { "epoch": 2.64, "learning_rate": 0.0001387960091588366, "loss": 0.0187, "step": 12979 }, { "epoch": 2.64, "learning_rate": 0.00013877667803691656, "loss": 0.0016, "step": 12980 }, { "epoch": 2.64, "learning_rate": 0.00013875734710244722, "loss": 0.0065, "step": 12981 }, { "epoch": 2.64, "learning_rate": 0.0001387380163557514, "loss": 0.0068, "step": 12982 }, { "epoch": 2.64, "learning_rate": 0.00013871868579715195, "loss": 0.0035, "step": 12983 }, { "epoch": 2.64, "learning_rate": 0.00013869935542697176, "loss": 0.012, "step": 12984 }, { "epoch": 2.64, "learning_rate": 0.0001386800252455336, "loss": 0.012, "step": 12985 }, { "epoch": 2.64, "learning_rate": 0.0001386606952531605, "loss": 0.0032, "step": 12986 }, { "epoch": 2.64, "learning_rate": 0.00013864136545017514, "loss": 0.0264, "step": 12987 }, { "epoch": 2.64, "learning_rate": 0.0001386220358369004, "loss": 0.0078, "step": 12988 }, { "epoch": 2.64, "learning_rate": 0.00013860270641365916, "loss": 0.0119, "step": 12989 }, { "epoch": 2.65, "learning_rate": 0.0001385833771807742, "loss": 0.0226, "step": 12990 }, { "epoch": 2.65, "learning_rate": 0.00013856404813856845, "loss": 0.0038, "step": 12991 }, { "epoch": 2.65, "learning_rate": 0.00013854471928736464, "loss": 0.0026, "step": 12992 }, { "epoch": 2.65, "learning_rate": 0.00013852539062748567, "loss": 0.0176, "step": 12993 }, { "epoch": 2.65, "learning_rate": 0.0001385060621592543, "loss": 0.0057, "step": 12994 }, { "epoch": 2.65, "learning_rate": 0.00013848673388299347, "loss": 0.0077, "step": 12995 }, { "epoch": 2.65, "learning_rate": 0.0001384674057990258, "loss": 0.0044, "step": 12996 }, { "epoch": 2.65, "learning_rate": 0.00013844807790767432, "loss": 0.0084, "step": 12997 }, { "epoch": 2.65, "learning_rate": 0.00013842875020926167, "loss": 0.0084, "step": 12998 }, { "epoch": 2.65, "learning_rate": 0.0001384094227041108, "loss": 0.0182, "step": 12999 }, { "epoch": 2.65, "learning_rate": 0.00013839009539254443, "loss": 0.0026, "step": 13000 }, { "epoch": 2.65, "learning_rate": 0.00013837076827488535, "loss": 0.0165, "step": 13001 }, { "epoch": 2.65, "learning_rate": 0.00013835144135145643, "loss": 0.0149, "step": 13002 }, { "epoch": 2.65, "learning_rate": 0.00013833211462258038, "loss": 0.0019, "step": 13003 }, { "epoch": 2.65, "learning_rate": 0.00013831278808858004, "loss": 0.0095, "step": 13004 }, { "epoch": 2.65, "learning_rate": 0.00013829346174977828, "loss": 0.0057, "step": 13005 }, { "epoch": 2.65, "learning_rate": 0.0001382741356064977, "loss": 0.0042, "step": 13006 }, { "epoch": 2.65, "learning_rate": 0.0001382548096590613, "loss": 0.012, "step": 13007 }, { "epoch": 2.65, "learning_rate": 0.00013823548390779167, "loss": 0.0063, "step": 13008 }, { "epoch": 2.65, "learning_rate": 0.0001382161583530117, "loss": 0.0091, "step": 13009 }, { "epoch": 2.65, "learning_rate": 0.00013819683299504416, "loss": 0.0053, "step": 13010 }, { "epoch": 2.65, "learning_rate": 0.0001381775078342117, "loss": 0.0035, "step": 13011 }, { "epoch": 2.65, "learning_rate": 0.00013815818287083725, "loss": 0.0103, "step": 13012 }, { "epoch": 2.65, "learning_rate": 0.00013813885810524344, "loss": 0.0061, "step": 13013 }, { "epoch": 2.65, "learning_rate": 0.00013811953353775315, "loss": 0.0078, "step": 13014 }, { "epoch": 2.65, "learning_rate": 0.00013810020916868907, "loss": 0.0075, "step": 13015 }, { "epoch": 2.65, "learning_rate": 0.00013808088499837388, "loss": 0.022, "step": 13016 }, { "epoch": 2.65, "learning_rate": 0.0001380615610271305, "loss": 0.0085, "step": 13017 }, { "epoch": 2.65, "learning_rate": 0.00013804223725528153, "loss": 0.0224, "step": 13018 }, { "epoch": 2.65, "learning_rate": 0.0001380229136831498, "loss": 0.0129, "step": 13019 }, { "epoch": 2.65, "learning_rate": 0.00013800359031105805, "loss": 0.0053, "step": 13020 }, { "epoch": 2.65, "learning_rate": 0.00013798426713932893, "loss": 0.0168, "step": 13021 }, { "epoch": 2.65, "learning_rate": 0.00013796494416828527, "loss": 0.0055, "step": 13022 }, { "epoch": 2.65, "learning_rate": 0.00013794562139824975, "loss": 0.0205, "step": 13023 }, { "epoch": 2.65, "learning_rate": 0.0001379262988295451, "loss": 0.0086, "step": 13024 }, { "epoch": 2.65, "learning_rate": 0.000137906976462494, "loss": 0.0094, "step": 13025 }, { "epoch": 2.65, "learning_rate": 0.00013788765429741928, "loss": 0.0202, "step": 13026 }, { "epoch": 2.65, "learning_rate": 0.00013786833233464358, "loss": 0.003, "step": 13027 }, { "epoch": 2.65, "learning_rate": 0.00013784901057448966, "loss": 0.0073, "step": 13028 }, { "epoch": 2.65, "learning_rate": 0.00013782968901728015, "loss": 0.0091, "step": 13029 }, { "epoch": 2.65, "learning_rate": 0.00013781036766333785, "loss": 0.0055, "step": 13030 }, { "epoch": 2.65, "learning_rate": 0.00013779104651298537, "loss": 0.0078, "step": 13031 }, { "epoch": 2.65, "learning_rate": 0.00013777172556654553, "loss": 0.0068, "step": 13032 }, { "epoch": 2.65, "learning_rate": 0.00013775240482434092, "loss": 0.0056, "step": 13033 }, { "epoch": 2.65, "learning_rate": 0.00013773308428669426, "loss": 0.0015, "step": 13034 }, { "epoch": 2.65, "learning_rate": 0.00013771376395392822, "loss": 0.0051, "step": 13035 }, { "epoch": 2.65, "learning_rate": 0.00013769444382636555, "loss": 0.017, "step": 13036 }, { "epoch": 2.65, "learning_rate": 0.00013767512390432888, "loss": 0.0151, "step": 13037 }, { "epoch": 2.65, "learning_rate": 0.00013765580418814097, "loss": 0.0028, "step": 13038 }, { "epoch": 2.65, "learning_rate": 0.00013763648467812433, "loss": 0.0147, "step": 13039 }, { "epoch": 2.66, "learning_rate": 0.00013761716537460182, "loss": 0.0138, "step": 13040 }, { "epoch": 2.66, "learning_rate": 0.00013759784627789595, "loss": 0.0266, "step": 13041 }, { "epoch": 2.66, "learning_rate": 0.00013757852738832953, "loss": 0.0118, "step": 13042 }, { "epoch": 2.66, "learning_rate": 0.00013755920870622514, "loss": 0.0078, "step": 13043 }, { "epoch": 2.66, "learning_rate": 0.0001375398902319054, "loss": 0.0114, "step": 13044 }, { "epoch": 2.66, "learning_rate": 0.00013752057196569304, "loss": 0.0062, "step": 13045 }, { "epoch": 2.66, "learning_rate": 0.0001375012539079107, "loss": 0.0061, "step": 13046 }, { "epoch": 2.66, "learning_rate": 0.00013748193605888094, "loss": 0.0159, "step": 13047 }, { "epoch": 2.66, "learning_rate": 0.00013746261841892656, "loss": 0.0058, "step": 13048 }, { "epoch": 2.66, "learning_rate": 0.00013744330098837006, "loss": 0.0119, "step": 13049 }, { "epoch": 2.66, "learning_rate": 0.00013742398376753417, "loss": 0.0096, "step": 13050 }, { "epoch": 2.66, "learning_rate": 0.00013740466675674152, "loss": 0.0036, "step": 13051 }, { "epoch": 2.66, "learning_rate": 0.00013738534995631465, "loss": 0.0072, "step": 13052 }, { "epoch": 2.66, "learning_rate": 0.00013736603336657628, "loss": 0.0091, "step": 13053 }, { "epoch": 2.66, "learning_rate": 0.00013734671698784897, "loss": 0.0106, "step": 13054 }, { "epoch": 2.66, "learning_rate": 0.00013732740082045543, "loss": 0.0029, "step": 13055 }, { "epoch": 2.66, "learning_rate": 0.00013730808486471817, "loss": 0.0151, "step": 13056 }, { "epoch": 2.66, "learning_rate": 0.00013728876912095982, "loss": 0.0187, "step": 13057 }, { "epoch": 2.66, "learning_rate": 0.0001372694535895031, "loss": 0.0105, "step": 13058 }, { "epoch": 2.66, "learning_rate": 0.00013725013827067047, "loss": 0.0078, "step": 13059 }, { "epoch": 2.66, "learning_rate": 0.00013723082316478464, "loss": 0.0048, "step": 13060 }, { "epoch": 2.66, "learning_rate": 0.00013721150827216818, "loss": 0.0097, "step": 13061 }, { "epoch": 2.66, "learning_rate": 0.00013719219359314362, "loss": 0.0095, "step": 13062 }, { "epoch": 2.66, "learning_rate": 0.00013717287912803366, "loss": 0.0145, "step": 13063 }, { "epoch": 2.66, "learning_rate": 0.00013715356487716075, "loss": 0.0084, "step": 13064 }, { "epoch": 2.66, "learning_rate": 0.00013713425084084765, "loss": 0.0071, "step": 13065 }, { "epoch": 2.66, "learning_rate": 0.00013711493701941679, "loss": 0.0118, "step": 13066 }, { "epoch": 2.66, "learning_rate": 0.0001370956234131908, "loss": 0.0117, "step": 13067 }, { "epoch": 2.66, "learning_rate": 0.00013707631002249227, "loss": 0.0022, "step": 13068 }, { "epoch": 2.66, "learning_rate": 0.0001370569968476438, "loss": 0.0065, "step": 13069 }, { "epoch": 2.66, "learning_rate": 0.00013703768388896785, "loss": 0.0276, "step": 13070 }, { "epoch": 2.66, "learning_rate": 0.00013701837114678709, "loss": 0.0055, "step": 13071 }, { "epoch": 2.66, "learning_rate": 0.00013699905862142397, "loss": 0.0064, "step": 13072 }, { "epoch": 2.66, "learning_rate": 0.0001369797463132012, "loss": 0.0073, "step": 13073 }, { "epoch": 2.66, "learning_rate": 0.00013696043422244125, "loss": 0.0072, "step": 13074 }, { "epoch": 2.66, "learning_rate": 0.00013694112234946657, "loss": 0.0146, "step": 13075 }, { "epoch": 2.66, "learning_rate": 0.00013692181069459983, "loss": 0.0114, "step": 13076 }, { "epoch": 2.66, "learning_rate": 0.00013690249925816356, "loss": 0.0024, "step": 13077 }, { "epoch": 2.66, "learning_rate": 0.00013688318804048027, "loss": 0.0028, "step": 13078 }, { "epoch": 2.66, "learning_rate": 0.00013686387704187254, "loss": 0.0089, "step": 13079 }, { "epoch": 2.66, "learning_rate": 0.00013684456626266277, "loss": 0.0068, "step": 13080 }, { "epoch": 2.66, "learning_rate": 0.00013682525570317365, "loss": 0.0032, "step": 13081 }, { "epoch": 2.66, "learning_rate": 0.00013680594536372756, "loss": 0.0042, "step": 13082 }, { "epoch": 2.66, "learning_rate": 0.00013678663524464718, "loss": 0.0041, "step": 13083 }, { "epoch": 2.66, "learning_rate": 0.0001367673253462549, "loss": 0.002, "step": 13084 }, { "epoch": 2.66, "learning_rate": 0.00013674801566887322, "loss": 0.0029, "step": 13085 }, { "epoch": 2.66, "learning_rate": 0.00013672870621282473, "loss": 0.0134, "step": 13086 }, { "epoch": 2.66, "learning_rate": 0.00013670939697843187, "loss": 0.0118, "step": 13087 }, { "epoch": 2.66, "learning_rate": 0.0001366900879660172, "loss": 0.0183, "step": 13088 }, { "epoch": 2.67, "learning_rate": 0.0001366707791759032, "loss": 0.019, "step": 13089 }, { "epoch": 2.67, "learning_rate": 0.00013665147060841227, "loss": 0.007, "step": 13090 }, { "epoch": 2.67, "learning_rate": 0.00013663216226386706, "loss": 0.0074, "step": 13091 }, { "epoch": 2.67, "learning_rate": 0.0001366128541425899, "loss": 0.0025, "step": 13092 }, { "epoch": 2.67, "learning_rate": 0.00013659354624490343, "loss": 0.0111, "step": 13093 }, { "epoch": 2.67, "learning_rate": 0.00013657423857113004, "loss": 0.015, "step": 13094 }, { "epoch": 2.67, "learning_rate": 0.00013655493112159212, "loss": 0.0186, "step": 13095 }, { "epoch": 2.67, "learning_rate": 0.00013653562389661232, "loss": 0.0045, "step": 13096 }, { "epoch": 2.67, "learning_rate": 0.00013651631689651298, "loss": 0.0022, "step": 13097 }, { "epoch": 2.67, "learning_rate": 0.0001364970101216166, "loss": 0.0033, "step": 13098 }, { "epoch": 2.67, "learning_rate": 0.00013647770357224563, "loss": 0.009, "step": 13099 }, { "epoch": 2.67, "learning_rate": 0.0001364583972487225, "loss": 0.006, "step": 13100 }, { "epoch": 2.67, "learning_rate": 0.0001364390911513698, "loss": 0.0008, "step": 13101 }, { "epoch": 2.67, "learning_rate": 0.00013641978528050982, "loss": 0.0036, "step": 13102 }, { "epoch": 2.67, "learning_rate": 0.00013640047963646502, "loss": 0.0193, "step": 13103 }, { "epoch": 2.67, "learning_rate": 0.00013638117421955795, "loss": 0.013, "step": 13104 }, { "epoch": 2.67, "learning_rate": 0.0001363618690301109, "loss": 0.0028, "step": 13105 }, { "epoch": 2.67, "learning_rate": 0.00013634256406844646, "loss": 0.0148, "step": 13106 }, { "epoch": 2.67, "learning_rate": 0.00013632325933488694, "loss": 0.0146, "step": 13107 }, { "epoch": 2.67, "learning_rate": 0.0001363039548297548, "loss": 0.0077, "step": 13108 }, { "epoch": 2.67, "learning_rate": 0.0001362846505533725, "loss": 0.0096, "step": 13109 }, { "epoch": 2.67, "learning_rate": 0.00013626534650606237, "loss": 0.0253, "step": 13110 }, { "epoch": 2.67, "learning_rate": 0.00013624604268814693, "loss": 0.0042, "step": 13111 }, { "epoch": 2.67, "learning_rate": 0.00013622673909994857, "loss": 0.0059, "step": 13112 }, { "epoch": 2.67, "learning_rate": 0.00013620743574178958, "loss": 0.0093, "step": 13113 }, { "epoch": 2.67, "learning_rate": 0.00013618813261399252, "loss": 0.0159, "step": 13114 }, { "epoch": 2.67, "learning_rate": 0.00013616882971687966, "loss": 0.0037, "step": 13115 }, { "epoch": 2.67, "learning_rate": 0.0001361495270507735, "loss": 0.0091, "step": 13116 }, { "epoch": 2.67, "learning_rate": 0.00013613022461599636, "loss": 0.0023, "step": 13117 }, { "epoch": 2.67, "learning_rate": 0.00013611092241287066, "loss": 0.0087, "step": 13118 }, { "epoch": 2.67, "learning_rate": 0.00013609162044171875, "loss": 0.0063, "step": 13119 }, { "epoch": 2.67, "learning_rate": 0.00013607231870286306, "loss": 0.0053, "step": 13120 }, { "epoch": 2.67, "learning_rate": 0.0001360530171966259, "loss": 0.0202, "step": 13121 }, { "epoch": 2.67, "learning_rate": 0.00013603371592332974, "loss": 0.0047, "step": 13122 }, { "epoch": 2.67, "learning_rate": 0.0001360144148832968, "loss": 0.0039, "step": 13123 }, { "epoch": 2.67, "learning_rate": 0.00013599511407684964, "loss": 0.0209, "step": 13124 }, { "epoch": 2.67, "learning_rate": 0.00013597581350431048, "loss": 0.0182, "step": 13125 }, { "epoch": 2.67, "learning_rate": 0.00013595651316600165, "loss": 0.0088, "step": 13126 }, { "epoch": 2.67, "learning_rate": 0.0001359372130622456, "loss": 0.0122, "step": 13127 }, { "epoch": 2.67, "learning_rate": 0.0001359179131933646, "loss": 0.0047, "step": 13128 }, { "epoch": 2.67, "learning_rate": 0.00013589861355968105, "loss": 0.0085, "step": 13129 }, { "epoch": 2.67, "learning_rate": 0.0001358793141615173, "loss": 0.0208, "step": 13130 }, { "epoch": 2.67, "learning_rate": 0.00013586001499919561, "loss": 0.0116, "step": 13131 }, { "epoch": 2.67, "learning_rate": 0.00013584071607303843, "loss": 0.0072, "step": 13132 }, { "epoch": 2.67, "learning_rate": 0.00013582141738336794, "loss": 0.0097, "step": 13133 }, { "epoch": 2.67, "learning_rate": 0.0001358021189305066, "loss": 0.01, "step": 13134 }, { "epoch": 2.67, "learning_rate": 0.0001357828207147767, "loss": 0.0308, "step": 13135 }, { "epoch": 2.67, "learning_rate": 0.00013576352273650044, "loss": 0.0067, "step": 13136 }, { "epoch": 2.67, "learning_rate": 0.00013574422499600033, "loss": 0.0075, "step": 13137 }, { "epoch": 2.68, "learning_rate": 0.00013572492749359846, "loss": 0.0064, "step": 13138 }, { "epoch": 2.68, "learning_rate": 0.00013570563022961732, "loss": 0.0054, "step": 13139 }, { "epoch": 2.68, "learning_rate": 0.00013568633320437912, "loss": 0.0031, "step": 13140 }, { "epoch": 2.68, "learning_rate": 0.00013566703641820614, "loss": 0.0108, "step": 13141 }, { "epoch": 2.68, "learning_rate": 0.00013564773987142077, "loss": 0.0011, "step": 13142 }, { "epoch": 2.68, "learning_rate": 0.00013562844356434522, "loss": 0.0088, "step": 13143 }, { "epoch": 2.68, "learning_rate": 0.00013560914749730175, "loss": 0.0035, "step": 13144 }, { "epoch": 2.68, "learning_rate": 0.00013558985167061273, "loss": 0.0168, "step": 13145 }, { "epoch": 2.68, "learning_rate": 0.00013557055608460036, "loss": 0.0045, "step": 13146 }, { "epoch": 2.68, "learning_rate": 0.00013555126073958696, "loss": 0.0029, "step": 13147 }, { "epoch": 2.68, "learning_rate": 0.00013553196563589475, "loss": 0.001, "step": 13148 }, { "epoch": 2.68, "learning_rate": 0.00013551267077384604, "loss": 0.0067, "step": 13149 }, { "epoch": 2.68, "learning_rate": 0.00013549337615376307, "loss": 0.0059, "step": 13150 }, { "epoch": 2.68, "learning_rate": 0.00013547408177596812, "loss": 0.0107, "step": 13151 }, { "epoch": 2.68, "learning_rate": 0.0001354547876407834, "loss": 0.0033, "step": 13152 }, { "epoch": 2.68, "learning_rate": 0.00013543549374853123, "loss": 0.017, "step": 13153 }, { "epoch": 2.68, "learning_rate": 0.00013541620009953372, "loss": 0.0034, "step": 13154 }, { "epoch": 2.68, "learning_rate": 0.00013539690669411327, "loss": 0.0144, "step": 13155 }, { "epoch": 2.68, "learning_rate": 0.000135377613532592, "loss": 0.0075, "step": 13156 }, { "epoch": 2.68, "learning_rate": 0.00013535832061529224, "loss": 0.0099, "step": 13157 }, { "epoch": 2.68, "learning_rate": 0.00013533902794253614, "loss": 0.0161, "step": 13158 }, { "epoch": 2.68, "learning_rate": 0.00013531973551464592, "loss": 0.0074, "step": 13159 }, { "epoch": 2.68, "learning_rate": 0.00013530044333194384, "loss": 0.0032, "step": 13160 }, { "epoch": 2.68, "learning_rate": 0.0001352811513947521, "loss": 0.0019, "step": 13161 }, { "epoch": 2.68, "learning_rate": 0.00013526185970339294, "loss": 0.0082, "step": 13162 }, { "epoch": 2.68, "learning_rate": 0.00013524256825818854, "loss": 0.0334, "step": 13163 }, { "epoch": 2.68, "learning_rate": 0.00013522327705946106, "loss": 0.0214, "step": 13164 }, { "epoch": 2.68, "learning_rate": 0.00013520398610753281, "loss": 0.0029, "step": 13165 }, { "epoch": 2.68, "learning_rate": 0.00013518469540272588, "loss": 0.0038, "step": 13166 }, { "epoch": 2.68, "learning_rate": 0.00013516540494536253, "loss": 0.0019, "step": 13167 }, { "epoch": 2.68, "learning_rate": 0.00013514611473576494, "loss": 0.0128, "step": 13168 }, { "epoch": 2.68, "learning_rate": 0.0001351268247742552, "loss": 0.0066, "step": 13169 }, { "epoch": 2.68, "learning_rate": 0.0001351075350611556, "loss": 0.0111, "step": 13170 }, { "epoch": 2.68, "learning_rate": 0.0001350882455967883, "loss": 0.0158, "step": 13171 }, { "epoch": 2.68, "learning_rate": 0.00013506895638147539, "loss": 0.0166, "step": 13172 }, { "epoch": 2.68, "learning_rate": 0.00013504966741553914, "loss": 0.0117, "step": 13173 }, { "epoch": 2.68, "learning_rate": 0.0001350303786993016, "loss": 0.009, "step": 13174 }, { "epoch": 2.68, "learning_rate": 0.0001350110902330851, "loss": 0.0023, "step": 13175 }, { "epoch": 2.68, "learning_rate": 0.00013499180201721167, "loss": 0.0066, "step": 13176 }, { "epoch": 2.68, "learning_rate": 0.00013497251405200338, "loss": 0.0053, "step": 13177 }, { "epoch": 2.68, "learning_rate": 0.00013495322633778255, "loss": 0.0123, "step": 13178 }, { "epoch": 2.68, "learning_rate": 0.0001349339388748712, "loss": 0.0013, "step": 13179 }, { "epoch": 2.68, "learning_rate": 0.00013491465166359155, "loss": 0.0231, "step": 13180 }, { "epoch": 2.68, "learning_rate": 0.00013489536470426568, "loss": 0.0034, "step": 13181 }, { "epoch": 2.68, "learning_rate": 0.00013487607799721567, "loss": 0.0058, "step": 13182 }, { "epoch": 2.68, "learning_rate": 0.0001348567915427638, "loss": 0.0073, "step": 13183 }, { "epoch": 2.68, "learning_rate": 0.000134837505341232, "loss": 0.0082, "step": 13184 }, { "epoch": 2.68, "learning_rate": 0.00013481821939294257, "loss": 0.0089, "step": 13185 }, { "epoch": 2.68, "learning_rate": 0.00013479893369821753, "loss": 0.0048, "step": 13186 }, { "epoch": 2.69, "learning_rate": 0.00013477964825737895, "loss": 0.005, "step": 13187 }, { "epoch": 2.69, "learning_rate": 0.00013476036307074902, "loss": 0.0071, "step": 13188 }, { "epoch": 2.69, "learning_rate": 0.0001347410781386497, "loss": 0.0114, "step": 13189 }, { "epoch": 2.69, "learning_rate": 0.0001347217934614033, "loss": 0.0067, "step": 13190 }, { "epoch": 2.69, "learning_rate": 0.0001347025090393317, "loss": 0.0054, "step": 13191 }, { "epoch": 2.69, "learning_rate": 0.0001346832248727571, "loss": 0.0017, "step": 13192 }, { "epoch": 2.69, "learning_rate": 0.00013466394096200158, "loss": 0.0072, "step": 13193 }, { "epoch": 2.69, "learning_rate": 0.00013464465730738718, "loss": 0.0119, "step": 13194 }, { "epoch": 2.69, "learning_rate": 0.00013462537390923596, "loss": 0.0042, "step": 13195 }, { "epoch": 2.69, "learning_rate": 0.00013460609076787009, "loss": 0.0118, "step": 13196 }, { "epoch": 2.69, "learning_rate": 0.00013458680788361145, "loss": 0.0101, "step": 13197 }, { "epoch": 2.69, "learning_rate": 0.0001345675252567823, "loss": 0.0073, "step": 13198 }, { "epoch": 2.69, "learning_rate": 0.00013454824288770462, "loss": 0.0116, "step": 13199 }, { "epoch": 2.69, "learning_rate": 0.00013452896077670038, "loss": 0.0094, "step": 13200 }, { "epoch": 2.69, "learning_rate": 0.00013450967892409175, "loss": 0.0073, "step": 13201 }, { "epoch": 2.69, "learning_rate": 0.0001344903973302007, "loss": 0.0132, "step": 13202 }, { "epoch": 2.69, "learning_rate": 0.0001344711159953493, "loss": 0.0101, "step": 13203 }, { "epoch": 2.69, "learning_rate": 0.0001344518349198596, "loss": 0.0013, "step": 13204 }, { "epoch": 2.69, "learning_rate": 0.00013443255410405355, "loss": 0.0048, "step": 13205 }, { "epoch": 2.69, "learning_rate": 0.00013441327354825328, "loss": 0.0073, "step": 13206 }, { "epoch": 2.69, "learning_rate": 0.0001343939932527807, "loss": 0.0157, "step": 13207 }, { "epoch": 2.69, "learning_rate": 0.00013437471321795798, "loss": 0.0025, "step": 13208 }, { "epoch": 2.69, "learning_rate": 0.000134355433444107, "loss": 0.0094, "step": 13209 }, { "epoch": 2.69, "learning_rate": 0.0001343361539315498, "loss": 0.0182, "step": 13210 }, { "epoch": 2.69, "learning_rate": 0.00013431687468060845, "loss": 0.011, "step": 13211 }, { "epoch": 2.69, "learning_rate": 0.0001342975956916048, "loss": 0.0103, "step": 13212 }, { "epoch": 2.69, "learning_rate": 0.000134278316964861, "loss": 0.0075, "step": 13213 }, { "epoch": 2.69, "learning_rate": 0.00013425903850069904, "loss": 0.0006, "step": 13214 }, { "epoch": 2.69, "learning_rate": 0.00013423976029944073, "loss": 0.021, "step": 13215 }, { "epoch": 2.69, "learning_rate": 0.00013422048236140827, "loss": 0.0187, "step": 13216 }, { "epoch": 2.69, "learning_rate": 0.00013420120468692355, "loss": 0.0096, "step": 13217 }, { "epoch": 2.69, "learning_rate": 0.00013418192727630845, "loss": 0.003, "step": 13218 }, { "epoch": 2.69, "learning_rate": 0.0001341626501298851, "loss": 0.0049, "step": 13219 }, { "epoch": 2.69, "learning_rate": 0.0001341433732479753, "loss": 0.0075, "step": 13220 }, { "epoch": 2.69, "learning_rate": 0.00013412409663090118, "loss": 0.0019, "step": 13221 }, { "epoch": 2.69, "learning_rate": 0.0001341048202789846, "loss": 0.0173, "step": 13222 }, { "epoch": 2.69, "learning_rate": 0.00013408554419254746, "loss": 0.0087, "step": 13223 }, { "epoch": 2.69, "learning_rate": 0.00013406626837191184, "loss": 0.0103, "step": 13224 }, { "epoch": 2.69, "learning_rate": 0.00013404699281739958, "loss": 0.0074, "step": 13225 }, { "epoch": 2.69, "learning_rate": 0.00013402771752933269, "loss": 0.0201, "step": 13226 }, { "epoch": 2.69, "learning_rate": 0.0001340084425080331, "loss": 0.0074, "step": 13227 }, { "epoch": 2.69, "learning_rate": 0.0001339891677538226, "loss": 0.0105, "step": 13228 }, { "epoch": 2.69, "learning_rate": 0.0001339698932670233, "loss": 0.0075, "step": 13229 }, { "epoch": 2.69, "learning_rate": 0.000133950619047957, "loss": 0.0033, "step": 13230 }, { "epoch": 2.69, "learning_rate": 0.00013393134509694568, "loss": 0.0072, "step": 13231 }, { "epoch": 2.69, "learning_rate": 0.00013391207141431123, "loss": 0.0134, "step": 13232 }, { "epoch": 2.69, "learning_rate": 0.00013389279800037553, "loss": 0.0126, "step": 13233 }, { "epoch": 2.69, "learning_rate": 0.00013387352485546054, "loss": 0.0106, "step": 13234 }, { "epoch": 2.69, "learning_rate": 0.00013385425197988806, "loss": 0.0115, "step": 13235 }, { "epoch": 2.7, "learning_rate": 0.00013383497937398015, "loss": 0.0011, "step": 13236 }, { "epoch": 2.7, "learning_rate": 0.00013381570703805857, "loss": 0.0142, "step": 13237 }, { "epoch": 2.7, "learning_rate": 0.00013379643497244518, "loss": 0.0054, "step": 13238 }, { "epoch": 2.7, "learning_rate": 0.00013377716317746196, "loss": 0.0136, "step": 13239 }, { "epoch": 2.7, "learning_rate": 0.0001337578916534307, "loss": 0.0213, "step": 13240 }, { "epoch": 2.7, "learning_rate": 0.00013373862040067335, "loss": 0.0005, "step": 13241 }, { "epoch": 2.7, "learning_rate": 0.00013371934941951172, "loss": 0.0009, "step": 13242 }, { "epoch": 2.7, "learning_rate": 0.00013370007871026768, "loss": 0.0012, "step": 13243 }, { "epoch": 2.7, "learning_rate": 0.00013368080827326308, "loss": 0.0013, "step": 13244 }, { "epoch": 2.7, "learning_rate": 0.00013366153810881985, "loss": 0.0069, "step": 13245 }, { "epoch": 2.7, "learning_rate": 0.00013364226821725966, "loss": 0.007, "step": 13246 }, { "epoch": 2.7, "learning_rate": 0.0001336229985989046, "loss": 0.0072, "step": 13247 }, { "epoch": 2.7, "learning_rate": 0.00013360372925407625, "loss": 0.0111, "step": 13248 }, { "epoch": 2.7, "learning_rate": 0.00013358446018309667, "loss": 0.006, "step": 13249 }, { "epoch": 2.7, "learning_rate": 0.00013356519138628758, "loss": 0.0011, "step": 13250 }, { "epoch": 2.7, "learning_rate": 0.00013354592286397076, "loss": 0.0018, "step": 13251 }, { "epoch": 2.7, "learning_rate": 0.00013352665461646815, "loss": 0.0008, "step": 13252 }, { "epoch": 2.7, "learning_rate": 0.00013350738664410144, "loss": 0.013, "step": 13253 }, { "epoch": 2.7, "learning_rate": 0.00013348811894719253, "loss": 0.0156, "step": 13254 }, { "epoch": 2.7, "learning_rate": 0.00013346885152606323, "loss": 0.0075, "step": 13255 }, { "epoch": 2.7, "learning_rate": 0.00013344958438103526, "loss": 0.0025, "step": 13256 }, { "epoch": 2.7, "learning_rate": 0.00013343031751243055, "loss": 0.0092, "step": 13257 }, { "epoch": 2.7, "learning_rate": 0.00013341105092057074, "loss": 0.0126, "step": 13258 }, { "epoch": 2.7, "learning_rate": 0.00013339178460577774, "loss": 0.0096, "step": 13259 }, { "epoch": 2.7, "learning_rate": 0.0001333725185683733, "loss": 0.002, "step": 13260 }, { "epoch": 2.7, "learning_rate": 0.00013335325280867914, "loss": 0.0039, "step": 13261 }, { "epoch": 2.7, "learning_rate": 0.00013333398732701712, "loss": 0.0096, "step": 13262 }, { "epoch": 2.7, "learning_rate": 0.0001333147221237089, "loss": 0.0072, "step": 13263 }, { "epoch": 2.7, "learning_rate": 0.0001332954571990764, "loss": 0.017, "step": 13264 }, { "epoch": 2.7, "learning_rate": 0.00013327619255344128, "loss": 0.0038, "step": 13265 }, { "epoch": 2.7, "learning_rate": 0.00013325692818712525, "loss": 0.0123, "step": 13266 }, { "epoch": 2.7, "learning_rate": 0.0001332376641004502, "loss": 0.0127, "step": 13267 }, { "epoch": 2.7, "learning_rate": 0.0001332184002937378, "loss": 0.0255, "step": 13268 }, { "epoch": 2.7, "learning_rate": 0.00013319913676730974, "loss": 0.0218, "step": 13269 }, { "epoch": 2.7, "learning_rate": 0.00013317987352148787, "loss": 0.0052, "step": 13270 }, { "epoch": 2.7, "learning_rate": 0.0001331606105565938, "loss": 0.003, "step": 13271 }, { "epoch": 2.7, "learning_rate": 0.00013314134787294934, "loss": 0.0062, "step": 13272 }, { "epoch": 2.7, "learning_rate": 0.0001331220854708762, "loss": 0.0032, "step": 13273 }, { "epoch": 2.7, "learning_rate": 0.0001331028233506961, "loss": 0.0068, "step": 13274 }, { "epoch": 2.7, "learning_rate": 0.00013308356151273075, "loss": 0.0077, "step": 13275 }, { "epoch": 2.7, "learning_rate": 0.00013306429995730177, "loss": 0.0371, "step": 13276 }, { "epoch": 2.7, "learning_rate": 0.00013304503868473108, "loss": 0.0102, "step": 13277 }, { "epoch": 2.7, "learning_rate": 0.0001330257776953402, "loss": 0.0039, "step": 13278 }, { "epoch": 2.7, "learning_rate": 0.00013300651698945084, "loss": 0.0062, "step": 13279 }, { "epoch": 2.7, "learning_rate": 0.00013298725656738476, "loss": 0.0113, "step": 13280 }, { "epoch": 2.7, "learning_rate": 0.00013296799642946357, "loss": 0.009, "step": 13281 }, { "epoch": 2.7, "learning_rate": 0.00013294873657600904, "loss": 0.0078, "step": 13282 }, { "epoch": 2.7, "learning_rate": 0.0001329294770073428, "loss": 0.0014, "step": 13283 }, { "epoch": 2.7, "learning_rate": 0.00013291021772378648, "loss": 0.0088, "step": 13284 }, { "epoch": 2.71, "learning_rate": 0.00013289095872566178, "loss": 0.0102, "step": 13285 }, { "epoch": 2.71, "learning_rate": 0.00013287170001329037, "loss": 0.0146, "step": 13286 }, { "epoch": 2.71, "learning_rate": 0.0001328524415869939, "loss": 0.0042, "step": 13287 }, { "epoch": 2.71, "learning_rate": 0.00013283318344709406, "loss": 0.0198, "step": 13288 }, { "epoch": 2.71, "learning_rate": 0.0001328139255939124, "loss": 0.0051, "step": 13289 }, { "epoch": 2.71, "learning_rate": 0.00013279466802777068, "loss": 0.0028, "step": 13290 }, { "epoch": 2.71, "learning_rate": 0.0001327754107489905, "loss": 0.0053, "step": 13291 }, { "epoch": 2.71, "learning_rate": 0.0001327561537578934, "loss": 0.0088, "step": 13292 }, { "epoch": 2.71, "learning_rate": 0.00013273689705480113, "loss": 0.014, "step": 13293 }, { "epoch": 2.71, "learning_rate": 0.00013271764064003524, "loss": 0.0121, "step": 13294 }, { "epoch": 2.71, "learning_rate": 0.00013269838451391737, "loss": 0.0053, "step": 13295 }, { "epoch": 2.71, "learning_rate": 0.00013267912867676919, "loss": 0.0113, "step": 13296 }, { "epoch": 2.71, "learning_rate": 0.00013265987312891217, "loss": 0.0088, "step": 13297 }, { "epoch": 2.71, "learning_rate": 0.00013264061787066807, "loss": 0.0164, "step": 13298 }, { "epoch": 2.71, "learning_rate": 0.00013262136290235837, "loss": 0.0079, "step": 13299 }, { "epoch": 2.71, "learning_rate": 0.00013260210822430476, "loss": 0.0082, "step": 13300 }, { "epoch": 2.71, "learning_rate": 0.0001325828538368288, "loss": 0.0135, "step": 13301 }, { "epoch": 2.71, "learning_rate": 0.000132563599740252, "loss": 0.0106, "step": 13302 }, { "epoch": 2.71, "learning_rate": 0.00013254434593489605, "loss": 0.0018, "step": 13303 }, { "epoch": 2.71, "learning_rate": 0.0001325250924210824, "loss": 0.0064, "step": 13304 }, { "epoch": 2.71, "learning_rate": 0.00013250583919913278, "loss": 0.0108, "step": 13305 }, { "epoch": 2.71, "learning_rate": 0.00013248658626936863, "loss": 0.0046, "step": 13306 }, { "epoch": 2.71, "learning_rate": 0.0001324673336321115, "loss": 0.0052, "step": 13307 }, { "epoch": 2.71, "learning_rate": 0.00013244808128768306, "loss": 0.0094, "step": 13308 }, { "epoch": 2.71, "learning_rate": 0.00013242882923640475, "loss": 0.033, "step": 13309 }, { "epoch": 2.71, "learning_rate": 0.00013240957747859822, "loss": 0.0116, "step": 13310 }, { "epoch": 2.71, "learning_rate": 0.00013239032601458493, "loss": 0.0034, "step": 13311 }, { "epoch": 2.71, "learning_rate": 0.00013237107484468638, "loss": 0.0056, "step": 13312 }, { "epoch": 2.71, "learning_rate": 0.0001323518239692242, "loss": 0.026, "step": 13313 }, { "epoch": 2.71, "learning_rate": 0.00013233257338851986, "loss": 0.0052, "step": 13314 }, { "epoch": 2.71, "learning_rate": 0.00013231332310289492, "loss": 0.0025, "step": 13315 }, { "epoch": 2.71, "learning_rate": 0.00013229407311267087, "loss": 0.0044, "step": 13316 }, { "epoch": 2.71, "learning_rate": 0.0001322748234181692, "loss": 0.0022, "step": 13317 }, { "epoch": 2.71, "learning_rate": 0.00013225557401971142, "loss": 0.024, "step": 13318 }, { "epoch": 2.71, "learning_rate": 0.0001322363249176191, "loss": 0.005, "step": 13319 }, { "epoch": 2.71, "learning_rate": 0.00013221707611221363, "loss": 0.0013, "step": 13320 }, { "epoch": 2.71, "learning_rate": 0.0001321978276038166, "loss": 0.0183, "step": 13321 }, { "epoch": 2.71, "learning_rate": 0.00013217857939274943, "loss": 0.0022, "step": 13322 }, { "epoch": 2.71, "learning_rate": 0.00013215933147933364, "loss": 0.0193, "step": 13323 }, { "epoch": 2.71, "learning_rate": 0.0001321400838638907, "loss": 0.0052, "step": 13324 }, { "epoch": 2.71, "learning_rate": 0.00013212083654674204, "loss": 0.0054, "step": 13325 }, { "epoch": 2.71, "learning_rate": 0.00013210158952820916, "loss": 0.008, "step": 13326 }, { "epoch": 2.71, "learning_rate": 0.00013208234280861353, "loss": 0.0043, "step": 13327 }, { "epoch": 2.71, "learning_rate": 0.0001320630963882766, "loss": 0.0028, "step": 13328 }, { "epoch": 2.71, "learning_rate": 0.00013204385026751984, "loss": 0.0149, "step": 13329 }, { "epoch": 2.71, "learning_rate": 0.0001320246044466646, "loss": 0.0089, "step": 13330 }, { "epoch": 2.71, "learning_rate": 0.0001320053589260325, "loss": 0.0045, "step": 13331 }, { "epoch": 2.71, "learning_rate": 0.00013198611370594479, "loss": 0.0063, "step": 13332 }, { "epoch": 2.71, "learning_rate": 0.00013196686878672305, "loss": 0.006, "step": 13333 }, { "epoch": 2.72, "learning_rate": 0.00013194762416868862, "loss": 0.0218, "step": 13334 }, { "epoch": 2.72, "learning_rate": 0.0001319283798521629, "loss": 0.011, "step": 13335 }, { "epoch": 2.72, "learning_rate": 0.00013190913583746743, "loss": 0.008, "step": 13336 }, { "epoch": 2.72, "learning_rate": 0.00013188989212492344, "loss": 0.0246, "step": 13337 }, { "epoch": 2.72, "learning_rate": 0.0001318706487148525, "loss": 0.0055, "step": 13338 }, { "epoch": 2.72, "learning_rate": 0.00013185140560757595, "loss": 0.0025, "step": 13339 }, { "epoch": 2.72, "learning_rate": 0.00013183216280341514, "loss": 0.0042, "step": 13340 }, { "epoch": 2.72, "learning_rate": 0.00013181292030269156, "loss": 0.0037, "step": 13341 }, { "epoch": 2.72, "learning_rate": 0.00013179367810572655, "loss": 0.0086, "step": 13342 }, { "epoch": 2.72, "learning_rate": 0.00013177443621284143, "loss": 0.0014, "step": 13343 }, { "epoch": 2.72, "learning_rate": 0.00013175519462435767, "loss": 0.0086, "step": 13344 }, { "epoch": 2.72, "learning_rate": 0.00013173595334059653, "loss": 0.0091, "step": 13345 }, { "epoch": 2.72, "learning_rate": 0.00013171671236187954, "loss": 0.0004, "step": 13346 }, { "epoch": 2.72, "learning_rate": 0.0001316974716885279, "loss": 0.0009, "step": 13347 }, { "epoch": 2.72, "learning_rate": 0.00013167823132086303, "loss": 0.0026, "step": 13348 }, { "epoch": 2.72, "learning_rate": 0.0001316589912592063, "loss": 0.0153, "step": 13349 }, { "epoch": 2.72, "learning_rate": 0.00013163975150387903, "loss": 0.0054, "step": 13350 }, { "epoch": 2.72, "learning_rate": 0.0001316205120552026, "loss": 0.0069, "step": 13351 }, { "epoch": 2.72, "learning_rate": 0.00013160127291349832, "loss": 0.0031, "step": 13352 }, { "epoch": 2.72, "learning_rate": 0.00013158203407908744, "loss": 0.0113, "step": 13353 }, { "epoch": 2.72, "learning_rate": 0.00013156279555229144, "loss": 0.0079, "step": 13354 }, { "epoch": 2.72, "learning_rate": 0.00013154355733343146, "loss": 0.0051, "step": 13355 }, { "epoch": 2.72, "learning_rate": 0.000131524319422829, "loss": 0.0122, "step": 13356 }, { "epoch": 2.72, "learning_rate": 0.00013150508182080525, "loss": 0.0002, "step": 13357 }, { "epoch": 2.72, "learning_rate": 0.00013148584452768154, "loss": 0.0053, "step": 13358 }, { "epoch": 2.72, "learning_rate": 0.00013146660754377918, "loss": 0.0189, "step": 13359 }, { "epoch": 2.72, "learning_rate": 0.0001314473708694194, "loss": 0.0105, "step": 13360 }, { "epoch": 2.72, "learning_rate": 0.00013142813450492364, "loss": 0.0019, "step": 13361 }, { "epoch": 2.72, "learning_rate": 0.00013140889845061307, "loss": 0.0038, "step": 13362 }, { "epoch": 2.72, "learning_rate": 0.00013138966270680896, "loss": 0.0072, "step": 13363 }, { "epoch": 2.72, "learning_rate": 0.00013137042727383265, "loss": 0.0115, "step": 13364 }, { "epoch": 2.72, "learning_rate": 0.00013135119215200536, "loss": 0.0128, "step": 13365 }, { "epoch": 2.72, "learning_rate": 0.00013133195734164833, "loss": 0.0014, "step": 13366 }, { "epoch": 2.72, "learning_rate": 0.00013131272284308285, "loss": 0.0004, "step": 13367 }, { "epoch": 2.72, "learning_rate": 0.0001312934886566302, "loss": 0.0047, "step": 13368 }, { "epoch": 2.72, "learning_rate": 0.00013127425478261158, "loss": 0.0007, "step": 13369 }, { "epoch": 2.72, "learning_rate": 0.0001312550212213483, "loss": 0.0288, "step": 13370 }, { "epoch": 2.72, "learning_rate": 0.00013123578797316146, "loss": 0.0072, "step": 13371 }, { "epoch": 2.72, "learning_rate": 0.00013121655503837247, "loss": 0.013, "step": 13372 }, { "epoch": 2.72, "learning_rate": 0.0001311973224173024, "loss": 0.0031, "step": 13373 }, { "epoch": 2.72, "learning_rate": 0.00013117809011027262, "loss": 0.0013, "step": 13374 }, { "epoch": 2.72, "learning_rate": 0.00013115885811760422, "loss": 0.0067, "step": 13375 }, { "epoch": 2.72, "learning_rate": 0.00013113962643961842, "loss": 0.0098, "step": 13376 }, { "epoch": 2.72, "learning_rate": 0.00013112039507663653, "loss": 0.0003, "step": 13377 }, { "epoch": 2.72, "learning_rate": 0.00013110116402897958, "loss": 0.0269, "step": 13378 }, { "epoch": 2.72, "learning_rate": 0.00013108193329696894, "loss": 0.0175, "step": 13379 }, { "epoch": 2.72, "learning_rate": 0.00013106270288092573, "loss": 0.0071, "step": 13380 }, { "epoch": 2.72, "learning_rate": 0.00013104347278117108, "loss": 0.003, "step": 13381 }, { "epoch": 2.72, "learning_rate": 0.00013102424299802628, "loss": 0.0022, "step": 13382 }, { "epoch": 2.73, "learning_rate": 0.00013100501353181235, "loss": 0.0052, "step": 13383 }, { "epoch": 2.73, "learning_rate": 0.00013098578438285063, "loss": 0.0018, "step": 13384 }, { "epoch": 2.73, "learning_rate": 0.00013096655555146222, "loss": 0.0295, "step": 13385 }, { "epoch": 2.73, "learning_rate": 0.00013094732703796818, "loss": 0.0175, "step": 13386 }, { "epoch": 2.73, "learning_rate": 0.0001309280988426898, "loss": 0.0082, "step": 13387 }, { "epoch": 2.73, "learning_rate": 0.00013090887096594813, "loss": 0.0141, "step": 13388 }, { "epoch": 2.73, "learning_rate": 0.0001308896434080644, "loss": 0.0063, "step": 13389 }, { "epoch": 2.73, "learning_rate": 0.00013087041616935966, "loss": 0.0007, "step": 13390 }, { "epoch": 2.73, "learning_rate": 0.00013085118925015504, "loss": 0.0258, "step": 13391 }, { "epoch": 2.73, "learning_rate": 0.0001308319626507718, "loss": 0.0033, "step": 13392 }, { "epoch": 2.73, "learning_rate": 0.00013081273637153095, "loss": 0.0162, "step": 13393 }, { "epoch": 2.73, "learning_rate": 0.00013079351041275355, "loss": 0.0198, "step": 13394 }, { "epoch": 2.73, "learning_rate": 0.00013077428477476088, "loss": 0.032, "step": 13395 }, { "epoch": 2.73, "learning_rate": 0.00013075505945787382, "loss": 0.0081, "step": 13396 }, { "epoch": 2.73, "learning_rate": 0.0001307358344624137, "loss": 0.0056, "step": 13397 }, { "epoch": 2.73, "learning_rate": 0.00013071660978870148, "loss": 0.0081, "step": 13398 }, { "epoch": 2.73, "learning_rate": 0.00013069738543705826, "loss": 0.0082, "step": 13399 }, { "epoch": 2.73, "learning_rate": 0.00013067816140780516, "loss": 0.0017, "step": 13400 }, { "epoch": 2.73, "learning_rate": 0.00013065893770126318, "loss": 0.0038, "step": 13401 }, { "epoch": 2.73, "learning_rate": 0.00013063971431775354, "loss": 0.0044, "step": 13402 }, { "epoch": 2.73, "learning_rate": 0.0001306204912575972, "loss": 0.0054, "step": 13403 }, { "epoch": 2.73, "learning_rate": 0.00013060126852111517, "loss": 0.0221, "step": 13404 }, { "epoch": 2.73, "learning_rate": 0.00013058204610862862, "loss": 0.0098, "step": 13405 }, { "epoch": 2.73, "learning_rate": 0.0001305628240204585, "loss": 0.0055, "step": 13406 }, { "epoch": 2.73, "learning_rate": 0.000130543602256926, "loss": 0.0052, "step": 13407 }, { "epoch": 2.73, "learning_rate": 0.00013052438081835203, "loss": 0.0064, "step": 13408 }, { "epoch": 2.73, "learning_rate": 0.00013050515970505766, "loss": 0.0111, "step": 13409 }, { "epoch": 2.73, "learning_rate": 0.0001304859389173639, "loss": 0.0009, "step": 13410 }, { "epoch": 2.73, "learning_rate": 0.00013046671845559182, "loss": 0.0057, "step": 13411 }, { "epoch": 2.73, "learning_rate": 0.0001304474983200624, "loss": 0.0072, "step": 13412 }, { "epoch": 2.73, "learning_rate": 0.0001304282785110967, "loss": 0.0047, "step": 13413 }, { "epoch": 2.73, "learning_rate": 0.00013040905902901562, "loss": 0.0064, "step": 13414 }, { "epoch": 2.73, "learning_rate": 0.00013038983987414033, "loss": 0.0071, "step": 13415 }, { "epoch": 2.73, "learning_rate": 0.00013037062104679173, "loss": 0.0022, "step": 13416 }, { "epoch": 2.73, "learning_rate": 0.0001303514025472907, "loss": 0.0102, "step": 13417 }, { "epoch": 2.73, "learning_rate": 0.00013033218437595844, "loss": 0.0024, "step": 13418 }, { "epoch": 2.73, "learning_rate": 0.00013031296653311574, "loss": 0.009, "step": 13419 }, { "epoch": 2.73, "learning_rate": 0.0001302937490190837, "loss": 0.0131, "step": 13420 }, { "epoch": 2.73, "learning_rate": 0.0001302745318341833, "loss": 0.006, "step": 13421 }, { "epoch": 2.73, "learning_rate": 0.0001302553149787354, "loss": 0.0142, "step": 13422 }, { "epoch": 2.73, "learning_rate": 0.00013023609845306102, "loss": 0.0278, "step": 13423 }, { "epoch": 2.73, "learning_rate": 0.00013021688225748108, "loss": 0.0062, "step": 13424 }, { "epoch": 2.73, "learning_rate": 0.0001301976663923166, "loss": 0.0129, "step": 13425 }, { "epoch": 2.73, "learning_rate": 0.00013017845085788846, "loss": 0.0078, "step": 13426 }, { "epoch": 2.73, "learning_rate": 0.00013015923565451757, "loss": 0.0082, "step": 13427 }, { "epoch": 2.73, "learning_rate": 0.00013014002078252495, "loss": 0.0039, "step": 13428 }, { "epoch": 2.73, "learning_rate": 0.00013012080624223138, "loss": 0.0054, "step": 13429 }, { "epoch": 2.73, "learning_rate": 0.00013010159203395797, "loss": 0.0109, "step": 13430 }, { "epoch": 2.73, "learning_rate": 0.0001300823781580255, "loss": 0.0036, "step": 13431 }, { "epoch": 2.74, "learning_rate": 0.00013006316461475486, "loss": 0.0051, "step": 13432 }, { "epoch": 2.74, "learning_rate": 0.00013004395140446708, "loss": 0.0047, "step": 13433 }, { "epoch": 2.74, "learning_rate": 0.00013002473852748292, "loss": 0.0073, "step": 13434 }, { "epoch": 2.74, "learning_rate": 0.00013000552598412338, "loss": 0.0045, "step": 13435 }, { "epoch": 2.74, "learning_rate": 0.00012998631377470933, "loss": 0.0048, "step": 13436 }, { "epoch": 2.74, "learning_rate": 0.00012996710189956153, "loss": 0.0061, "step": 13437 }, { "epoch": 2.74, "learning_rate": 0.000129947890359001, "loss": 0.0048, "step": 13438 }, { "epoch": 2.74, "learning_rate": 0.00012992867915334852, "loss": 0.0047, "step": 13439 }, { "epoch": 2.74, "learning_rate": 0.00012990946828292502, "loss": 0.0278, "step": 13440 }, { "epoch": 2.74, "learning_rate": 0.0001298902577480513, "loss": 0.008, "step": 13441 }, { "epoch": 2.74, "learning_rate": 0.00012987104754904824, "loss": 0.0038, "step": 13442 }, { "epoch": 2.74, "learning_rate": 0.00012985183768623668, "loss": 0.0101, "step": 13443 }, { "epoch": 2.74, "learning_rate": 0.0001298326281599375, "loss": 0.0058, "step": 13444 }, { "epoch": 2.74, "learning_rate": 0.0001298134189704714, "loss": 0.0116, "step": 13445 }, { "epoch": 2.74, "learning_rate": 0.00012979421011815941, "loss": 0.0175, "step": 13446 }, { "epoch": 2.74, "learning_rate": 0.00012977500160332218, "loss": 0.0103, "step": 13447 }, { "epoch": 2.74, "learning_rate": 0.00012975579342628066, "loss": 0.0136, "step": 13448 }, { "epoch": 2.74, "learning_rate": 0.0001297365855873556, "loss": 0.0031, "step": 13449 }, { "epoch": 2.74, "learning_rate": 0.00012971737808686775, "loss": 0.0045, "step": 13450 }, { "epoch": 2.74, "learning_rate": 0.00012969817092513803, "loss": 0.0154, "step": 13451 }, { "epoch": 2.74, "learning_rate": 0.00012967896410248715, "loss": 0.0055, "step": 13452 }, { "epoch": 2.74, "learning_rate": 0.00012965975761923592, "loss": 0.0014, "step": 13453 }, { "epoch": 2.74, "learning_rate": 0.00012964055147570517, "loss": 0.0018, "step": 13454 }, { "epoch": 2.74, "learning_rate": 0.00012962134567221558, "loss": 0.0123, "step": 13455 }, { "epoch": 2.74, "learning_rate": 0.00012960214020908808, "loss": 0.0053, "step": 13456 }, { "epoch": 2.74, "learning_rate": 0.00012958293508664323, "loss": 0.0005, "step": 13457 }, { "epoch": 2.74, "learning_rate": 0.00012956373030520202, "loss": 0.0059, "step": 13458 }, { "epoch": 2.74, "learning_rate": 0.00012954452586508506, "loss": 0.0084, "step": 13459 }, { "epoch": 2.74, "learning_rate": 0.00012952532176661305, "loss": 0.0109, "step": 13460 }, { "epoch": 2.74, "learning_rate": 0.00012950611801010686, "loss": 0.0067, "step": 13461 }, { "epoch": 2.74, "learning_rate": 0.00012948691459588717, "loss": 0.0039, "step": 13462 }, { "epoch": 2.74, "learning_rate": 0.00012946771152427477, "loss": 0.0128, "step": 13463 }, { "epoch": 2.74, "learning_rate": 0.00012944850879559035, "loss": 0.0052, "step": 13464 }, { "epoch": 2.74, "learning_rate": 0.00012942930641015457, "loss": 0.0067, "step": 13465 }, { "epoch": 2.74, "learning_rate": 0.00012941010436828826, "loss": 0.0087, "step": 13466 }, { "epoch": 2.74, "learning_rate": 0.00012939090267031207, "loss": 0.002, "step": 13467 }, { "epoch": 2.74, "learning_rate": 0.00012937170131654664, "loss": 0.0072, "step": 13468 }, { "epoch": 2.74, "learning_rate": 0.00012935250030731284, "loss": 0.0042, "step": 13469 }, { "epoch": 2.74, "learning_rate": 0.00012933329964293113, "loss": 0.0102, "step": 13470 }, { "epoch": 2.74, "learning_rate": 0.00012931409932372245, "loss": 0.0044, "step": 13471 }, { "epoch": 2.74, "learning_rate": 0.0001292948993500073, "loss": 0.031, "step": 13472 }, { "epoch": 2.74, "learning_rate": 0.00012927569972210639, "loss": 0.001, "step": 13473 }, { "epoch": 2.74, "learning_rate": 0.00012925650044034046, "loss": 0.0031, "step": 13474 }, { "epoch": 2.74, "learning_rate": 0.00012923730150503007, "loss": 0.0021, "step": 13475 }, { "epoch": 2.74, "learning_rate": 0.00012921810291649603, "loss": 0.0077, "step": 13476 }, { "epoch": 2.74, "learning_rate": 0.00012919890467505887, "loss": 0.0051, "step": 13477 }, { "epoch": 2.74, "learning_rate": 0.0001291797067810392, "loss": 0.0087, "step": 13478 }, { "epoch": 2.74, "learning_rate": 0.0001291605092347578, "loss": 0.0136, "step": 13479 }, { "epoch": 2.74, "learning_rate": 0.0001291413120365352, "loss": 0.0119, "step": 13480 }, { "epoch": 2.74, "learning_rate": 0.0001291221151866921, "loss": 0.0062, "step": 13481 }, { "epoch": 2.75, "learning_rate": 0.00012910291868554905, "loss": 0.0017, "step": 13482 }, { "epoch": 2.75, "learning_rate": 0.0001290837225334267, "loss": 0.0054, "step": 13483 }, { "epoch": 2.75, "learning_rate": 0.0001290645267306457, "loss": 0.0102, "step": 13484 }, { "epoch": 2.75, "learning_rate": 0.00012904533127752654, "loss": 0.0172, "step": 13485 }, { "epoch": 2.75, "learning_rate": 0.00012902613617439, "loss": 0.0073, "step": 13486 }, { "epoch": 2.75, "learning_rate": 0.00012900694142155657, "loss": 0.0102, "step": 13487 }, { "epoch": 2.75, "learning_rate": 0.00012898774701934677, "loss": 0.0017, "step": 13488 }, { "epoch": 2.75, "learning_rate": 0.00012896855296808135, "loss": 0.0048, "step": 13489 }, { "epoch": 2.75, "learning_rate": 0.00012894935926808075, "loss": 0.0034, "step": 13490 }, { "epoch": 2.75, "learning_rate": 0.00012893016591966554, "loss": 0.0014, "step": 13491 }, { "epoch": 2.75, "learning_rate": 0.00012891097292315638, "loss": 0.008, "step": 13492 }, { "epoch": 2.75, "learning_rate": 0.00012889178027887378, "loss": 0.0034, "step": 13493 }, { "epoch": 2.75, "learning_rate": 0.0001288725879871383, "loss": 0.0029, "step": 13494 }, { "epoch": 2.75, "learning_rate": 0.0001288533960482705, "loss": 0.0135, "step": 13495 }, { "epoch": 2.75, "learning_rate": 0.00012883420446259083, "loss": 0.0059, "step": 13496 }, { "epoch": 2.75, "learning_rate": 0.00012881501323041997, "loss": 0.0048, "step": 13497 }, { "epoch": 2.75, "learning_rate": 0.00012879582235207832, "loss": 0.0031, "step": 13498 }, { "epoch": 2.75, "learning_rate": 0.00012877663182788652, "loss": 0.0154, "step": 13499 }, { "epoch": 2.75, "learning_rate": 0.00012875744165816502, "loss": 0.0032, "step": 13500 }, { "epoch": 2.75, "learning_rate": 0.0001287382518432343, "loss": 0.004, "step": 13501 }, { "epoch": 2.75, "learning_rate": 0.00012871906238341496, "loss": 0.0065, "step": 13502 }, { "epoch": 2.75, "learning_rate": 0.0001286998732790274, "loss": 0.0087, "step": 13503 }, { "epoch": 2.75, "learning_rate": 0.00012868068453039216, "loss": 0.0007, "step": 13504 }, { "epoch": 2.75, "learning_rate": 0.00012866149613782981, "loss": 0.0046, "step": 13505 }, { "epoch": 2.75, "learning_rate": 0.00012864230810166069, "loss": 0.0134, "step": 13506 }, { "epoch": 2.75, "learning_rate": 0.00012862312042220535, "loss": 0.0174, "step": 13507 }, { "epoch": 2.75, "learning_rate": 0.00012860393309978424, "loss": 0.0146, "step": 13508 }, { "epoch": 2.75, "learning_rate": 0.00012858474613471787, "loss": 0.0069, "step": 13509 }, { "epoch": 2.75, "learning_rate": 0.00012856555952732668, "loss": 0.0238, "step": 13510 }, { "epoch": 2.75, "learning_rate": 0.00012854637327793102, "loss": 0.0193, "step": 13511 }, { "epoch": 2.75, "learning_rate": 0.0001285271873868515, "loss": 0.0043, "step": 13512 }, { "epoch": 2.75, "learning_rate": 0.00012850800185440842, "loss": 0.0216, "step": 13513 }, { "epoch": 2.75, "learning_rate": 0.0001284888166809223, "loss": 0.0062, "step": 13514 }, { "epoch": 2.75, "learning_rate": 0.0001284696318667136, "loss": 0.006, "step": 13515 }, { "epoch": 2.75, "learning_rate": 0.00012845044741210262, "loss": 0.0051, "step": 13516 }, { "epoch": 2.75, "learning_rate": 0.0001284312633174099, "loss": 0.0096, "step": 13517 }, { "epoch": 2.75, "learning_rate": 0.00012841207958295582, "loss": 0.0147, "step": 13518 }, { "epoch": 2.75, "learning_rate": 0.00012839289620906064, "loss": 0.0114, "step": 13519 }, { "epoch": 2.75, "learning_rate": 0.00012837371319604499, "loss": 0.0111, "step": 13520 }, { "epoch": 2.75, "learning_rate": 0.00012835453054422908, "loss": 0.0007, "step": 13521 }, { "epoch": 2.75, "learning_rate": 0.00012833534825393343, "loss": 0.0076, "step": 13522 }, { "epoch": 2.75, "learning_rate": 0.00012831616632547833, "loss": 0.0052, "step": 13523 }, { "epoch": 2.75, "learning_rate": 0.00012829698475918418, "loss": 0.0116, "step": 13524 }, { "epoch": 2.75, "learning_rate": 0.00012827780355537135, "loss": 0.0384, "step": 13525 }, { "epoch": 2.75, "learning_rate": 0.00012825862271436018, "loss": 0.0037, "step": 13526 }, { "epoch": 2.75, "learning_rate": 0.00012823944223647112, "loss": 0.0036, "step": 13527 }, { "epoch": 2.75, "learning_rate": 0.00012822026212202443, "loss": 0.0076, "step": 13528 }, { "epoch": 2.75, "learning_rate": 0.00012820108237134042, "loss": 0.0008, "step": 13529 }, { "epoch": 2.75, "learning_rate": 0.00012818190298473955, "loss": 0.0151, "step": 13530 }, { "epoch": 2.76, "learning_rate": 0.000128162723962542, "loss": 0.0096, "step": 13531 }, { "epoch": 2.76, "learning_rate": 0.0001281435453050683, "loss": 0.0094, "step": 13532 }, { "epoch": 2.76, "learning_rate": 0.00012812436701263856, "loss": 0.0085, "step": 13533 }, { "epoch": 2.76, "learning_rate": 0.00012810518908557323, "loss": 0.022, "step": 13534 }, { "epoch": 2.76, "learning_rate": 0.00012808601152419254, "loss": 0.0014, "step": 13535 }, { "epoch": 2.76, "learning_rate": 0.00012806683432881684, "loss": 0.0089, "step": 13536 }, { "epoch": 2.76, "learning_rate": 0.00012804765749976639, "loss": 0.0068, "step": 13537 }, { "epoch": 2.76, "learning_rate": 0.00012802848103736153, "loss": 0.0078, "step": 13538 }, { "epoch": 2.76, "learning_rate": 0.00012800930494192246, "loss": 0.0014, "step": 13539 }, { "epoch": 2.76, "learning_rate": 0.00012799012921376957, "loss": 0.0039, "step": 13540 }, { "epoch": 2.76, "learning_rate": 0.00012797095385322306, "loss": 0.0077, "step": 13541 }, { "epoch": 2.76, "learning_rate": 0.00012795177886060316, "loss": 0.003, "step": 13542 }, { "epoch": 2.76, "learning_rate": 0.00012793260423623023, "loss": 0.0155, "step": 13543 }, { "epoch": 2.76, "learning_rate": 0.00012791342998042437, "loss": 0.0213, "step": 13544 }, { "epoch": 2.76, "learning_rate": 0.000127894256093506, "loss": 0.0269, "step": 13545 }, { "epoch": 2.76, "learning_rate": 0.00012787508257579527, "loss": 0.002, "step": 13546 }, { "epoch": 2.76, "learning_rate": 0.0001278559094276124, "loss": 0.0097, "step": 13547 }, { "epoch": 2.76, "learning_rate": 0.00012783673664927767, "loss": 0.0007, "step": 13548 }, { "epoch": 2.76, "learning_rate": 0.0001278175642411112, "loss": 0.0042, "step": 13549 }, { "epoch": 2.76, "learning_rate": 0.0001277983922034334, "loss": 0.0274, "step": 13550 }, { "epoch": 2.76, "learning_rate": 0.00012777922053656434, "loss": 0.0077, "step": 13551 }, { "epoch": 2.76, "learning_rate": 0.00012776004924082413, "loss": 0.0126, "step": 13552 }, { "epoch": 2.76, "learning_rate": 0.00012774087831653319, "loss": 0.023, "step": 13553 }, { "epoch": 2.76, "learning_rate": 0.0001277217077640115, "loss": 0.0086, "step": 13554 }, { "epoch": 2.76, "learning_rate": 0.00012770253758357945, "loss": 0.0016, "step": 13555 }, { "epoch": 2.76, "learning_rate": 0.00012768336777555707, "loss": 0.0136, "step": 13556 }, { "epoch": 2.76, "learning_rate": 0.00012766419834026453, "loss": 0.0067, "step": 13557 }, { "epoch": 2.76, "learning_rate": 0.0001276450292780221, "loss": 0.0202, "step": 13558 }, { "epoch": 2.76, "learning_rate": 0.00012762586058914983, "loss": 0.0257, "step": 13559 }, { "epoch": 2.76, "learning_rate": 0.000127606692273968, "loss": 0.0043, "step": 13560 }, { "epoch": 2.76, "learning_rate": 0.00012758752433279663, "loss": 0.0105, "step": 13561 }, { "epoch": 2.76, "learning_rate": 0.00012756835676595588, "loss": 0.008, "step": 13562 }, { "epoch": 2.76, "learning_rate": 0.00012754918957376597, "loss": 0.0051, "step": 13563 }, { "epoch": 2.76, "learning_rate": 0.00012753002275654694, "loss": 0.0025, "step": 13564 }, { "epoch": 2.76, "learning_rate": 0.00012751085631461894, "loss": 0.0016, "step": 13565 }, { "epoch": 2.76, "learning_rate": 0.0001274916902483021, "loss": 0.005, "step": 13566 }, { "epoch": 2.76, "learning_rate": 0.0001274725245579165, "loss": 0.0049, "step": 13567 }, { "epoch": 2.76, "learning_rate": 0.0001274533592437823, "loss": 0.0025, "step": 13568 }, { "epoch": 2.76, "learning_rate": 0.00012743419430621958, "loss": 0.0011, "step": 13569 }, { "epoch": 2.76, "learning_rate": 0.00012741502974554834, "loss": 0.0108, "step": 13570 }, { "epoch": 2.76, "learning_rate": 0.0001273958655620888, "loss": 0.0022, "step": 13571 }, { "epoch": 2.76, "learning_rate": 0.0001273767017561609, "loss": 0.005, "step": 13572 }, { "epoch": 2.76, "learning_rate": 0.00012735753832808486, "loss": 0.0008, "step": 13573 }, { "epoch": 2.76, "learning_rate": 0.00012733837527818066, "loss": 0.0119, "step": 13574 }, { "epoch": 2.76, "learning_rate": 0.00012731921260676835, "loss": 0.0046, "step": 13575 }, { "epoch": 2.76, "learning_rate": 0.00012730005031416798, "loss": 0.0045, "step": 13576 }, { "epoch": 2.76, "learning_rate": 0.00012728088840069965, "loss": 0.0065, "step": 13577 }, { "epoch": 2.76, "learning_rate": 0.00012726172686668334, "loss": 0.011, "step": 13578 }, { "epoch": 2.76, "learning_rate": 0.00012724256571243917, "loss": 0.0047, "step": 13579 }, { "epoch": 2.77, "learning_rate": 0.00012722340493828704, "loss": 0.0009, "step": 13580 }, { "epoch": 2.77, "learning_rate": 0.0001272042445445471, "loss": 0.0088, "step": 13581 }, { "epoch": 2.77, "learning_rate": 0.00012718508453153925, "loss": 0.0217, "step": 13582 }, { "epoch": 2.77, "learning_rate": 0.00012716592489958362, "loss": 0.0062, "step": 13583 }, { "epoch": 2.77, "learning_rate": 0.00012714676564900014, "loss": 0.0165, "step": 13584 }, { "epoch": 2.77, "learning_rate": 0.00012712760678010876, "loss": 0.0122, "step": 13585 }, { "epoch": 2.77, "learning_rate": 0.00012710844829322954, "loss": 0.007, "step": 13586 }, { "epoch": 2.77, "learning_rate": 0.00012708929018868245, "loss": 0.007, "step": 13587 }, { "epoch": 2.77, "learning_rate": 0.00012707013246678745, "loss": 0.0067, "step": 13588 }, { "epoch": 2.77, "learning_rate": 0.00012705097512786458, "loss": 0.006, "step": 13589 }, { "epoch": 2.77, "learning_rate": 0.00012703181817223365, "loss": 0.0035, "step": 13590 }, { "epoch": 2.77, "learning_rate": 0.0001270126616002148, "loss": 0.0077, "step": 13591 }, { "epoch": 2.77, "learning_rate": 0.0001269935054121279, "loss": 0.006, "step": 13592 }, { "epoch": 2.77, "learning_rate": 0.00012697434960829278, "loss": 0.0127, "step": 13593 }, { "epoch": 2.77, "learning_rate": 0.0001269551941890296, "loss": 0.0141, "step": 13594 }, { "epoch": 2.77, "learning_rate": 0.00012693603915465805, "loss": 0.0078, "step": 13595 }, { "epoch": 2.77, "learning_rate": 0.0001269168845054983, "loss": 0.0062, "step": 13596 }, { "epoch": 2.77, "learning_rate": 0.0001268977302418701, "loss": 0.0358, "step": 13597 }, { "epoch": 2.77, "learning_rate": 0.0001268785763640934, "loss": 0.001, "step": 13598 }, { "epoch": 2.77, "learning_rate": 0.00012685942287248816, "loss": 0.0032, "step": 13599 }, { "epoch": 2.77, "learning_rate": 0.00012684026976737418, "loss": 0.0141, "step": 13600 }, { "epoch": 2.77, "learning_rate": 0.0001268211170490715, "loss": 0.0128, "step": 13601 }, { "epoch": 2.77, "learning_rate": 0.0001268019647178999, "loss": 0.0203, "step": 13602 }, { "epoch": 2.77, "learning_rate": 0.00012678281277417918, "loss": 0.0043, "step": 13603 }, { "epoch": 2.77, "learning_rate": 0.00012676366121822943, "loss": 0.0263, "step": 13604 }, { "epoch": 2.77, "learning_rate": 0.0001267445100503703, "loss": 0.0072, "step": 13605 }, { "epoch": 2.77, "learning_rate": 0.00012672535927092183, "loss": 0.0131, "step": 13606 }, { "epoch": 2.77, "learning_rate": 0.00012670620888020377, "loss": 0.0079, "step": 13607 }, { "epoch": 2.77, "learning_rate": 0.00012668705887853597, "loss": 0.0021, "step": 13608 }, { "epoch": 2.77, "learning_rate": 0.0001266679092662383, "loss": 0.0091, "step": 13609 }, { "epoch": 2.77, "learning_rate": 0.00012664876004363058, "loss": 0.0148, "step": 13610 }, { "epoch": 2.77, "learning_rate": 0.00012662961121103267, "loss": 0.0052, "step": 13611 }, { "epoch": 2.77, "learning_rate": 0.0001266104627687644, "loss": 0.0024, "step": 13612 }, { "epoch": 2.77, "learning_rate": 0.00012659131471714547, "loss": 0.0048, "step": 13613 }, { "epoch": 2.77, "learning_rate": 0.00012657216705649584, "loss": 0.0055, "step": 13614 }, { "epoch": 2.77, "learning_rate": 0.00012655301978713526, "loss": 0.0143, "step": 13615 }, { "epoch": 2.77, "learning_rate": 0.00012653387290938344, "loss": 0.0116, "step": 13616 }, { "epoch": 2.77, "learning_rate": 0.00012651472642356024, "loss": 0.0115, "step": 13617 }, { "epoch": 2.77, "learning_rate": 0.00012649558032998547, "loss": 0.0083, "step": 13618 }, { "epoch": 2.77, "learning_rate": 0.00012647643462897887, "loss": 0.0052, "step": 13619 }, { "epoch": 2.77, "learning_rate": 0.00012645728932086022, "loss": 0.0021, "step": 13620 }, { "epoch": 2.77, "learning_rate": 0.00012643814440594926, "loss": 0.0248, "step": 13621 }, { "epoch": 2.77, "learning_rate": 0.0001264189998845658, "loss": 0.0011, "step": 13622 }, { "epoch": 2.77, "learning_rate": 0.0001263998557570295, "loss": 0.0278, "step": 13623 }, { "epoch": 2.77, "learning_rate": 0.0001263807120236602, "loss": 0.0019, "step": 13624 }, { "epoch": 2.77, "learning_rate": 0.00012636156868477765, "loss": 0.0036, "step": 13625 }, { "epoch": 2.77, "learning_rate": 0.0001263424257407014, "loss": 0.0084, "step": 13626 }, { "epoch": 2.77, "learning_rate": 0.0001263232831917514, "loss": 0.0096, "step": 13627 }, { "epoch": 2.77, "learning_rate": 0.00012630414103824718, "loss": 0.0113, "step": 13628 }, { "epoch": 2.78, "learning_rate": 0.00012628499928050857, "loss": 0.0043, "step": 13629 }, { "epoch": 2.78, "learning_rate": 0.00012626585791885526, "loss": 0.0045, "step": 13630 }, { "epoch": 2.78, "learning_rate": 0.00012624671695360686, "loss": 0.0041, "step": 13631 }, { "epoch": 2.78, "learning_rate": 0.0001262275763850832, "loss": 0.0115, "step": 13632 }, { "epoch": 2.78, "learning_rate": 0.00012620843621360383, "loss": 0.0261, "step": 13633 }, { "epoch": 2.78, "learning_rate": 0.00012618929643948854, "loss": 0.0043, "step": 13634 }, { "epoch": 2.78, "learning_rate": 0.00012617015706305694, "loss": 0.0073, "step": 13635 }, { "epoch": 2.78, "learning_rate": 0.00012615101808462865, "loss": 0.0105, "step": 13636 }, { "epoch": 2.78, "learning_rate": 0.0001261318795045234, "loss": 0.0052, "step": 13637 }, { "epoch": 2.78, "learning_rate": 0.00012611274132306083, "loss": 0.004, "step": 13638 }, { "epoch": 2.78, "learning_rate": 0.00012609360354056055, "loss": 0.0014, "step": 13639 }, { "epoch": 2.78, "learning_rate": 0.00012607446615734225, "loss": 0.008, "step": 13640 }, { "epoch": 2.78, "learning_rate": 0.00012605532917372547, "loss": 0.0094, "step": 13641 }, { "epoch": 2.78, "learning_rate": 0.00012603619259002994, "loss": 0.004, "step": 13642 }, { "epoch": 2.78, "learning_rate": 0.00012601705640657523, "loss": 0.008, "step": 13643 }, { "epoch": 2.78, "learning_rate": 0.0001259979206236809, "loss": 0.0072, "step": 13644 }, { "epoch": 2.78, "learning_rate": 0.00012597878524166667, "loss": 0.0049, "step": 13645 }, { "epoch": 2.78, "learning_rate": 0.000125959650260852, "loss": 0.0029, "step": 13646 }, { "epoch": 2.78, "learning_rate": 0.00012594051568155662, "loss": 0.003, "step": 13647 }, { "epoch": 2.78, "learning_rate": 0.0001259213815041, "loss": 0.017, "step": 13648 }, { "epoch": 2.78, "learning_rate": 0.00012590224772880178, "loss": 0.0055, "step": 13649 }, { "epoch": 2.78, "learning_rate": 0.00012588311435598147, "loss": 0.0029, "step": 13650 }, { "epoch": 2.78, "learning_rate": 0.00012586398138595867, "loss": 0.0069, "step": 13651 }, { "epoch": 2.78, "learning_rate": 0.00012584484881905303, "loss": 0.0045, "step": 13652 }, { "epoch": 2.78, "learning_rate": 0.00012582571665558395, "loss": 0.0055, "step": 13653 }, { "epoch": 2.78, "learning_rate": 0.00012580658489587103, "loss": 0.0104, "step": 13654 }, { "epoch": 2.78, "learning_rate": 0.00012578745354023383, "loss": 0.0066, "step": 13655 }, { "epoch": 2.78, "learning_rate": 0.00012576832258899182, "loss": 0.0122, "step": 13656 }, { "epoch": 2.78, "learning_rate": 0.00012574919204246465, "loss": 0.0061, "step": 13657 }, { "epoch": 2.78, "learning_rate": 0.00012573006190097168, "loss": 0.0043, "step": 13658 }, { "epoch": 2.78, "learning_rate": 0.00012571093216483248, "loss": 0.0056, "step": 13659 }, { "epoch": 2.78, "learning_rate": 0.0001256918028343666, "loss": 0.0188, "step": 13660 }, { "epoch": 2.78, "learning_rate": 0.00012567267390989348, "loss": 0.0006, "step": 13661 }, { "epoch": 2.78, "learning_rate": 0.00012565354539173263, "loss": 0.0466, "step": 13662 }, { "epoch": 2.78, "learning_rate": 0.00012563441728020354, "loss": 0.0147, "step": 13663 }, { "epoch": 2.78, "learning_rate": 0.0001256152895756256, "loss": 0.0065, "step": 13664 }, { "epoch": 2.78, "learning_rate": 0.00012559616227831848, "loss": 0.0058, "step": 13665 }, { "epoch": 2.78, "learning_rate": 0.00012557703538860148, "loss": 0.0037, "step": 13666 }, { "epoch": 2.78, "learning_rate": 0.00012555790890679403, "loss": 0.0076, "step": 13667 }, { "epoch": 2.78, "learning_rate": 0.0001255387828332157, "loss": 0.0046, "step": 13668 }, { "epoch": 2.78, "learning_rate": 0.0001255196571681858, "loss": 0.0042, "step": 13669 }, { "epoch": 2.78, "learning_rate": 0.00012550053191202385, "loss": 0.004, "step": 13670 }, { "epoch": 2.78, "learning_rate": 0.00012548140706504933, "loss": 0.02, "step": 13671 }, { "epoch": 2.78, "learning_rate": 0.00012546228262758153, "loss": 0.0148, "step": 13672 }, { "epoch": 2.78, "learning_rate": 0.00012544315859993997, "loss": 0.0098, "step": 13673 }, { "epoch": 2.78, "learning_rate": 0.00012542403498244395, "loss": 0.0193, "step": 13674 }, { "epoch": 2.78, "learning_rate": 0.00012540491177541303, "loss": 0.0021, "step": 13675 }, { "epoch": 2.78, "learning_rate": 0.0001253857889791665, "loss": 0.0025, "step": 13676 }, { "epoch": 2.78, "learning_rate": 0.00012536666659402368, "loss": 0.0037, "step": 13677 }, { "epoch": 2.79, "learning_rate": 0.00012534754462030411, "loss": 0.0162, "step": 13678 }, { "epoch": 2.79, "learning_rate": 0.000125328423058327, "loss": 0.0065, "step": 13679 }, { "epoch": 2.79, "learning_rate": 0.00012530930190841186, "loss": 0.01, "step": 13680 }, { "epoch": 2.79, "learning_rate": 0.00012529018117087796, "loss": 0.0084, "step": 13681 }, { "epoch": 2.79, "learning_rate": 0.00012527106084604463, "loss": 0.0108, "step": 13682 }, { "epoch": 2.79, "learning_rate": 0.00012525194093423133, "loss": 0.0086, "step": 13683 }, { "epoch": 2.79, "learning_rate": 0.00012523282143575727, "loss": 0.0016, "step": 13684 }, { "epoch": 2.79, "learning_rate": 0.00012521370235094191, "loss": 0.008, "step": 13685 }, { "epoch": 2.79, "learning_rate": 0.00012519458368010451, "loss": 0.0031, "step": 13686 }, { "epoch": 2.79, "learning_rate": 0.00012517546542356432, "loss": 0.0228, "step": 13687 }, { "epoch": 2.79, "learning_rate": 0.00012515634758164082, "loss": 0.0163, "step": 13688 }, { "epoch": 2.79, "learning_rate": 0.0001251372301546531, "loss": 0.0028, "step": 13689 }, { "epoch": 2.79, "learning_rate": 0.00012511811314292064, "loss": 0.0076, "step": 13690 }, { "epoch": 2.79, "learning_rate": 0.00012509899654676262, "loss": 0.0037, "step": 13691 }, { "epoch": 2.79, "learning_rate": 0.00012507988036649834, "loss": 0.0113, "step": 13692 }, { "epoch": 2.79, "learning_rate": 0.00012506076460244716, "loss": 0.0159, "step": 13693 }, { "epoch": 2.79, "learning_rate": 0.00012504164925492827, "loss": 0.0103, "step": 13694 }, { "epoch": 2.79, "learning_rate": 0.0001250225343242609, "loss": 0.0013, "step": 13695 }, { "epoch": 2.79, "learning_rate": 0.00012500341981076446, "loss": 0.0073, "step": 13696 }, { "epoch": 2.79, "learning_rate": 0.00012498430571475797, "loss": 0.0096, "step": 13697 }, { "epoch": 2.79, "learning_rate": 0.00012496519203656088, "loss": 0.0031, "step": 13698 }, { "epoch": 2.79, "learning_rate": 0.00012494607877649232, "loss": 0.0044, "step": 13699 }, { "epoch": 2.79, "learning_rate": 0.0001249269659348715, "loss": 0.0005, "step": 13700 }, { "epoch": 2.79, "learning_rate": 0.00012490785351201774, "loss": 0.0043, "step": 13701 }, { "epoch": 2.79, "learning_rate": 0.00012488874150825015, "loss": 0.0094, "step": 13702 }, { "epoch": 2.79, "learning_rate": 0.00012486962992388798, "loss": 0.0029, "step": 13703 }, { "epoch": 2.79, "learning_rate": 0.00012485051875925045, "loss": 0.0043, "step": 13704 }, { "epoch": 2.79, "learning_rate": 0.00012483140801465667, "loss": 0.0004, "step": 13705 }, { "epoch": 2.79, "learning_rate": 0.00012481229769042596, "loss": 0.0058, "step": 13706 }, { "epoch": 2.79, "learning_rate": 0.00012479318778687738, "loss": 0.0025, "step": 13707 }, { "epoch": 2.79, "learning_rate": 0.0001247740783043302, "loss": 0.0183, "step": 13708 }, { "epoch": 2.79, "learning_rate": 0.00012475496924310348, "loss": 0.0118, "step": 13709 }, { "epoch": 2.79, "learning_rate": 0.0001247358606035164, "loss": 0.0055, "step": 13710 }, { "epoch": 2.79, "learning_rate": 0.0001247167523858882, "loss": 0.0086, "step": 13711 }, { "epoch": 2.79, "learning_rate": 0.00012469764459053793, "loss": 0.0082, "step": 13712 }, { "epoch": 2.79, "learning_rate": 0.00012467853721778472, "loss": 0.0103, "step": 13713 }, { "epoch": 2.79, "learning_rate": 0.00012465943026794782, "loss": 0.0024, "step": 13714 }, { "epoch": 2.79, "learning_rate": 0.00012464032374134618, "loss": 0.0054, "step": 13715 }, { "epoch": 2.79, "learning_rate": 0.00012462121763829906, "loss": 0.0115, "step": 13716 }, { "epoch": 2.79, "learning_rate": 0.00012460211195912553, "loss": 0.0095, "step": 13717 }, { "epoch": 2.79, "learning_rate": 0.00012458300670414461, "loss": 0.0041, "step": 13718 }, { "epoch": 2.79, "learning_rate": 0.00012456390187367552, "loss": 0.0121, "step": 13719 }, { "epoch": 2.79, "learning_rate": 0.00012454479746803722, "loss": 0.006, "step": 13720 }, { "epoch": 2.79, "learning_rate": 0.0001245256934875489, "loss": 0.0128, "step": 13721 }, { "epoch": 2.79, "learning_rate": 0.00012450658993252956, "loss": 0.0065, "step": 13722 }, { "epoch": 2.79, "learning_rate": 0.00012448748680329825, "loss": 0.0129, "step": 13723 }, { "epoch": 2.79, "learning_rate": 0.00012446838410017417, "loss": 0.0169, "step": 13724 }, { "epoch": 2.79, "learning_rate": 0.00012444928182347615, "loss": 0.0064, "step": 13725 }, { "epoch": 2.79, "learning_rate": 0.00012443017997352347, "loss": 0.0026, "step": 13726 }, { "epoch": 2.8, "learning_rate": 0.00012441107855063502, "loss": 0.0049, "step": 13727 }, { "epoch": 2.8, "learning_rate": 0.0001243919775551298, "loss": 0.0042, "step": 13728 }, { "epoch": 2.8, "learning_rate": 0.00012437287698732698, "loss": 0.0204, "step": 13729 }, { "epoch": 2.8, "learning_rate": 0.0001243537768475454, "loss": 0.0047, "step": 13730 }, { "epoch": 2.8, "learning_rate": 0.00012433467713610422, "loss": 0.0072, "step": 13731 }, { "epoch": 2.8, "learning_rate": 0.00012431557785332235, "loss": 0.0106, "step": 13732 }, { "epoch": 2.8, "learning_rate": 0.00012429647899951882, "loss": 0.011, "step": 13733 }, { "epoch": 2.8, "learning_rate": 0.00012427738057501261, "loss": 0.0079, "step": 13734 }, { "epoch": 2.8, "learning_rate": 0.00012425828258012266, "loss": 0.0035, "step": 13735 }, { "epoch": 2.8, "learning_rate": 0.00012423918501516806, "loss": 0.004, "step": 13736 }, { "epoch": 2.8, "learning_rate": 0.0001242200878804677, "loss": 0.005, "step": 13737 }, { "epoch": 2.8, "learning_rate": 0.00012420099117634045, "loss": 0.0333, "step": 13738 }, { "epoch": 2.8, "learning_rate": 0.0001241818949031054, "loss": 0.0059, "step": 13739 }, { "epoch": 2.8, "learning_rate": 0.00012416279906108147, "loss": 0.0124, "step": 13740 }, { "epoch": 2.8, "learning_rate": 0.00012414370365058748, "loss": 0.0047, "step": 13741 }, { "epoch": 2.8, "learning_rate": 0.00012412460867194253, "loss": 0.008, "step": 13742 }, { "epoch": 2.8, "learning_rate": 0.0001241055141254654, "loss": 0.0235, "step": 13743 }, { "epoch": 2.8, "learning_rate": 0.0001240864200114751, "loss": 0.0105, "step": 13744 }, { "epoch": 2.8, "learning_rate": 0.0001240673263302905, "loss": 0.0189, "step": 13745 }, { "epoch": 2.8, "learning_rate": 0.00012404823308223044, "loss": 0.0419, "step": 13746 }, { "epoch": 2.8, "learning_rate": 0.00012402914026761396, "loss": 0.0036, "step": 13747 }, { "epoch": 2.8, "learning_rate": 0.0001240100478867598, "loss": 0.0094, "step": 13748 }, { "epoch": 2.8, "learning_rate": 0.00012399095593998693, "loss": 0.0062, "step": 13749 }, { "epoch": 2.8, "learning_rate": 0.00012397186442761422, "loss": 0.0101, "step": 13750 }, { "epoch": 2.8, "learning_rate": 0.00012395277334996044, "loss": 0.0126, "step": 13751 }, { "epoch": 2.8, "learning_rate": 0.00012393368270734455, "loss": 0.0061, "step": 13752 }, { "epoch": 2.8, "learning_rate": 0.00012391459250008535, "loss": 0.005, "step": 13753 }, { "epoch": 2.8, "learning_rate": 0.00012389550272850168, "loss": 0.0134, "step": 13754 }, { "epoch": 2.8, "learning_rate": 0.00012387641339291246, "loss": 0.0011, "step": 13755 }, { "epoch": 2.8, "learning_rate": 0.00012385732449363636, "loss": 0.0071, "step": 13756 }, { "epoch": 2.8, "learning_rate": 0.00012383823603099236, "loss": 0.012, "step": 13757 }, { "epoch": 2.8, "learning_rate": 0.00012381914800529913, "loss": 0.002, "step": 13758 }, { "epoch": 2.8, "learning_rate": 0.0001238000604168756, "loss": 0.0038, "step": 13759 }, { "epoch": 2.8, "learning_rate": 0.00012378097326604055, "loss": 0.0062, "step": 13760 }, { "epoch": 2.8, "learning_rate": 0.00012376188655311267, "loss": 0.0047, "step": 13761 }, { "epoch": 2.8, "learning_rate": 0.00012374280027841088, "loss": 0.0042, "step": 13762 }, { "epoch": 2.8, "learning_rate": 0.00012372371444225382, "loss": 0.0047, "step": 13763 }, { "epoch": 2.8, "learning_rate": 0.0001237046290449603, "loss": 0.0117, "step": 13764 }, { "epoch": 2.8, "learning_rate": 0.0001236855440868492, "loss": 0.0029, "step": 13765 }, { "epoch": 2.8, "learning_rate": 0.00012366645956823913, "loss": 0.0132, "step": 13766 }, { "epoch": 2.8, "learning_rate": 0.00012364737548944895, "loss": 0.0188, "step": 13767 }, { "epoch": 2.8, "learning_rate": 0.00012362829185079733, "loss": 0.0066, "step": 13768 }, { "epoch": 2.8, "learning_rate": 0.00012360920865260296, "loss": 0.022, "step": 13769 }, { "epoch": 2.8, "learning_rate": 0.00012359012589518469, "loss": 0.0026, "step": 13770 }, { "epoch": 2.8, "learning_rate": 0.0001235710435788611, "loss": 0.0048, "step": 13771 }, { "epoch": 2.8, "learning_rate": 0.00012355196170395102, "loss": 0.0064, "step": 13772 }, { "epoch": 2.8, "learning_rate": 0.00012353288027077309, "loss": 0.0158, "step": 13773 }, { "epoch": 2.8, "learning_rate": 0.00012351379927964603, "loss": 0.0287, "step": 13774 }, { "epoch": 2.8, "learning_rate": 0.0001234947187308885, "loss": 0.0057, "step": 13775 }, { "epoch": 2.81, "learning_rate": 0.00012347563862481918, "loss": 0.0095, "step": 13776 }, { "epoch": 2.81, "learning_rate": 0.00012345655896175682, "loss": 0.0083, "step": 13777 }, { "epoch": 2.81, "learning_rate": 0.00012343747974202, "loss": 0.0027, "step": 13778 }, { "epoch": 2.81, "learning_rate": 0.0001234184009659274, "loss": 0.0101, "step": 13779 }, { "epoch": 2.81, "learning_rate": 0.00012339932263379772, "loss": 0.0055, "step": 13780 }, { "epoch": 2.81, "learning_rate": 0.0001233802447459495, "loss": 0.0016, "step": 13781 }, { "epoch": 2.81, "learning_rate": 0.00012336116730270148, "loss": 0.0044, "step": 13782 }, { "epoch": 2.81, "learning_rate": 0.00012334209030437224, "loss": 0.0123, "step": 13783 }, { "epoch": 2.81, "learning_rate": 0.00012332301375128044, "loss": 0.0163, "step": 13784 }, { "epoch": 2.81, "learning_rate": 0.00012330393764374464, "loss": 0.0283, "step": 13785 }, { "epoch": 2.81, "learning_rate": 0.0001232848619820835, "loss": 0.0137, "step": 13786 }, { "epoch": 2.81, "learning_rate": 0.00012326578676661551, "loss": 0.0155, "step": 13787 }, { "epoch": 2.81, "learning_rate": 0.00012324671199765946, "loss": 0.0103, "step": 13788 }, { "epoch": 2.81, "learning_rate": 0.00012322763767553372, "loss": 0.0037, "step": 13789 }, { "epoch": 2.81, "learning_rate": 0.00012320856380055705, "loss": 0.0033, "step": 13790 }, { "epoch": 2.81, "learning_rate": 0.00012318949037304794, "loss": 0.0003, "step": 13791 }, { "epoch": 2.81, "learning_rate": 0.00012317041739332487, "loss": 0.008, "step": 13792 }, { "epoch": 2.81, "learning_rate": 0.00012315134486170655, "loss": 0.0139, "step": 13793 }, { "epoch": 2.81, "learning_rate": 0.00012313227277851137, "loss": 0.0052, "step": 13794 }, { "epoch": 2.81, "learning_rate": 0.00012311320114405798, "loss": 0.0157, "step": 13795 }, { "epoch": 2.81, "learning_rate": 0.00012309412995866495, "loss": 0.0036, "step": 13796 }, { "epoch": 2.81, "learning_rate": 0.00012307505922265065, "loss": 0.0103, "step": 13797 }, { "epoch": 2.81, "learning_rate": 0.00012305598893633374, "loss": 0.003, "step": 13798 }, { "epoch": 2.81, "learning_rate": 0.00012303691910003263, "loss": 0.0116, "step": 13799 }, { "epoch": 2.81, "learning_rate": 0.00012301784971406593, "loss": 0.0076, "step": 13800 }, { "epoch": 2.81, "learning_rate": 0.00012299878077875207, "loss": 0.01, "step": 13801 }, { "epoch": 2.81, "learning_rate": 0.00012297971229440947, "loss": 0.0015, "step": 13802 }, { "epoch": 2.81, "learning_rate": 0.00012296064426135672, "loss": 0.0149, "step": 13803 }, { "epoch": 2.81, "learning_rate": 0.00012294157667991224, "loss": 0.0015, "step": 13804 }, { "epoch": 2.81, "learning_rate": 0.00012292250955039453, "loss": 0.003, "step": 13805 }, { "epoch": 2.81, "learning_rate": 0.00012290344287312202, "loss": 0.0088, "step": 13806 }, { "epoch": 2.81, "learning_rate": 0.00012288437664841309, "loss": 0.0064, "step": 13807 }, { "epoch": 2.81, "learning_rate": 0.00012286531087658635, "loss": 0.0134, "step": 13808 }, { "epoch": 2.81, "learning_rate": 0.00012284624555796006, "loss": 0.0014, "step": 13809 }, { "epoch": 2.81, "learning_rate": 0.0001228271806928528, "loss": 0.0117, "step": 13810 }, { "epoch": 2.81, "learning_rate": 0.0001228081162815829, "loss": 0.0036, "step": 13811 }, { "epoch": 2.81, "learning_rate": 0.00012278905232446875, "loss": 0.0035, "step": 13812 }, { "epoch": 2.81, "learning_rate": 0.00012276998882182884, "loss": 0.0092, "step": 13813 }, { "epoch": 2.81, "learning_rate": 0.00012275092577398146, "loss": 0.0072, "step": 13814 }, { "epoch": 2.81, "learning_rate": 0.0001227318631812451, "loss": 0.0041, "step": 13815 }, { "epoch": 2.81, "learning_rate": 0.00012271280104393805, "loss": 0.0056, "step": 13816 }, { "epoch": 2.81, "learning_rate": 0.00012269373936237875, "loss": 0.0098, "step": 13817 }, { "epoch": 2.81, "learning_rate": 0.00012267467813688557, "loss": 0.0027, "step": 13818 }, { "epoch": 2.81, "learning_rate": 0.00012265561736777688, "loss": 0.0034, "step": 13819 }, { "epoch": 2.81, "learning_rate": 0.0001226365570553709, "loss": 0.0053, "step": 13820 }, { "epoch": 2.81, "learning_rate": 0.00012261749719998615, "loss": 0.0015, "step": 13821 }, { "epoch": 2.81, "learning_rate": 0.00012259843780194083, "loss": 0.0045, "step": 13822 }, { "epoch": 2.81, "learning_rate": 0.00012257937886155337, "loss": 0.0111, "step": 13823 }, { "epoch": 2.81, "learning_rate": 0.000122560320379142, "loss": 0.0045, "step": 13824 }, { "epoch": 2.82, "learning_rate": 0.0001225412623550251, "loss": 0.008, "step": 13825 }, { "epoch": 2.82, "learning_rate": 0.00012252220478952094, "loss": 0.0069, "step": 13826 }, { "epoch": 2.82, "learning_rate": 0.00012250314768294784, "loss": 0.0012, "step": 13827 }, { "epoch": 2.82, "learning_rate": 0.00012248409103562404, "loss": 0.0256, "step": 13828 }, { "epoch": 2.82, "learning_rate": 0.00012246503484786793, "loss": 0.0024, "step": 13829 }, { "epoch": 2.82, "learning_rate": 0.00012244597911999764, "loss": 0.0074, "step": 13830 }, { "epoch": 2.82, "learning_rate": 0.00012242692385233157, "loss": 0.0009, "step": 13831 }, { "epoch": 2.82, "learning_rate": 0.00012240786904518786, "loss": 0.0275, "step": 13832 }, { "epoch": 2.82, "learning_rate": 0.00012238881469888487, "loss": 0.0135, "step": 13833 }, { "epoch": 2.82, "learning_rate": 0.00012236976081374083, "loss": 0.0077, "step": 13834 }, { "epoch": 2.82, "learning_rate": 0.00012235070739007386, "loss": 0.0162, "step": 13835 }, { "epoch": 2.82, "learning_rate": 0.00012233165442820227, "loss": 0.0102, "step": 13836 }, { "epoch": 2.82, "learning_rate": 0.00012231260192844433, "loss": 0.0095, "step": 13837 }, { "epoch": 2.82, "learning_rate": 0.00012229354989111814, "loss": 0.0132, "step": 13838 }, { "epoch": 2.82, "learning_rate": 0.00012227449831654204, "loss": 0.01, "step": 13839 }, { "epoch": 2.82, "learning_rate": 0.00012225544720503409, "loss": 0.0076, "step": 13840 }, { "epoch": 2.82, "learning_rate": 0.0001222363965569126, "loss": 0.0115, "step": 13841 }, { "epoch": 2.82, "learning_rate": 0.0001222173463724957, "loss": 0.0049, "step": 13842 }, { "epoch": 2.82, "learning_rate": 0.0001221982966521015, "loss": 0.019, "step": 13843 }, { "epoch": 2.82, "learning_rate": 0.00012217924739604827, "loss": 0.0048, "step": 13844 }, { "epoch": 2.82, "learning_rate": 0.00012216019860465405, "loss": 0.0106, "step": 13845 }, { "epoch": 2.82, "learning_rate": 0.00012214115027823718, "loss": 0.0042, "step": 13846 }, { "epoch": 2.82, "learning_rate": 0.00012212210241711562, "loss": 0.0127, "step": 13847 }, { "epoch": 2.82, "learning_rate": 0.00012210305502160753, "loss": 0.0051, "step": 13848 }, { "epoch": 2.82, "learning_rate": 0.00012208400809203117, "loss": 0.009, "step": 13849 }, { "epoch": 2.82, "learning_rate": 0.0001220649616287045, "loss": 0.0049, "step": 13850 }, { "epoch": 2.82, "learning_rate": 0.00012204591563194575, "loss": 0.0122, "step": 13851 }, { "epoch": 2.82, "learning_rate": 0.00012202687010207299, "loss": 0.0113, "step": 13852 }, { "epoch": 2.82, "learning_rate": 0.00012200782503940424, "loss": 0.0064, "step": 13853 }, { "epoch": 2.82, "learning_rate": 0.0001219887804442577, "loss": 0.0065, "step": 13854 }, { "epoch": 2.82, "learning_rate": 0.00012196973631695135, "loss": 0.0071, "step": 13855 }, { "epoch": 2.82, "learning_rate": 0.00012195069265780338, "loss": 0.019, "step": 13856 }, { "epoch": 2.82, "learning_rate": 0.00012193164946713175, "loss": 0.0048, "step": 13857 }, { "epoch": 2.82, "learning_rate": 0.00012191260674525455, "loss": 0.0219, "step": 13858 }, { "epoch": 2.82, "learning_rate": 0.00012189356449248985, "loss": 0.0039, "step": 13859 }, { "epoch": 2.82, "learning_rate": 0.00012187452270915571, "loss": 0.0052, "step": 13860 }, { "epoch": 2.82, "learning_rate": 0.00012185548139557006, "loss": 0.0155, "step": 13861 }, { "epoch": 2.82, "learning_rate": 0.00012183644055205107, "loss": 0.0051, "step": 13862 }, { "epoch": 2.82, "learning_rate": 0.00012181740017891662, "loss": 0.0041, "step": 13863 }, { "epoch": 2.82, "learning_rate": 0.00012179836027648484, "loss": 0.0063, "step": 13864 }, { "epoch": 2.82, "learning_rate": 0.00012177932084507367, "loss": 0.0096, "step": 13865 }, { "epoch": 2.82, "learning_rate": 0.00012176028188500107, "loss": 0.0031, "step": 13866 }, { "epoch": 2.82, "learning_rate": 0.0001217412433965851, "loss": 0.0041, "step": 13867 }, { "epoch": 2.82, "learning_rate": 0.00012172220538014369, "loss": 0.0077, "step": 13868 }, { "epoch": 2.82, "learning_rate": 0.00012170316783599483, "loss": 0.0124, "step": 13869 }, { "epoch": 2.82, "learning_rate": 0.00012168413076445654, "loss": 0.0012, "step": 13870 }, { "epoch": 2.82, "learning_rate": 0.00012166509416584661, "loss": 0.007, "step": 13871 }, { "epoch": 2.82, "learning_rate": 0.0001216460580404832, "loss": 0.0227, "step": 13872 }, { "epoch": 2.82, "learning_rate": 0.00012162702238868405, "loss": 0.0055, "step": 13873 }, { "epoch": 2.83, "learning_rate": 0.00012160798721076727, "loss": 0.0143, "step": 13874 }, { "epoch": 2.83, "learning_rate": 0.00012158895250705068, "loss": 0.0089, "step": 13875 }, { "epoch": 2.83, "learning_rate": 0.00012156991827785214, "loss": 0.0123, "step": 13876 }, { "epoch": 2.83, "learning_rate": 0.00012155088452348968, "loss": 0.0126, "step": 13877 }, { "epoch": 2.83, "learning_rate": 0.00012153185124428114, "loss": 0.0035, "step": 13878 }, { "epoch": 2.83, "learning_rate": 0.00012151281844054443, "loss": 0.0036, "step": 13879 }, { "epoch": 2.83, "learning_rate": 0.00012149378611259745, "loss": 0.0223, "step": 13880 }, { "epoch": 2.83, "learning_rate": 0.000121474754260758, "loss": 0.0039, "step": 13881 }, { "epoch": 2.83, "learning_rate": 0.00012145572288534405, "loss": 0.0053, "step": 13882 }, { "epoch": 2.83, "learning_rate": 0.00012143669198667335, "loss": 0.0067, "step": 13883 }, { "epoch": 2.83, "learning_rate": 0.00012141766156506387, "loss": 0.0132, "step": 13884 }, { "epoch": 2.83, "learning_rate": 0.0001213986316208334, "loss": 0.0119, "step": 13885 }, { "epoch": 2.83, "learning_rate": 0.00012137960215429971, "loss": 0.0034, "step": 13886 }, { "epoch": 2.83, "learning_rate": 0.00012136057316578075, "loss": 0.0095, "step": 13887 }, { "epoch": 2.83, "learning_rate": 0.00012134154465559424, "loss": 0.0054, "step": 13888 }, { "epoch": 2.83, "learning_rate": 0.000121322516624058, "loss": 0.0146, "step": 13889 }, { "epoch": 2.83, "learning_rate": 0.00012130348907148994, "loss": 0.0041, "step": 13890 }, { "epoch": 2.83, "learning_rate": 0.0001212844619982077, "loss": 0.0117, "step": 13891 }, { "epoch": 2.83, "learning_rate": 0.00012126543540452924, "loss": 0.0084, "step": 13892 }, { "epoch": 2.83, "learning_rate": 0.00012124640929077222, "loss": 0.0129, "step": 13893 }, { "epoch": 2.83, "learning_rate": 0.00012122738365725439, "loss": 0.0097, "step": 13894 }, { "epoch": 2.83, "learning_rate": 0.00012120835850429363, "loss": 0.0156, "step": 13895 }, { "epoch": 2.83, "learning_rate": 0.00012118933383220757, "loss": 0.0154, "step": 13896 }, { "epoch": 2.83, "learning_rate": 0.00012117030964131409, "loss": 0.0048, "step": 13897 }, { "epoch": 2.83, "learning_rate": 0.00012115128593193081, "loss": 0.0042, "step": 13898 }, { "epoch": 2.83, "learning_rate": 0.00012113226270437551, "loss": 0.0023, "step": 13899 }, { "epoch": 2.83, "learning_rate": 0.00012111323995896592, "loss": 0.0038, "step": 13900 }, { "epoch": 2.83, "learning_rate": 0.00012109421769601972, "loss": 0.0023, "step": 13901 }, { "epoch": 2.83, "learning_rate": 0.00012107519591585472, "loss": 0.016, "step": 13902 }, { "epoch": 2.83, "learning_rate": 0.00012105617461878853, "loss": 0.0052, "step": 13903 }, { "epoch": 2.83, "learning_rate": 0.0001210371538051388, "loss": 0.0134, "step": 13904 }, { "epoch": 2.83, "learning_rate": 0.00012101813347522335, "loss": 0.0223, "step": 13905 }, { "epoch": 2.83, "learning_rate": 0.0001209991136293597, "loss": 0.0169, "step": 13906 }, { "epoch": 2.83, "learning_rate": 0.00012098009426786567, "loss": 0.0082, "step": 13907 }, { "epoch": 2.83, "learning_rate": 0.0001209610753910588, "loss": 0.0257, "step": 13908 }, { "epoch": 2.83, "learning_rate": 0.00012094205699925679, "loss": 0.033, "step": 13909 }, { "epoch": 2.83, "learning_rate": 0.0001209230390927773, "loss": 0.0008, "step": 13910 }, { "epoch": 2.83, "learning_rate": 0.00012090402167193795, "loss": 0.0004, "step": 13911 }, { "epoch": 2.83, "learning_rate": 0.00012088500473705629, "loss": 0.0072, "step": 13912 }, { "epoch": 2.83, "learning_rate": 0.00012086598828845009, "loss": 0.0065, "step": 13913 }, { "epoch": 2.83, "learning_rate": 0.00012084697232643683, "loss": 0.0149, "step": 13914 }, { "epoch": 2.83, "learning_rate": 0.0001208279568513342, "loss": 0.0152, "step": 13915 }, { "epoch": 2.83, "learning_rate": 0.00012080894186345977, "loss": 0.0028, "step": 13916 }, { "epoch": 2.83, "learning_rate": 0.00012078992736313104, "loss": 0.0092, "step": 13917 }, { "epoch": 2.83, "learning_rate": 0.00012077091335066574, "loss": 0.0051, "step": 13918 }, { "epoch": 2.83, "learning_rate": 0.00012075189982638128, "loss": 0.0143, "step": 13919 }, { "epoch": 2.83, "learning_rate": 0.00012073288679059535, "loss": 0.0074, "step": 13920 }, { "epoch": 2.83, "learning_rate": 0.00012071387424362546, "loss": 0.0074, "step": 13921 }, { "epoch": 2.83, "learning_rate": 0.00012069486218578912, "loss": 0.0059, "step": 13922 }, { "epoch": 2.83, "learning_rate": 0.00012067585061740395, "loss": 0.0186, "step": 13923 }, { "epoch": 2.84, "learning_rate": 0.00012065683953878737, "loss": 0.0105, "step": 13924 }, { "epoch": 2.84, "learning_rate": 0.000120637828950257, "loss": 0.0039, "step": 13925 }, { "epoch": 2.84, "learning_rate": 0.00012061881885213035, "loss": 0.0093, "step": 13926 }, { "epoch": 2.84, "learning_rate": 0.00012059980924472478, "loss": 0.0021, "step": 13927 }, { "epoch": 2.84, "learning_rate": 0.000120580800128358, "loss": 0.0025, "step": 13928 }, { "epoch": 2.84, "learning_rate": 0.0001205617915033473, "loss": 0.0038, "step": 13929 }, { "epoch": 2.84, "learning_rate": 0.00012054278337001027, "loss": 0.0099, "step": 13930 }, { "epoch": 2.84, "learning_rate": 0.00012052377572866443, "loss": 0.0092, "step": 13931 }, { "epoch": 2.84, "learning_rate": 0.00012050476857962708, "loss": 0.0048, "step": 13932 }, { "epoch": 2.84, "learning_rate": 0.00012048576192321584, "loss": 0.0071, "step": 13933 }, { "epoch": 2.84, "learning_rate": 0.0001204667557597481, "loss": 0.0087, "step": 13934 }, { "epoch": 2.84, "learning_rate": 0.00012044775008954123, "loss": 0.0145, "step": 13935 }, { "epoch": 2.84, "learning_rate": 0.00012042874491291276, "loss": 0.0392, "step": 13936 }, { "epoch": 2.84, "learning_rate": 0.00012040974023018001, "loss": 0.0093, "step": 13937 }, { "epoch": 2.84, "learning_rate": 0.00012039073604166054, "loss": 0.009, "step": 13938 }, { "epoch": 2.84, "learning_rate": 0.0001203717323476716, "loss": 0.005, "step": 13939 }, { "epoch": 2.84, "learning_rate": 0.00012035272914853069, "loss": 0.0127, "step": 13940 }, { "epoch": 2.84, "learning_rate": 0.00012033372644455516, "loss": 0.009, "step": 13941 }, { "epoch": 2.84, "learning_rate": 0.00012031472423606234, "loss": 0.0119, "step": 13942 }, { "epoch": 2.84, "learning_rate": 0.00012029572252336976, "loss": 0.0309, "step": 13943 }, { "epoch": 2.84, "learning_rate": 0.00012027672130679466, "loss": 0.0077, "step": 13944 }, { "epoch": 2.84, "learning_rate": 0.00012025772058665436, "loss": 0.006, "step": 13945 }, { "epoch": 2.84, "learning_rate": 0.00012023872036326635, "loss": 0.0215, "step": 13946 }, { "epoch": 2.84, "learning_rate": 0.00012021972063694782, "loss": 0.0049, "step": 13947 }, { "epoch": 2.84, "learning_rate": 0.00012020072140801622, "loss": 0.0379, "step": 13948 }, { "epoch": 2.84, "learning_rate": 0.00012018172267678879, "loss": 0.0089, "step": 13949 }, { "epoch": 2.84, "learning_rate": 0.00012016272444358289, "loss": 0.0072, "step": 13950 }, { "epoch": 2.84, "learning_rate": 0.0001201437267087158, "loss": 0.0091, "step": 13951 }, { "epoch": 2.84, "learning_rate": 0.00012012472947250484, "loss": 0.0014, "step": 13952 }, { "epoch": 2.84, "learning_rate": 0.00012010573273526728, "loss": 0.0029, "step": 13953 }, { "epoch": 2.84, "learning_rate": 0.00012008673649732046, "loss": 0.0053, "step": 13954 }, { "epoch": 2.84, "learning_rate": 0.00012006774075898154, "loss": 0.016, "step": 13955 }, { "epoch": 2.84, "learning_rate": 0.0001200487455205679, "loss": 0.0006, "step": 13956 }, { "epoch": 2.84, "learning_rate": 0.0001200297507823967, "loss": 0.0098, "step": 13957 }, { "epoch": 2.84, "learning_rate": 0.0001200107565447853, "loss": 0.0048, "step": 13958 }, { "epoch": 2.84, "learning_rate": 0.00011999176280805087, "loss": 0.0146, "step": 13959 }, { "epoch": 2.84, "learning_rate": 0.00011997276957251056, "loss": 0.0069, "step": 13960 }, { "epoch": 2.84, "learning_rate": 0.00011995377683848173, "loss": 0.0113, "step": 13961 }, { "epoch": 2.84, "learning_rate": 0.00011993478460628158, "loss": 0.0017, "step": 13962 }, { "epoch": 2.84, "learning_rate": 0.00011991579287622722, "loss": 0.0088, "step": 13963 }, { "epoch": 2.84, "learning_rate": 0.00011989680164863596, "loss": 0.0069, "step": 13964 }, { "epoch": 2.84, "learning_rate": 0.00011987781092382487, "loss": 0.005, "step": 13965 }, { "epoch": 2.84, "learning_rate": 0.00011985882070211127, "loss": 0.0056, "step": 13966 }, { "epoch": 2.84, "learning_rate": 0.00011983983098381224, "loss": 0.0061, "step": 13967 }, { "epoch": 2.84, "learning_rate": 0.00011982084176924493, "loss": 0.0065, "step": 13968 }, { "epoch": 2.84, "learning_rate": 0.00011980185305872656, "loss": 0.0104, "step": 13969 }, { "epoch": 2.84, "learning_rate": 0.00011978286485257421, "loss": 0.0088, "step": 13970 }, { "epoch": 2.84, "learning_rate": 0.00011976387715110511, "loss": 0.0062, "step": 13971 }, { "epoch": 2.84, "learning_rate": 0.00011974488995463631, "loss": 0.0109, "step": 13972 }, { "epoch": 2.85, "learning_rate": 0.0001197259032634849, "loss": 0.0057, "step": 13973 }, { "epoch": 2.85, "learning_rate": 0.00011970691707796815, "loss": 0.012, "step": 13974 }, { "epoch": 2.85, "learning_rate": 0.00011968793139840298, "loss": 0.0081, "step": 13975 }, { "epoch": 2.85, "learning_rate": 0.00011966894622510666, "loss": 0.0039, "step": 13976 }, { "epoch": 2.85, "learning_rate": 0.00011964996155839617, "loss": 0.0059, "step": 13977 }, { "epoch": 2.85, "learning_rate": 0.00011963097739858857, "loss": 0.0078, "step": 13978 }, { "epoch": 2.85, "learning_rate": 0.00011961199374600102, "loss": 0.0126, "step": 13979 }, { "epoch": 2.85, "learning_rate": 0.00011959301060095047, "loss": 0.0012, "step": 13980 }, { "epoch": 2.85, "learning_rate": 0.00011957402796375412, "loss": 0.0038, "step": 13981 }, { "epoch": 2.85, "learning_rate": 0.00011955504583472889, "loss": 0.003, "step": 13982 }, { "epoch": 2.85, "learning_rate": 0.00011953606421419184, "loss": 0.0085, "step": 13983 }, { "epoch": 2.85, "learning_rate": 0.00011951708310246008, "loss": 0.0216, "step": 13984 }, { "epoch": 2.85, "learning_rate": 0.00011949810249985057, "loss": 0.0052, "step": 13985 }, { "epoch": 2.85, "learning_rate": 0.00011947912240668028, "loss": 0.0119, "step": 13986 }, { "epoch": 2.85, "learning_rate": 0.00011946014282326629, "loss": 0.02, "step": 13987 }, { "epoch": 2.85, "learning_rate": 0.00011944116374992552, "loss": 0.0057, "step": 13988 }, { "epoch": 2.85, "learning_rate": 0.00011942218518697506, "loss": 0.0008, "step": 13989 }, { "epoch": 2.85, "learning_rate": 0.00011940320713473178, "loss": 0.0012, "step": 13990 }, { "epoch": 2.85, "learning_rate": 0.00011938422959351272, "loss": 0.0084, "step": 13991 }, { "epoch": 2.85, "learning_rate": 0.00011936525256363481, "loss": 0.0031, "step": 13992 }, { "epoch": 2.85, "learning_rate": 0.00011934627604541501, "loss": 0.0161, "step": 13993 }, { "epoch": 2.85, "learning_rate": 0.00011932730003917026, "loss": 0.0088, "step": 13994 }, { "epoch": 2.85, "learning_rate": 0.00011930832454521753, "loss": 0.0142, "step": 13995 }, { "epoch": 2.85, "learning_rate": 0.00011928934956387365, "loss": 0.0032, "step": 13996 }, { "epoch": 2.85, "learning_rate": 0.00011927037509545567, "loss": 0.0183, "step": 13997 }, { "epoch": 2.85, "learning_rate": 0.00011925140114028038, "loss": 0.0046, "step": 13998 }, { "epoch": 2.85, "learning_rate": 0.00011923242769866477, "loss": 0.0184, "step": 13999 }, { "epoch": 2.85, "learning_rate": 0.00011921345477092572, "loss": 0.007, "step": 14000 }, { "epoch": 2.85, "learning_rate": 0.00011919448235738, "loss": 0.0019, "step": 14001 }, { "epoch": 2.85, "learning_rate": 0.00011917551045834463, "loss": 0.016, "step": 14002 }, { "epoch": 2.85, "learning_rate": 0.00011915653907413641, "loss": 0.0114, "step": 14003 }, { "epoch": 2.85, "learning_rate": 0.0001191375682050722, "loss": 0.0118, "step": 14004 }, { "epoch": 2.85, "learning_rate": 0.00011911859785146891, "loss": 0.0119, "step": 14005 }, { "epoch": 2.85, "learning_rate": 0.00011909962801364324, "loss": 0.0073, "step": 14006 }, { "epoch": 2.85, "learning_rate": 0.00011908065869191219, "loss": 0.0014, "step": 14007 }, { "epoch": 2.85, "learning_rate": 0.0001190616898865925, "loss": 0.0073, "step": 14008 }, { "epoch": 2.85, "learning_rate": 0.00011904272159800093, "loss": 0.0053, "step": 14009 }, { "epoch": 2.85, "learning_rate": 0.00011902375382645441, "loss": 0.0084, "step": 14010 }, { "epoch": 2.85, "learning_rate": 0.00011900478657226961, "loss": 0.0038, "step": 14011 }, { "epoch": 2.85, "learning_rate": 0.00011898581983576345, "loss": 0.0158, "step": 14012 }, { "epoch": 2.85, "learning_rate": 0.0001189668536172526, "loss": 0.0017, "step": 14013 }, { "epoch": 2.85, "learning_rate": 0.00011894788791705385, "loss": 0.0101, "step": 14014 }, { "epoch": 2.85, "learning_rate": 0.00011892892273548403, "loss": 0.0273, "step": 14015 }, { "epoch": 2.85, "learning_rate": 0.00011890995807285981, "loss": 0.0065, "step": 14016 }, { "epoch": 2.85, "learning_rate": 0.00011889099392949804, "loss": 0.0024, "step": 14017 }, { "epoch": 2.85, "learning_rate": 0.00011887203030571539, "loss": 0.0073, "step": 14018 }, { "epoch": 2.85, "learning_rate": 0.00011885306720182852, "loss": 0.0082, "step": 14019 }, { "epoch": 2.85, "learning_rate": 0.00011883410461815429, "loss": 0.0052, "step": 14020 }, { "epoch": 2.85, "learning_rate": 0.00011881514255500928, "loss": 0.0058, "step": 14021 }, { "epoch": 2.86, "learning_rate": 0.00011879618101271032, "loss": 0.0134, "step": 14022 }, { "epoch": 2.86, "learning_rate": 0.00011877721999157401, "loss": 0.0095, "step": 14023 }, { "epoch": 2.86, "learning_rate": 0.00011875825949191704, "loss": 0.0064, "step": 14024 }, { "epoch": 2.86, "learning_rate": 0.00011873929951405614, "loss": 0.0054, "step": 14025 }, { "epoch": 2.86, "learning_rate": 0.0001187203400583079, "loss": 0.0025, "step": 14026 }, { "epoch": 2.86, "learning_rate": 0.00011870138112498909, "loss": 0.0034, "step": 14027 }, { "epoch": 2.86, "learning_rate": 0.00011868242271441629, "loss": 0.0085, "step": 14028 }, { "epoch": 2.86, "learning_rate": 0.00011866346482690609, "loss": 0.0115, "step": 14029 }, { "epoch": 2.86, "learning_rate": 0.00011864450746277526, "loss": 0.0036, "step": 14030 }, { "epoch": 2.86, "learning_rate": 0.00011862555062234025, "loss": 0.0098, "step": 14031 }, { "epoch": 2.86, "learning_rate": 0.00011860659430591786, "loss": 0.0068, "step": 14032 }, { "epoch": 2.86, "learning_rate": 0.00011858763851382454, "loss": 0.0122, "step": 14033 }, { "epoch": 2.86, "learning_rate": 0.00011856868324637698, "loss": 0.0108, "step": 14034 }, { "epoch": 2.86, "learning_rate": 0.00011854972850389173, "loss": 0.0218, "step": 14035 }, { "epoch": 2.86, "learning_rate": 0.0001185307742866854, "loss": 0.0164, "step": 14036 }, { "epoch": 2.86, "learning_rate": 0.0001185118205950745, "loss": 0.0112, "step": 14037 }, { "epoch": 2.86, "learning_rate": 0.00011849286742937569, "loss": 0.0058, "step": 14038 }, { "epoch": 2.86, "learning_rate": 0.0001184739147899054, "loss": 0.0126, "step": 14039 }, { "epoch": 2.86, "learning_rate": 0.00011845496267698032, "loss": 0.0129, "step": 14040 }, { "epoch": 2.86, "learning_rate": 0.00011843601109091688, "loss": 0.003, "step": 14041 }, { "epoch": 2.86, "learning_rate": 0.0001184170600320316, "loss": 0.0076, "step": 14042 }, { "epoch": 2.86, "learning_rate": 0.00011839810950064109, "loss": 0.0214, "step": 14043 }, { "epoch": 2.86, "learning_rate": 0.00011837915949706173, "loss": 0.0111, "step": 14044 }, { "epoch": 2.86, "learning_rate": 0.00011836021002161013, "loss": 0.0089, "step": 14045 }, { "epoch": 2.86, "learning_rate": 0.00011834126107460278, "loss": 0.0025, "step": 14046 }, { "epoch": 2.86, "learning_rate": 0.00011832231265635607, "loss": 0.0097, "step": 14047 }, { "epoch": 2.86, "learning_rate": 0.00011830336476718661, "loss": 0.0104, "step": 14048 }, { "epoch": 2.86, "learning_rate": 0.00011828441740741071, "loss": 0.0233, "step": 14049 }, { "epoch": 2.86, "learning_rate": 0.00011826547057734497, "loss": 0.014, "step": 14050 }, { "epoch": 2.86, "learning_rate": 0.00011824652427730578, "loss": 0.0173, "step": 14051 }, { "epoch": 2.86, "learning_rate": 0.00011822757850760952, "loss": 0.0221, "step": 14052 }, { "epoch": 2.86, "learning_rate": 0.00011820863326857273, "loss": 0.002, "step": 14053 }, { "epoch": 2.86, "learning_rate": 0.0001181896885605117, "loss": 0.0177, "step": 14054 }, { "epoch": 2.86, "learning_rate": 0.00011817074438374296, "loss": 0.0059, "step": 14055 }, { "epoch": 2.86, "learning_rate": 0.0001181518007385829, "loss": 0.0037, "step": 14056 }, { "epoch": 2.86, "learning_rate": 0.00011813285762534783, "loss": 0.0142, "step": 14057 }, { "epoch": 2.86, "learning_rate": 0.00011811391504435422, "loss": 0.0089, "step": 14058 }, { "epoch": 2.86, "learning_rate": 0.00011809497299591847, "loss": 0.0093, "step": 14059 }, { "epoch": 2.86, "learning_rate": 0.0001180760314803568, "loss": 0.0117, "step": 14060 }, { "epoch": 2.86, "learning_rate": 0.00011805709049798573, "loss": 0.0017, "step": 14061 }, { "epoch": 2.86, "learning_rate": 0.0001180381500491215, "loss": 0.0036, "step": 14062 }, { "epoch": 2.86, "learning_rate": 0.00011801921013408054, "loss": 0.0058, "step": 14063 }, { "epoch": 2.86, "learning_rate": 0.00011800027075317911, "loss": 0.0196, "step": 14064 }, { "epoch": 2.86, "learning_rate": 0.00011798133190673355, "loss": 0.0038, "step": 14065 }, { "epoch": 2.86, "learning_rate": 0.00011796239359506021, "loss": 0.0016, "step": 14066 }, { "epoch": 2.86, "learning_rate": 0.00011794345581847534, "loss": 0.0072, "step": 14067 }, { "epoch": 2.86, "learning_rate": 0.00011792451857729533, "loss": 0.0016, "step": 14068 }, { "epoch": 2.86, "learning_rate": 0.0001179055818718364, "loss": 0.0022, "step": 14069 }, { "epoch": 2.86, "learning_rate": 0.00011788664570241477, "loss": 0.0062, "step": 14070 }, { "epoch": 2.87, "learning_rate": 0.00011786771006934686, "loss": 0.0109, "step": 14071 }, { "epoch": 2.87, "learning_rate": 0.00011784877497294876, "loss": 0.0133, "step": 14072 }, { "epoch": 2.87, "learning_rate": 0.00011782984041353686, "loss": 0.0093, "step": 14073 }, { "epoch": 2.87, "learning_rate": 0.00011781090639142734, "loss": 0.005, "step": 14074 }, { "epoch": 2.87, "learning_rate": 0.00011779197290693645, "loss": 0.0143, "step": 14075 }, { "epoch": 2.87, "learning_rate": 0.00011777303996038038, "loss": 0.0111, "step": 14076 }, { "epoch": 2.87, "learning_rate": 0.0001177541075520754, "loss": 0.0213, "step": 14077 }, { "epoch": 2.87, "learning_rate": 0.00011773517568233769, "loss": 0.0102, "step": 14078 }, { "epoch": 2.87, "learning_rate": 0.00011771624435148347, "loss": 0.006, "step": 14079 }, { "epoch": 2.87, "learning_rate": 0.00011769731355982887, "loss": 0.0143, "step": 14080 }, { "epoch": 2.87, "learning_rate": 0.00011767838330769015, "loss": 0.0036, "step": 14081 }, { "epoch": 2.87, "learning_rate": 0.00011765945359538339, "loss": 0.0077, "step": 14082 }, { "epoch": 2.87, "learning_rate": 0.00011764052442322485, "loss": 0.0045, "step": 14083 }, { "epoch": 2.87, "learning_rate": 0.00011762159579153064, "loss": 0.0223, "step": 14084 }, { "epoch": 2.87, "learning_rate": 0.00011760266770061683, "loss": 0.0083, "step": 14085 }, { "epoch": 2.87, "learning_rate": 0.00011758374015079969, "loss": 0.0104, "step": 14086 }, { "epoch": 2.87, "learning_rate": 0.00011756481314239527, "loss": 0.0086, "step": 14087 }, { "epoch": 2.87, "learning_rate": 0.00011754588667571965, "loss": 0.009, "step": 14088 }, { "epoch": 2.87, "learning_rate": 0.00011752696075108905, "loss": 0.006, "step": 14089 }, { "epoch": 2.87, "learning_rate": 0.00011750803536881943, "loss": 0.004, "step": 14090 }, { "epoch": 2.87, "learning_rate": 0.00011748911052922702, "loss": 0.0047, "step": 14091 }, { "epoch": 2.87, "learning_rate": 0.00011747018623262784, "loss": 0.0089, "step": 14092 }, { "epoch": 2.87, "learning_rate": 0.00011745126247933788, "loss": 0.0022, "step": 14093 }, { "epoch": 2.87, "learning_rate": 0.00011743233926967335, "loss": 0.024, "step": 14094 }, { "epoch": 2.87, "learning_rate": 0.00011741341660395016, "loss": 0.0044, "step": 14095 }, { "epoch": 2.87, "learning_rate": 0.00011739449448248448, "loss": 0.0012, "step": 14096 }, { "epoch": 2.87, "learning_rate": 0.00011737557290559229, "loss": 0.0037, "step": 14097 }, { "epoch": 2.87, "learning_rate": 0.00011735665187358955, "loss": 0.0237, "step": 14098 }, { "epoch": 2.87, "learning_rate": 0.00011733773138679242, "loss": 0.0175, "step": 14099 }, { "epoch": 2.87, "learning_rate": 0.00011731881144551675, "loss": 0.0131, "step": 14100 }, { "epoch": 2.87, "learning_rate": 0.0001172998920500787, "loss": 0.0042, "step": 14101 }, { "epoch": 2.87, "learning_rate": 0.00011728097320079418, "loss": 0.0074, "step": 14102 }, { "epoch": 2.87, "learning_rate": 0.00011726205489797911, "loss": 0.0053, "step": 14103 }, { "epoch": 2.87, "learning_rate": 0.00011724313714194957, "loss": 0.0034, "step": 14104 }, { "epoch": 2.87, "learning_rate": 0.00011722421993302141, "loss": 0.0039, "step": 14105 }, { "epoch": 2.87, "learning_rate": 0.00011720530327151071, "loss": 0.0041, "step": 14106 }, { "epoch": 2.87, "learning_rate": 0.00011718638715773332, "loss": 0.0072, "step": 14107 }, { "epoch": 2.87, "learning_rate": 0.00011716747159200516, "loss": 0.0075, "step": 14108 }, { "epoch": 2.87, "learning_rate": 0.00011714855657464229, "loss": 0.0172, "step": 14109 }, { "epoch": 2.87, "learning_rate": 0.00011712964210596052, "loss": 0.0036, "step": 14110 }, { "epoch": 2.87, "learning_rate": 0.0001171107281862757, "loss": 0.008, "step": 14111 }, { "epoch": 2.87, "learning_rate": 0.00011709181481590388, "loss": 0.0041, "step": 14112 }, { "epoch": 2.87, "learning_rate": 0.00011707290199516083, "loss": 0.0064, "step": 14113 }, { "epoch": 2.87, "learning_rate": 0.0001170539897243625, "loss": 0.0028, "step": 14114 }, { "epoch": 2.87, "learning_rate": 0.00011703507800382472, "loss": 0.0045, "step": 14115 }, { "epoch": 2.87, "learning_rate": 0.00011701616683386335, "loss": 0.0069, "step": 14116 }, { "epoch": 2.87, "learning_rate": 0.00011699725621479426, "loss": 0.006, "step": 14117 }, { "epoch": 2.87, "learning_rate": 0.0001169783461469333, "loss": 0.0144, "step": 14118 }, { "epoch": 2.87, "learning_rate": 0.00011695943663059627, "loss": 0.0071, "step": 14119 }, { "epoch": 2.88, "learning_rate": 0.00011694052766609906, "loss": 0.005, "step": 14120 }, { "epoch": 2.88, "learning_rate": 0.00011692161925375738, "loss": 0.0101, "step": 14121 }, { "epoch": 2.88, "learning_rate": 0.00011690271139388714, "loss": 0.0048, "step": 14122 }, { "epoch": 2.88, "learning_rate": 0.00011688380408680407, "loss": 0.0161, "step": 14123 }, { "epoch": 2.88, "learning_rate": 0.00011686489733282404, "loss": 0.008, "step": 14124 }, { "epoch": 2.88, "learning_rate": 0.00011684599113226274, "loss": 0.0062, "step": 14125 }, { "epoch": 2.88, "learning_rate": 0.00011682708548543592, "loss": 0.0074, "step": 14126 }, { "epoch": 2.88, "learning_rate": 0.00011680818039265944, "loss": 0.0072, "step": 14127 }, { "epoch": 2.88, "learning_rate": 0.00011678927585424899, "loss": 0.0132, "step": 14128 }, { "epoch": 2.88, "learning_rate": 0.00011677037187052033, "loss": 0.0319, "step": 14129 }, { "epoch": 2.88, "learning_rate": 0.0001167514684417892, "loss": 0.0171, "step": 14130 }, { "epoch": 2.88, "learning_rate": 0.00011673256556837125, "loss": 0.0222, "step": 14131 }, { "epoch": 2.88, "learning_rate": 0.00011671366325058234, "loss": 0.0178, "step": 14132 }, { "epoch": 2.88, "learning_rate": 0.00011669476148873805, "loss": 0.006, "step": 14133 }, { "epoch": 2.88, "learning_rate": 0.00011667586028315407, "loss": 0.0049, "step": 14134 }, { "epoch": 2.88, "learning_rate": 0.00011665695963414618, "loss": 0.0079, "step": 14135 }, { "epoch": 2.88, "learning_rate": 0.00011663805954202995, "loss": 0.0284, "step": 14136 }, { "epoch": 2.88, "learning_rate": 0.00011661916000712115, "loss": 0.0101, "step": 14137 }, { "epoch": 2.88, "learning_rate": 0.00011660026102973536, "loss": 0.008, "step": 14138 }, { "epoch": 2.88, "learning_rate": 0.00011658136261018824, "loss": 0.0037, "step": 14139 }, { "epoch": 2.88, "learning_rate": 0.0001165624647487955, "loss": 0.0061, "step": 14140 }, { "epoch": 2.88, "learning_rate": 0.00011654356744587265, "loss": 0.0057, "step": 14141 }, { "epoch": 2.88, "learning_rate": 0.00011652467070173545, "loss": 0.0131, "step": 14142 }, { "epoch": 2.88, "learning_rate": 0.00011650577451669944, "loss": 0.0041, "step": 14143 }, { "epoch": 2.88, "learning_rate": 0.00011648687889108014, "loss": 0.0025, "step": 14144 }, { "epoch": 2.88, "learning_rate": 0.00011646798382519332, "loss": 0.0044, "step": 14145 }, { "epoch": 2.88, "learning_rate": 0.00011644908931935436, "loss": 0.004, "step": 14146 }, { "epoch": 2.88, "learning_rate": 0.00011643019537387903, "loss": 0.009, "step": 14147 }, { "epoch": 2.88, "learning_rate": 0.00011641130198908277, "loss": 0.007, "step": 14148 }, { "epoch": 2.88, "learning_rate": 0.00011639240916528116, "loss": 0.0099, "step": 14149 }, { "epoch": 2.88, "learning_rate": 0.00011637351690278976, "loss": 0.0021, "step": 14150 }, { "epoch": 2.88, "learning_rate": 0.00011635462520192408, "loss": 0.0167, "step": 14151 }, { "epoch": 2.88, "learning_rate": 0.00011633573406299972, "loss": 0.0021, "step": 14152 }, { "epoch": 2.88, "learning_rate": 0.00011631684348633216, "loss": 0.0169, "step": 14153 }, { "epoch": 2.88, "learning_rate": 0.00011629795347223682, "loss": 0.0015, "step": 14154 }, { "epoch": 2.88, "learning_rate": 0.00011627906402102934, "loss": 0.0117, "step": 14155 }, { "epoch": 2.88, "learning_rate": 0.00011626017513302507, "loss": 0.0137, "step": 14156 }, { "epoch": 2.88, "learning_rate": 0.00011624128680853963, "loss": 0.0093, "step": 14157 }, { "epoch": 2.88, "learning_rate": 0.00011622239904788843, "loss": 0.0032, "step": 14158 }, { "epoch": 2.88, "learning_rate": 0.00011620351185138688, "loss": 0.0094, "step": 14159 }, { "epoch": 2.88, "learning_rate": 0.0001161846252193505, "loss": 0.0116, "step": 14160 }, { "epoch": 2.88, "learning_rate": 0.00011616573915209474, "loss": 0.0041, "step": 14161 }, { "epoch": 2.88, "learning_rate": 0.00011614685364993493, "loss": 0.0013, "step": 14162 }, { "epoch": 2.88, "learning_rate": 0.00011612796871318663, "loss": 0.0153, "step": 14163 }, { "epoch": 2.88, "learning_rate": 0.00011610908434216514, "loss": 0.0089, "step": 14164 }, { "epoch": 2.88, "learning_rate": 0.00011609020053718597, "loss": 0.0085, "step": 14165 }, { "epoch": 2.88, "learning_rate": 0.00011607131729856446, "loss": 0.0024, "step": 14166 }, { "epoch": 2.88, "learning_rate": 0.00011605243462661594, "loss": 0.0021, "step": 14167 }, { "epoch": 2.88, "learning_rate": 0.00011603355252165586, "loss": 0.0187, "step": 14168 }, { "epoch": 2.89, "learning_rate": 0.00011601467098399958, "loss": 0.0058, "step": 14169 }, { "epoch": 2.89, "learning_rate": 0.00011599579001396245, "loss": 0.0215, "step": 14170 }, { "epoch": 2.89, "learning_rate": 0.00011597690961185984, "loss": 0.0064, "step": 14171 }, { "epoch": 2.89, "learning_rate": 0.000115958029778007, "loss": 0.0022, "step": 14172 }, { "epoch": 2.89, "learning_rate": 0.00011593915051271937, "loss": 0.0087, "step": 14173 }, { "epoch": 2.89, "learning_rate": 0.00011592027181631218, "loss": 0.0011, "step": 14174 }, { "epoch": 2.89, "learning_rate": 0.00011590139368910084, "loss": 0.0029, "step": 14175 }, { "epoch": 2.89, "learning_rate": 0.00011588251613140058, "loss": 0.0164, "step": 14176 }, { "epoch": 2.89, "learning_rate": 0.00011586363914352665, "loss": 0.0046, "step": 14177 }, { "epoch": 2.89, "learning_rate": 0.00011584476272579444, "loss": 0.0064, "step": 14178 }, { "epoch": 2.89, "learning_rate": 0.0001158258868785191, "loss": 0.0015, "step": 14179 }, { "epoch": 2.89, "learning_rate": 0.00011580701160201599, "loss": 0.0097, "step": 14180 }, { "epoch": 2.89, "learning_rate": 0.00011578813689660038, "loss": 0.0065, "step": 14181 }, { "epoch": 2.89, "learning_rate": 0.00011576926276258736, "loss": 0.0095, "step": 14182 }, { "epoch": 2.89, "learning_rate": 0.00011575038920029236, "loss": 0.0175, "step": 14183 }, { "epoch": 2.89, "learning_rate": 0.0001157315162100305, "loss": 0.0049, "step": 14184 }, { "epoch": 2.89, "learning_rate": 0.00011571264379211695, "loss": 0.0115, "step": 14185 }, { "epoch": 2.89, "learning_rate": 0.00011569377194686704, "loss": 0.0004, "step": 14186 }, { "epoch": 2.89, "learning_rate": 0.00011567490067459582, "loss": 0.0025, "step": 14187 }, { "epoch": 2.89, "learning_rate": 0.00011565602997561862, "loss": 0.0071, "step": 14188 }, { "epoch": 2.89, "learning_rate": 0.00011563715985025051, "loss": 0.0098, "step": 14189 }, { "epoch": 2.89, "learning_rate": 0.00011561829029880671, "loss": 0.0033, "step": 14190 }, { "epoch": 2.89, "learning_rate": 0.00011559942132160235, "loss": 0.002, "step": 14191 }, { "epoch": 2.89, "learning_rate": 0.00011558055291895255, "loss": 0.01, "step": 14192 }, { "epoch": 2.89, "learning_rate": 0.00011556168509117257, "loss": 0.0038, "step": 14193 }, { "epoch": 2.89, "learning_rate": 0.00011554281783857745, "loss": 0.0075, "step": 14194 }, { "epoch": 2.89, "learning_rate": 0.00011552395116148226, "loss": 0.0059, "step": 14195 }, { "epoch": 2.89, "learning_rate": 0.00011550508506020221, "loss": 0.0092, "step": 14196 }, { "epoch": 2.89, "learning_rate": 0.00011548621953505229, "loss": 0.0009, "step": 14197 }, { "epoch": 2.89, "learning_rate": 0.00011546735458634772, "loss": 0.0132, "step": 14198 }, { "epoch": 2.89, "learning_rate": 0.00011544849021440349, "loss": 0.0038, "step": 14199 }, { "epoch": 2.89, "learning_rate": 0.00011542962641953469, "loss": 0.0065, "step": 14200 }, { "epoch": 2.89, "learning_rate": 0.00011541076320205637, "loss": 0.0083, "step": 14201 }, { "epoch": 2.89, "learning_rate": 0.00011539190056228362, "loss": 0.0147, "step": 14202 }, { "epoch": 2.89, "learning_rate": 0.00011537303850053144, "loss": 0.0114, "step": 14203 }, { "epoch": 2.89, "learning_rate": 0.00011535417701711494, "loss": 0.0026, "step": 14204 }, { "epoch": 2.89, "learning_rate": 0.00011533531611234898, "loss": 0.0024, "step": 14205 }, { "epoch": 2.89, "learning_rate": 0.00011531645578654875, "loss": 0.0047, "step": 14206 }, { "epoch": 2.89, "learning_rate": 0.0001152975960400292, "loss": 0.0022, "step": 14207 }, { "epoch": 2.89, "learning_rate": 0.00011527873687310522, "loss": 0.0098, "step": 14208 }, { "epoch": 2.89, "learning_rate": 0.00011525987828609193, "loss": 0.0023, "step": 14209 }, { "epoch": 2.89, "learning_rate": 0.00011524102027930421, "loss": 0.0006, "step": 14210 }, { "epoch": 2.89, "learning_rate": 0.00011522216285305708, "loss": 0.0027, "step": 14211 }, { "epoch": 2.89, "learning_rate": 0.00011520330600766552, "loss": 0.009, "step": 14212 }, { "epoch": 2.89, "learning_rate": 0.00011518444974344435, "loss": 0.0061, "step": 14213 }, { "epoch": 2.89, "learning_rate": 0.00011516559406070866, "loss": 0.0092, "step": 14214 }, { "epoch": 2.89, "learning_rate": 0.00011514673895977327, "loss": 0.0234, "step": 14215 }, { "epoch": 2.89, "learning_rate": 0.00011512788444095316, "loss": 0.0031, "step": 14216 }, { "epoch": 2.89, "learning_rate": 0.0001151090305045632, "loss": 0.0037, "step": 14217 }, { "epoch": 2.9, "learning_rate": 0.00011509017715091824, "loss": 0.0066, "step": 14218 }, { "epoch": 2.9, "learning_rate": 0.00011507132438033329, "loss": 0.0156, "step": 14219 }, { "epoch": 2.9, "learning_rate": 0.00011505247219312309, "loss": 0.0013, "step": 14220 }, { "epoch": 2.9, "learning_rate": 0.00011503362058960261, "loss": 0.0085, "step": 14221 }, { "epoch": 2.9, "learning_rate": 0.00011501476957008667, "loss": 0.0147, "step": 14222 }, { "epoch": 2.9, "learning_rate": 0.00011499591913489008, "loss": 0.0035, "step": 14223 }, { "epoch": 2.9, "learning_rate": 0.00011497706928432777, "loss": 0.0107, "step": 14224 }, { "epoch": 2.9, "learning_rate": 0.00011495822001871448, "loss": 0.0064, "step": 14225 }, { "epoch": 2.9, "learning_rate": 0.00011493937133836509, "loss": 0.0212, "step": 14226 }, { "epoch": 2.9, "learning_rate": 0.00011492052324359437, "loss": 0.003, "step": 14227 }, { "epoch": 2.9, "learning_rate": 0.0001149016757347171, "loss": 0.0141, "step": 14228 }, { "epoch": 2.9, "learning_rate": 0.00011488282881204816, "loss": 0.0072, "step": 14229 }, { "epoch": 2.9, "learning_rate": 0.00011486398247590219, "loss": 0.013, "step": 14230 }, { "epoch": 2.9, "learning_rate": 0.00011484513672659409, "loss": 0.0029, "step": 14231 }, { "epoch": 2.9, "learning_rate": 0.00011482629156443856, "loss": 0.0051, "step": 14232 }, { "epoch": 2.9, "learning_rate": 0.0001148074469897503, "loss": 0.0204, "step": 14233 }, { "epoch": 2.9, "learning_rate": 0.00011478860300284418, "loss": 0.0076, "step": 14234 }, { "epoch": 2.9, "learning_rate": 0.00011476975960403484, "loss": 0.0101, "step": 14235 }, { "epoch": 2.9, "learning_rate": 0.00011475091679363698, "loss": 0.0088, "step": 14236 }, { "epoch": 2.9, "learning_rate": 0.0001147320745719654, "loss": 0.0062, "step": 14237 }, { "epoch": 2.9, "learning_rate": 0.00011471323293933468, "loss": 0.01, "step": 14238 }, { "epoch": 2.9, "learning_rate": 0.00011469439189605964, "loss": 0.0123, "step": 14239 }, { "epoch": 2.9, "learning_rate": 0.00011467555144245486, "loss": 0.0061, "step": 14240 }, { "epoch": 2.9, "learning_rate": 0.00011465671157883508, "loss": 0.0201, "step": 14241 }, { "epoch": 2.9, "learning_rate": 0.00011463787230551491, "loss": 0.0066, "step": 14242 }, { "epoch": 2.9, "learning_rate": 0.00011461903362280903, "loss": 0.004, "step": 14243 }, { "epoch": 2.9, "learning_rate": 0.00011460019553103206, "loss": 0.0091, "step": 14244 }, { "epoch": 2.9, "learning_rate": 0.0001145813580304987, "loss": 0.0033, "step": 14245 }, { "epoch": 2.9, "learning_rate": 0.00011456252112152345, "loss": 0.029, "step": 14246 }, { "epoch": 2.9, "learning_rate": 0.00011454368480442103, "loss": 0.0043, "step": 14247 }, { "epoch": 2.9, "learning_rate": 0.00011452484907950597, "loss": 0.0139, "step": 14248 }, { "epoch": 2.9, "learning_rate": 0.00011450601394709294, "loss": 0.011, "step": 14249 }, { "epoch": 2.9, "learning_rate": 0.0001144871794074965, "loss": 0.0205, "step": 14250 }, { "epoch": 2.9, "learning_rate": 0.00011446834546103111, "loss": 0.0134, "step": 14251 }, { "epoch": 2.9, "learning_rate": 0.00011444951210801146, "loss": 0.0079, "step": 14252 }, { "epoch": 2.9, "learning_rate": 0.00011443067934875206, "loss": 0.0044, "step": 14253 }, { "epoch": 2.9, "learning_rate": 0.00011441184718356747, "loss": 0.0048, "step": 14254 }, { "epoch": 2.9, "learning_rate": 0.00011439301561277222, "loss": 0.0051, "step": 14255 }, { "epoch": 2.9, "learning_rate": 0.00011437418463668078, "loss": 0.0057, "step": 14256 }, { "epoch": 2.9, "learning_rate": 0.00011435535425560777, "loss": 0.0083, "step": 14257 }, { "epoch": 2.9, "learning_rate": 0.00011433652446986761, "loss": 0.0108, "step": 14258 }, { "epoch": 2.9, "learning_rate": 0.00011431769527977476, "loss": 0.0078, "step": 14259 }, { "epoch": 2.9, "learning_rate": 0.00011429886668564382, "loss": 0.0033, "step": 14260 }, { "epoch": 2.9, "learning_rate": 0.00011428003868778912, "loss": 0.0066, "step": 14261 }, { "epoch": 2.9, "learning_rate": 0.00011426121128652526, "loss": 0.0108, "step": 14262 }, { "epoch": 2.9, "learning_rate": 0.00011424238448216661, "loss": 0.0146, "step": 14263 }, { "epoch": 2.9, "learning_rate": 0.00011422355827502761, "loss": 0.0076, "step": 14264 }, { "epoch": 2.9, "learning_rate": 0.00011420473266542279, "loss": 0.0069, "step": 14265 }, { "epoch": 2.9, "learning_rate": 0.00011418590765366642, "loss": 0.0065, "step": 14266 }, { "epoch": 2.91, "learning_rate": 0.00011416708324007307, "loss": 0.0045, "step": 14267 }, { "epoch": 2.91, "learning_rate": 0.00011414825942495708, "loss": 0.0031, "step": 14268 }, { "epoch": 2.91, "learning_rate": 0.00011412943620863275, "loss": 0.0219, "step": 14269 }, { "epoch": 2.91, "learning_rate": 0.00011411061359141462, "loss": 0.0002, "step": 14270 }, { "epoch": 2.91, "learning_rate": 0.0001140917915736169, "loss": 0.0054, "step": 14271 }, { "epoch": 2.91, "learning_rate": 0.00011407297015555416, "loss": 0.0076, "step": 14272 }, { "epoch": 2.91, "learning_rate": 0.00011405414933754056, "loss": 0.0064, "step": 14273 }, { "epoch": 2.91, "learning_rate": 0.0001140353291198905, "loss": 0.0007, "step": 14274 }, { "epoch": 2.91, "learning_rate": 0.00011401650950291839, "loss": 0.0019, "step": 14275 }, { "epoch": 2.91, "learning_rate": 0.00011399769048693843, "loss": 0.0117, "step": 14276 }, { "epoch": 2.91, "learning_rate": 0.00011397887207226508, "loss": 0.0161, "step": 14277 }, { "epoch": 2.91, "learning_rate": 0.00011396005425921253, "loss": 0.01, "step": 14278 }, { "epoch": 2.91, "learning_rate": 0.00011394123704809507, "loss": 0.0074, "step": 14279 }, { "epoch": 2.91, "learning_rate": 0.00011392242043922706, "loss": 0.0036, "step": 14280 }, { "epoch": 2.91, "learning_rate": 0.00011390360443292275, "loss": 0.0013, "step": 14281 }, { "epoch": 2.91, "learning_rate": 0.0001138847890294963, "loss": 0.0026, "step": 14282 }, { "epoch": 2.91, "learning_rate": 0.00011386597422926209, "loss": 0.015, "step": 14283 }, { "epoch": 2.91, "learning_rate": 0.00011384716003253431, "loss": 0.006, "step": 14284 }, { "epoch": 2.91, "learning_rate": 0.00011382834643962721, "loss": 0.0085, "step": 14285 }, { "epoch": 2.91, "learning_rate": 0.00011380953345085503, "loss": 0.0063, "step": 14286 }, { "epoch": 2.91, "learning_rate": 0.0001137907210665319, "loss": 0.0066, "step": 14287 }, { "epoch": 2.91, "learning_rate": 0.00011377190928697213, "loss": 0.0092, "step": 14288 }, { "epoch": 2.91, "learning_rate": 0.00011375309811248979, "loss": 0.0059, "step": 14289 }, { "epoch": 2.91, "learning_rate": 0.0001137342875433992, "loss": 0.0071, "step": 14290 }, { "epoch": 2.91, "learning_rate": 0.00011371547758001448, "loss": 0.0275, "step": 14291 }, { "epoch": 2.91, "learning_rate": 0.00011369666822264972, "loss": 0.0214, "step": 14292 }, { "epoch": 2.91, "learning_rate": 0.00011367785947161912, "loss": 0.0095, "step": 14293 }, { "epoch": 2.91, "learning_rate": 0.00011365905132723684, "loss": 0.013, "step": 14294 }, { "epoch": 2.91, "learning_rate": 0.00011364024378981703, "loss": 0.0092, "step": 14295 }, { "epoch": 2.91, "learning_rate": 0.0001136214368596738, "loss": 0.0022, "step": 14296 }, { "epoch": 2.91, "learning_rate": 0.00011360263053712119, "loss": 0.0209, "step": 14297 }, { "epoch": 2.91, "learning_rate": 0.0001135838248224734, "loss": 0.0054, "step": 14298 }, { "epoch": 2.91, "learning_rate": 0.00011356501971604442, "loss": 0.0117, "step": 14299 }, { "epoch": 2.91, "learning_rate": 0.00011354621521814845, "loss": 0.003, "step": 14300 }, { "epoch": 2.91, "learning_rate": 0.00011352741132909948, "loss": 0.0057, "step": 14301 }, { "epoch": 2.91, "learning_rate": 0.00011350860804921155, "loss": 0.0054, "step": 14302 }, { "epoch": 2.91, "learning_rate": 0.0001134898053787988, "loss": 0.0053, "step": 14303 }, { "epoch": 2.91, "learning_rate": 0.00011347100331817516, "loss": 0.011, "step": 14304 }, { "epoch": 2.91, "learning_rate": 0.00011345220186765475, "loss": 0.0111, "step": 14305 }, { "epoch": 2.91, "learning_rate": 0.00011343340102755158, "loss": 0.0174, "step": 14306 }, { "epoch": 2.91, "learning_rate": 0.0001134146007981796, "loss": 0.0029, "step": 14307 }, { "epoch": 2.91, "learning_rate": 0.00011339580117985287, "loss": 0.0037, "step": 14308 }, { "epoch": 2.91, "learning_rate": 0.00011337700217288538, "loss": 0.0025, "step": 14309 }, { "epoch": 2.91, "learning_rate": 0.00011335820377759101, "loss": 0.0053, "step": 14310 }, { "epoch": 2.91, "learning_rate": 0.00011333940599428388, "loss": 0.0011, "step": 14311 }, { "epoch": 2.91, "learning_rate": 0.0001133206088232778, "loss": 0.0107, "step": 14312 }, { "epoch": 2.91, "learning_rate": 0.00011330181226488685, "loss": 0.0049, "step": 14313 }, { "epoch": 2.91, "learning_rate": 0.00011328301631942489, "loss": 0.0141, "step": 14314 }, { "epoch": 2.91, "learning_rate": 0.00011326422098720585, "loss": 0.0025, "step": 14315 }, { "epoch": 2.92, "learning_rate": 0.00011324542626854367, "loss": 0.0048, "step": 14316 }, { "epoch": 2.92, "learning_rate": 0.00011322663216375223, "loss": 0.0079, "step": 14317 }, { "epoch": 2.92, "learning_rate": 0.00011320783867314549, "loss": 0.0023, "step": 14318 }, { "epoch": 2.92, "learning_rate": 0.00011318904579703731, "loss": 0.0122, "step": 14319 }, { "epoch": 2.92, "learning_rate": 0.00011317025353574149, "loss": 0.0238, "step": 14320 }, { "epoch": 2.92, "learning_rate": 0.000113151461889572, "loss": 0.005, "step": 14321 }, { "epoch": 2.92, "learning_rate": 0.0001131326708588426, "loss": 0.0028, "step": 14322 }, { "epoch": 2.92, "learning_rate": 0.00011311388044386725, "loss": 0.0127, "step": 14323 }, { "epoch": 2.92, "learning_rate": 0.00011309509064495969, "loss": 0.0119, "step": 14324 }, { "epoch": 2.92, "learning_rate": 0.00011307630146243378, "loss": 0.0121, "step": 14325 }, { "epoch": 2.92, "learning_rate": 0.00011305751289660335, "loss": 0.0132, "step": 14326 }, { "epoch": 2.92, "learning_rate": 0.00011303872494778214, "loss": 0.0036, "step": 14327 }, { "epoch": 2.92, "learning_rate": 0.00011301993761628408, "loss": 0.0042, "step": 14328 }, { "epoch": 2.92, "learning_rate": 0.00011300115090242284, "loss": 0.0061, "step": 14329 }, { "epoch": 2.92, "learning_rate": 0.00011298236480651217, "loss": 0.0106, "step": 14330 }, { "epoch": 2.92, "learning_rate": 0.00011296357932886594, "loss": 0.0017, "step": 14331 }, { "epoch": 2.92, "learning_rate": 0.00011294479446979785, "loss": 0.0002, "step": 14332 }, { "epoch": 2.92, "learning_rate": 0.00011292601022962156, "loss": 0.0142, "step": 14333 }, { "epoch": 2.92, "learning_rate": 0.00011290722660865097, "loss": 0.0206, "step": 14334 }, { "epoch": 2.92, "learning_rate": 0.00011288844360719965, "loss": 0.0024, "step": 14335 }, { "epoch": 2.92, "learning_rate": 0.00011286966122558138, "loss": 0.0236, "step": 14336 }, { "epoch": 2.92, "learning_rate": 0.00011285087946410989, "loss": 0.0169, "step": 14337 }, { "epoch": 2.92, "learning_rate": 0.0001128320983230988, "loss": 0.0221, "step": 14338 }, { "epoch": 2.92, "learning_rate": 0.00011281331780286187, "loss": 0.0048, "step": 14339 }, { "epoch": 2.92, "learning_rate": 0.00011279453790371268, "loss": 0.0125, "step": 14340 }, { "epoch": 2.92, "learning_rate": 0.00011277575862596499, "loss": 0.0063, "step": 14341 }, { "epoch": 2.92, "learning_rate": 0.00011275697996993241, "loss": 0.0113, "step": 14342 }, { "epoch": 2.92, "learning_rate": 0.00011273820193592849, "loss": 0.0038, "step": 14343 }, { "epoch": 2.92, "learning_rate": 0.00011271942452426698, "loss": 0.0024, "step": 14344 }, { "epoch": 2.92, "learning_rate": 0.00011270064773526141, "loss": 0.019, "step": 14345 }, { "epoch": 2.92, "learning_rate": 0.00011268187156922547, "loss": 0.0019, "step": 14346 }, { "epoch": 2.92, "learning_rate": 0.00011266309602647273, "loss": 0.0082, "step": 14347 }, { "epoch": 2.92, "learning_rate": 0.00011264432110731671, "loss": 0.0299, "step": 14348 }, { "epoch": 2.92, "learning_rate": 0.0001126255468120711, "loss": 0.0089, "step": 14349 }, { "epoch": 2.92, "learning_rate": 0.00011260677314104935, "loss": 0.0147, "step": 14350 }, { "epoch": 2.92, "learning_rate": 0.00011258800009456514, "loss": 0.0094, "step": 14351 }, { "epoch": 2.92, "learning_rate": 0.00011256922767293195, "loss": 0.0033, "step": 14352 }, { "epoch": 2.92, "learning_rate": 0.00011255045587646323, "loss": 0.0075, "step": 14353 }, { "epoch": 2.92, "learning_rate": 0.00011253168470547268, "loss": 0.0083, "step": 14354 }, { "epoch": 2.92, "learning_rate": 0.00011251291416027367, "loss": 0.0064, "step": 14355 }, { "epoch": 2.92, "learning_rate": 0.00011249414424117975, "loss": 0.0022, "step": 14356 }, { "epoch": 2.92, "learning_rate": 0.00011247537494850444, "loss": 0.0004, "step": 14357 }, { "epoch": 2.92, "learning_rate": 0.00011245660628256115, "loss": 0.0047, "step": 14358 }, { "epoch": 2.92, "learning_rate": 0.0001124378382436635, "loss": 0.0103, "step": 14359 }, { "epoch": 2.92, "learning_rate": 0.00011241907083212483, "loss": 0.0094, "step": 14360 }, { "epoch": 2.92, "learning_rate": 0.00011240030404825854, "loss": 0.0102, "step": 14361 }, { "epoch": 2.92, "learning_rate": 0.00011238153789237821, "loss": 0.0075, "step": 14362 }, { "epoch": 2.92, "learning_rate": 0.00011236277236479717, "loss": 0.0022, "step": 14363 }, { "epoch": 2.92, "learning_rate": 0.00011234400746582892, "loss": 0.0028, "step": 14364 }, { "epoch": 2.92, "learning_rate": 0.00011232524319578681, "loss": 0.0149, "step": 14365 }, { "epoch": 2.93, "learning_rate": 0.00011230647955498424, "loss": 0.0016, "step": 14366 }, { "epoch": 2.93, "learning_rate": 0.00011228771654373464, "loss": 0.0063, "step": 14367 }, { "epoch": 2.93, "learning_rate": 0.00011226895416235133, "loss": 0.0041, "step": 14368 }, { "epoch": 2.93, "learning_rate": 0.00011225019241114772, "loss": 0.0087, "step": 14369 }, { "epoch": 2.93, "learning_rate": 0.00011223143129043719, "loss": 0.0049, "step": 14370 }, { "epoch": 2.93, "learning_rate": 0.00011221267080053297, "loss": 0.0139, "step": 14371 }, { "epoch": 2.93, "learning_rate": 0.00011219391094174856, "loss": 0.0042, "step": 14372 }, { "epoch": 2.93, "learning_rate": 0.00011217515171439714, "loss": 0.0055, "step": 14373 }, { "epoch": 2.93, "learning_rate": 0.00011215639311879212, "loss": 0.0186, "step": 14374 }, { "epoch": 2.93, "learning_rate": 0.00011213763515524681, "loss": 0.0071, "step": 14375 }, { "epoch": 2.93, "learning_rate": 0.00011211887782407436, "loss": 0.0075, "step": 14376 }, { "epoch": 2.93, "learning_rate": 0.00011210012112558821, "loss": 0.0226, "step": 14377 }, { "epoch": 2.93, "learning_rate": 0.00011208136506010157, "loss": 0.0056, "step": 14378 }, { "epoch": 2.93, "learning_rate": 0.00011206260962792773, "loss": 0.0062, "step": 14379 }, { "epoch": 2.93, "learning_rate": 0.00011204385482937993, "loss": 0.0219, "step": 14380 }, { "epoch": 2.93, "learning_rate": 0.00011202510066477134, "loss": 0.0081, "step": 14381 }, { "epoch": 2.93, "learning_rate": 0.00011200634713441533, "loss": 0.0076, "step": 14382 }, { "epoch": 2.93, "learning_rate": 0.00011198759423862503, "loss": 0.0067, "step": 14383 }, { "epoch": 2.93, "learning_rate": 0.00011196884197771358, "loss": 0.0166, "step": 14384 }, { "epoch": 2.93, "learning_rate": 0.00011195009035199436, "loss": 0.0104, "step": 14385 }, { "epoch": 2.93, "learning_rate": 0.00011193133936178037, "loss": 0.0145, "step": 14386 }, { "epoch": 2.93, "learning_rate": 0.00011191258900738493, "loss": 0.0109, "step": 14387 }, { "epoch": 2.93, "learning_rate": 0.0001118938392891211, "loss": 0.001, "step": 14388 }, { "epoch": 2.93, "learning_rate": 0.00011187509020730209, "loss": 0.0316, "step": 14389 }, { "epoch": 2.93, "learning_rate": 0.00011185634176224111, "loss": 0.0046, "step": 14390 }, { "epoch": 2.93, "learning_rate": 0.00011183759395425113, "loss": 0.0112, "step": 14391 }, { "epoch": 2.93, "learning_rate": 0.00011181884678364543, "loss": 0.0029, "step": 14392 }, { "epoch": 2.93, "learning_rate": 0.00011180010025073708, "loss": 0.007, "step": 14393 }, { "epoch": 2.93, "learning_rate": 0.00011178135435583908, "loss": 0.0101, "step": 14394 }, { "epoch": 2.93, "learning_rate": 0.00011176260909926468, "loss": 0.0135, "step": 14395 }, { "epoch": 2.93, "learning_rate": 0.00011174386448132683, "loss": 0.0213, "step": 14396 }, { "epoch": 2.93, "learning_rate": 0.00011172512050233872, "loss": 0.0073, "step": 14397 }, { "epoch": 2.93, "learning_rate": 0.00011170637716261329, "loss": 0.0055, "step": 14398 }, { "epoch": 2.93, "learning_rate": 0.00011168763446246365, "loss": 0.0028, "step": 14399 }, { "epoch": 2.93, "learning_rate": 0.00011166889240220286, "loss": 0.0061, "step": 14400 }, { "epoch": 2.93, "learning_rate": 0.00011165015098214389, "loss": 0.0098, "step": 14401 }, { "epoch": 2.93, "learning_rate": 0.00011163141020259985, "loss": 0.0053, "step": 14402 }, { "epoch": 2.93, "learning_rate": 0.00011161267006388367, "loss": 0.0051, "step": 14403 }, { "epoch": 2.93, "learning_rate": 0.00011159393056630828, "loss": 0.0031, "step": 14404 }, { "epoch": 2.93, "learning_rate": 0.00011157519171018686, "loss": 0.0075, "step": 14405 }, { "epoch": 2.93, "learning_rate": 0.00011155645349583221, "loss": 0.0058, "step": 14406 }, { "epoch": 2.93, "learning_rate": 0.00011153771592355735, "loss": 0.0168, "step": 14407 }, { "epoch": 2.93, "learning_rate": 0.00011151897899367524, "loss": 0.0058, "step": 14408 }, { "epoch": 2.93, "learning_rate": 0.00011150024270649883, "loss": 0.01, "step": 14409 }, { "epoch": 2.93, "learning_rate": 0.00011148150706234102, "loss": 0.0071, "step": 14410 }, { "epoch": 2.93, "learning_rate": 0.0001114627720615148, "loss": 0.0063, "step": 14411 }, { "epoch": 2.93, "learning_rate": 0.00011144403770433295, "loss": 0.0108, "step": 14412 }, { "epoch": 2.93, "learning_rate": 0.00011142530399110853, "loss": 0.0217, "step": 14413 }, { "epoch": 2.93, "learning_rate": 0.00011140657092215429, "loss": 0.0067, "step": 14414 }, { "epoch": 2.94, "learning_rate": 0.00011138783849778322, "loss": 0.0075, "step": 14415 }, { "epoch": 2.94, "learning_rate": 0.00011136910671830814, "loss": 0.004, "step": 14416 }, { "epoch": 2.94, "learning_rate": 0.00011135037558404182, "loss": 0.012, "step": 14417 }, { "epoch": 2.94, "learning_rate": 0.0001113316450952972, "loss": 0.0072, "step": 14418 }, { "epoch": 2.94, "learning_rate": 0.00011131291525238715, "loss": 0.0038, "step": 14419 }, { "epoch": 2.94, "learning_rate": 0.0001112941860556244, "loss": 0.0022, "step": 14420 }, { "epoch": 2.94, "learning_rate": 0.00011127545750532186, "loss": 0.0202, "step": 14421 }, { "epoch": 2.94, "learning_rate": 0.00011125672960179218, "loss": 0.0062, "step": 14422 }, { "epoch": 2.94, "learning_rate": 0.00011123800234534834, "loss": 0.0029, "step": 14423 }, { "epoch": 2.94, "learning_rate": 0.00011121927573630298, "loss": 0.0045, "step": 14424 }, { "epoch": 2.94, "learning_rate": 0.00011120054977496895, "loss": 0.0036, "step": 14425 }, { "epoch": 2.94, "learning_rate": 0.000111181824461659, "loss": 0.0047, "step": 14426 }, { "epoch": 2.94, "learning_rate": 0.00011116309979668579, "loss": 0.0035, "step": 14427 }, { "epoch": 2.94, "learning_rate": 0.00011114437578036218, "loss": 0.016, "step": 14428 }, { "epoch": 2.94, "learning_rate": 0.0001111256524130008, "loss": 0.0042, "step": 14429 }, { "epoch": 2.94, "learning_rate": 0.00011110692969491439, "loss": 0.0074, "step": 14430 }, { "epoch": 2.94, "learning_rate": 0.00011108820762641573, "loss": 0.002, "step": 14431 }, { "epoch": 2.94, "learning_rate": 0.00011106948620781738, "loss": 0.0061, "step": 14432 }, { "epoch": 2.94, "learning_rate": 0.00011105076543943218, "loss": 0.0055, "step": 14433 }, { "epoch": 2.94, "learning_rate": 0.0001110320453215727, "loss": 0.0153, "step": 14434 }, { "epoch": 2.94, "learning_rate": 0.00011101332585455157, "loss": 0.0024, "step": 14435 }, { "epoch": 2.94, "learning_rate": 0.00011099460703868154, "loss": 0.0181, "step": 14436 }, { "epoch": 2.94, "learning_rate": 0.00011097588887427514, "loss": 0.006, "step": 14437 }, { "epoch": 2.94, "learning_rate": 0.00011095717136164513, "loss": 0.0031, "step": 14438 }, { "epoch": 2.94, "learning_rate": 0.00011093845450110403, "loss": 0.0155, "step": 14439 }, { "epoch": 2.94, "learning_rate": 0.00011091973829296446, "loss": 0.0061, "step": 14440 }, { "epoch": 2.94, "learning_rate": 0.00011090102273753904, "loss": 0.0161, "step": 14441 }, { "epoch": 2.94, "learning_rate": 0.00011088230783514031, "loss": 0.0135, "step": 14442 }, { "epoch": 2.94, "learning_rate": 0.00011086359358608095, "loss": 0.02, "step": 14443 }, { "epoch": 2.94, "learning_rate": 0.00011084487999067343, "loss": 0.0131, "step": 14444 }, { "epoch": 2.94, "learning_rate": 0.00011082616704923028, "loss": 0.001, "step": 14445 }, { "epoch": 2.94, "learning_rate": 0.00011080745476206414, "loss": 0.0036, "step": 14446 }, { "epoch": 2.94, "learning_rate": 0.00011078874312948743, "loss": 0.0124, "step": 14447 }, { "epoch": 2.94, "learning_rate": 0.0001107700321518128, "loss": 0.0082, "step": 14448 }, { "epoch": 2.94, "learning_rate": 0.00011075132182935262, "loss": 0.0012, "step": 14449 }, { "epoch": 2.94, "learning_rate": 0.00011073261216241949, "loss": 0.0102, "step": 14450 }, { "epoch": 2.94, "learning_rate": 0.00011071390315132583, "loss": 0.0148, "step": 14451 }, { "epoch": 2.94, "learning_rate": 0.00011069519479638412, "loss": 0.0093, "step": 14452 }, { "epoch": 2.94, "learning_rate": 0.00011067648709790694, "loss": 0.0082, "step": 14453 }, { "epoch": 2.94, "learning_rate": 0.00011065778005620662, "loss": 0.0072, "step": 14454 }, { "epoch": 2.94, "learning_rate": 0.00011063907367159558, "loss": 0.007, "step": 14455 }, { "epoch": 2.94, "learning_rate": 0.00011062036794438639, "loss": 0.0055, "step": 14456 }, { "epoch": 2.94, "learning_rate": 0.00011060166287489138, "loss": 0.0108, "step": 14457 }, { "epoch": 2.94, "learning_rate": 0.0001105829584634229, "loss": 0.0028, "step": 14458 }, { "epoch": 2.94, "learning_rate": 0.00011056425471029346, "loss": 0.0037, "step": 14459 }, { "epoch": 2.94, "learning_rate": 0.0001105455516158154, "loss": 0.0025, "step": 14460 }, { "epoch": 2.94, "learning_rate": 0.00011052684918030109, "loss": 0.0043, "step": 14461 }, { "epoch": 2.94, "learning_rate": 0.00011050814740406297, "loss": 0.007, "step": 14462 }, { "epoch": 2.94, "learning_rate": 0.00011048944628741327, "loss": 0.0054, "step": 14463 }, { "epoch": 2.95, "learning_rate": 0.00011047074583066444, "loss": 0.0018, "step": 14464 }, { "epoch": 2.95, "learning_rate": 0.0001104520460341287, "loss": 0.0272, "step": 14465 }, { "epoch": 2.95, "learning_rate": 0.00011043334689811854, "loss": 0.0028, "step": 14466 }, { "epoch": 2.95, "learning_rate": 0.00011041464842294615, "loss": 0.0095, "step": 14467 }, { "epoch": 2.95, "learning_rate": 0.0001103959506089238, "loss": 0.0048, "step": 14468 }, { "epoch": 2.95, "learning_rate": 0.0001103772534563639, "loss": 0.0009, "step": 14469 }, { "epoch": 2.95, "learning_rate": 0.00011035855696557859, "loss": 0.0048, "step": 14470 }, { "epoch": 2.95, "learning_rate": 0.00011033986113688024, "loss": 0.0022, "step": 14471 }, { "epoch": 2.95, "learning_rate": 0.00011032116597058111, "loss": 0.0188, "step": 14472 }, { "epoch": 2.95, "learning_rate": 0.00011030247146699332, "loss": 0.0325, "step": 14473 }, { "epoch": 2.95, "learning_rate": 0.00011028377762642929, "loss": 0.0061, "step": 14474 }, { "epoch": 2.95, "learning_rate": 0.00011026508444920107, "loss": 0.0201, "step": 14475 }, { "epoch": 2.95, "learning_rate": 0.000110246391935621, "loss": 0.0099, "step": 14476 }, { "epoch": 2.95, "learning_rate": 0.00011022770008600123, "loss": 0.0123, "step": 14477 }, { "epoch": 2.95, "learning_rate": 0.00011020900890065387, "loss": 0.0039, "step": 14478 }, { "epoch": 2.95, "learning_rate": 0.00011019031837989123, "loss": 0.0079, "step": 14479 }, { "epoch": 2.95, "learning_rate": 0.00011017162852402541, "loss": 0.0212, "step": 14480 }, { "epoch": 2.95, "learning_rate": 0.00011015293933336857, "loss": 0.0073, "step": 14481 }, { "epoch": 2.95, "learning_rate": 0.00011013425080823287, "loss": 0.0064, "step": 14482 }, { "epoch": 2.95, "learning_rate": 0.00011011556294893036, "loss": 0.0072, "step": 14483 }, { "epoch": 2.95, "learning_rate": 0.00011009687575577333, "loss": 0.0043, "step": 14484 }, { "epoch": 2.95, "learning_rate": 0.00011007818922907379, "loss": 0.0128, "step": 14485 }, { "epoch": 2.95, "learning_rate": 0.00011005950336914378, "loss": 0.0048, "step": 14486 }, { "epoch": 2.95, "learning_rate": 0.00011004081817629554, "loss": 0.0087, "step": 14487 }, { "epoch": 2.95, "learning_rate": 0.00011002213365084099, "loss": 0.0127, "step": 14488 }, { "epoch": 2.95, "learning_rate": 0.00011000344979309232, "loss": 0.0137, "step": 14489 }, { "epoch": 2.95, "learning_rate": 0.00010998476660336153, "loss": 0.0159, "step": 14490 }, { "epoch": 2.95, "learning_rate": 0.00010996608408196067, "loss": 0.0048, "step": 14491 }, { "epoch": 2.95, "learning_rate": 0.00010994740222920176, "loss": 0.0049, "step": 14492 }, { "epoch": 2.95, "learning_rate": 0.00010992872104539685, "loss": 0.0127, "step": 14493 }, { "epoch": 2.95, "learning_rate": 0.00010991004053085792, "loss": 0.0076, "step": 14494 }, { "epoch": 2.95, "learning_rate": 0.00010989136068589704, "loss": 0.0068, "step": 14495 }, { "epoch": 2.95, "learning_rate": 0.00010987268151082607, "loss": 0.0074, "step": 14496 }, { "epoch": 2.95, "learning_rate": 0.00010985400300595715, "loss": 0.0113, "step": 14497 }, { "epoch": 2.95, "learning_rate": 0.00010983532517160207, "loss": 0.0054, "step": 14498 }, { "epoch": 2.95, "learning_rate": 0.00010981664800807296, "loss": 0.007, "step": 14499 }, { "epoch": 2.95, "learning_rate": 0.00010979797151568167, "loss": 0.0517, "step": 14500 }, { "epoch": 2.95, "learning_rate": 0.00010977929569474008, "loss": 0.0173, "step": 14501 }, { "epoch": 2.95, "learning_rate": 0.0001097606205455602, "loss": 0.0021, "step": 14502 }, { "epoch": 2.95, "learning_rate": 0.00010974194606845394, "loss": 0.005, "step": 14503 }, { "epoch": 2.95, "learning_rate": 0.00010972327226373314, "loss": 0.0037, "step": 14504 }, { "epoch": 2.95, "learning_rate": 0.00010970459913170976, "loss": 0.003, "step": 14505 }, { "epoch": 2.95, "learning_rate": 0.00010968592667269557, "loss": 0.0011, "step": 14506 }, { "epoch": 2.95, "learning_rate": 0.00010966725488700258, "loss": 0.0048, "step": 14507 }, { "epoch": 2.95, "learning_rate": 0.00010964858377494256, "loss": 0.0055, "step": 14508 }, { "epoch": 2.95, "learning_rate": 0.0001096299133368273, "loss": 0.0055, "step": 14509 }, { "epoch": 2.95, "learning_rate": 0.00010961124357296874, "loss": 0.0092, "step": 14510 }, { "epoch": 2.95, "learning_rate": 0.00010959257448367862, "loss": 0.0087, "step": 14511 }, { "epoch": 2.95, "learning_rate": 0.00010957390606926878, "loss": 0.0009, "step": 14512 }, { "epoch": 2.96, "learning_rate": 0.00010955523833005108, "loss": 0.0043, "step": 14513 }, { "epoch": 2.96, "learning_rate": 0.00010953657126633716, "loss": 0.003, "step": 14514 }, { "epoch": 2.96, "learning_rate": 0.00010951790487843894, "loss": 0.0025, "step": 14515 }, { "epoch": 2.96, "learning_rate": 0.00010949923916666807, "loss": 0.0128, "step": 14516 }, { "epoch": 2.96, "learning_rate": 0.00010948057413133641, "loss": 0.0031, "step": 14517 }, { "epoch": 2.96, "learning_rate": 0.00010946190977275567, "loss": 0.0034, "step": 14518 }, { "epoch": 2.96, "learning_rate": 0.00010944324609123746, "loss": 0.0124, "step": 14519 }, { "epoch": 2.96, "learning_rate": 0.00010942458308709369, "loss": 0.0076, "step": 14520 }, { "epoch": 2.96, "learning_rate": 0.0001094059207606359, "loss": 0.0119, "step": 14521 }, { "epoch": 2.96, "learning_rate": 0.00010938725911217593, "loss": 0.0029, "step": 14522 }, { "epoch": 2.96, "learning_rate": 0.00010936859814202537, "loss": 0.0038, "step": 14523 }, { "epoch": 2.96, "learning_rate": 0.00010934993785049586, "loss": 0.0302, "step": 14524 }, { "epoch": 2.96, "learning_rate": 0.0001093312782378992, "loss": 0.0071, "step": 14525 }, { "epoch": 2.96, "learning_rate": 0.0001093126193045469, "loss": 0.0035, "step": 14526 }, { "epoch": 2.96, "learning_rate": 0.00010929396105075071, "loss": 0.0028, "step": 14527 }, { "epoch": 2.96, "learning_rate": 0.00010927530347682222, "loss": 0.0127, "step": 14528 }, { "epoch": 2.96, "learning_rate": 0.00010925664658307297, "loss": 0.0075, "step": 14529 }, { "epoch": 2.96, "learning_rate": 0.00010923799036981469, "loss": 0.0035, "step": 14530 }, { "epoch": 2.96, "learning_rate": 0.00010921933483735889, "loss": 0.0011, "step": 14531 }, { "epoch": 2.96, "learning_rate": 0.00010920067998601719, "loss": 0.0087, "step": 14532 }, { "epoch": 2.96, "learning_rate": 0.00010918202581610113, "loss": 0.0083, "step": 14533 }, { "epoch": 2.96, "learning_rate": 0.00010916337232792228, "loss": 0.0021, "step": 14534 }, { "epoch": 2.96, "learning_rate": 0.0001091447195217922, "loss": 0.0151, "step": 14535 }, { "epoch": 2.96, "learning_rate": 0.00010912606739802246, "loss": 0.0092, "step": 14536 }, { "epoch": 2.96, "learning_rate": 0.0001091074159569245, "loss": 0.0044, "step": 14537 }, { "epoch": 2.96, "learning_rate": 0.00010908876519880994, "loss": 0.0128, "step": 14538 }, { "epoch": 2.96, "learning_rate": 0.00010907011512399015, "loss": 0.0111, "step": 14539 }, { "epoch": 2.96, "learning_rate": 0.00010905146573277678, "loss": 0.0201, "step": 14540 }, { "epoch": 2.96, "learning_rate": 0.00010903281702548123, "loss": 0.0288, "step": 14541 }, { "epoch": 2.96, "learning_rate": 0.00010901416900241487, "loss": 0.0027, "step": 14542 }, { "epoch": 2.96, "learning_rate": 0.00010899552166388931, "loss": 0.0018, "step": 14543 }, { "epoch": 2.96, "learning_rate": 0.00010897687501021593, "loss": 0.0051, "step": 14544 }, { "epoch": 2.96, "learning_rate": 0.0001089582290417062, "loss": 0.004, "step": 14545 }, { "epoch": 2.96, "learning_rate": 0.00010893958375867151, "loss": 0.014, "step": 14546 }, { "epoch": 2.96, "learning_rate": 0.00010892093916142325, "loss": 0.0032, "step": 14547 }, { "epoch": 2.96, "learning_rate": 0.0001089022952502729, "loss": 0.0146, "step": 14548 }, { "epoch": 2.96, "learning_rate": 0.0001088836520255317, "loss": 0.0086, "step": 14549 }, { "epoch": 2.96, "learning_rate": 0.00010886500948751124, "loss": 0.0037, "step": 14550 }, { "epoch": 2.96, "learning_rate": 0.00010884636763652274, "loss": 0.0138, "step": 14551 }, { "epoch": 2.96, "learning_rate": 0.00010882772647287753, "loss": 0.0029, "step": 14552 }, { "epoch": 2.96, "learning_rate": 0.00010880908599688707, "loss": 0.0049, "step": 14553 }, { "epoch": 2.96, "learning_rate": 0.00010879044620886259, "loss": 0.0078, "step": 14554 }, { "epoch": 2.96, "learning_rate": 0.00010877180710911541, "loss": 0.0101, "step": 14555 }, { "epoch": 2.96, "learning_rate": 0.00010875316869795696, "loss": 0.0038, "step": 14556 }, { "epoch": 2.96, "learning_rate": 0.00010873453097569835, "loss": 0.016, "step": 14557 }, { "epoch": 2.96, "learning_rate": 0.00010871589394265106, "loss": 0.0051, "step": 14558 }, { "epoch": 2.96, "learning_rate": 0.00010869725759912627, "loss": 0.0054, "step": 14559 }, { "epoch": 2.96, "learning_rate": 0.00010867862194543517, "loss": 0.0016, "step": 14560 }, { "epoch": 2.96, "learning_rate": 0.00010865998698188915, "loss": 0.0101, "step": 14561 }, { "epoch": 2.97, "learning_rate": 0.00010864135270879932, "loss": 0.0152, "step": 14562 }, { "epoch": 2.97, "learning_rate": 0.00010862271912647703, "loss": 0.0068, "step": 14563 }, { "epoch": 2.97, "learning_rate": 0.0001086040862352334, "loss": 0.005, "step": 14564 }, { "epoch": 2.97, "learning_rate": 0.00010858545403537965, "loss": 0.0104, "step": 14565 }, { "epoch": 2.97, "learning_rate": 0.00010856682252722706, "loss": 0.0202, "step": 14566 }, { "epoch": 2.97, "learning_rate": 0.00010854819171108665, "loss": 0.0043, "step": 14567 }, { "epoch": 2.97, "learning_rate": 0.00010852956158726977, "loss": 0.0023, "step": 14568 }, { "epoch": 2.97, "learning_rate": 0.0001085109321560875, "loss": 0.0026, "step": 14569 }, { "epoch": 2.97, "learning_rate": 0.00010849230341785091, "loss": 0.0066, "step": 14570 }, { "epoch": 2.97, "learning_rate": 0.00010847367537287127, "loss": 0.0026, "step": 14571 }, { "epoch": 2.97, "learning_rate": 0.00010845504802145956, "loss": 0.017, "step": 14572 }, { "epoch": 2.97, "learning_rate": 0.00010843642136392704, "loss": 0.007, "step": 14573 }, { "epoch": 2.97, "learning_rate": 0.00010841779540058471, "loss": 0.0015, "step": 14574 }, { "epoch": 2.97, "learning_rate": 0.0001083991701317437, "loss": 0.0091, "step": 14575 }, { "epoch": 2.97, "learning_rate": 0.00010838054555771505, "loss": 0.0042, "step": 14576 }, { "epoch": 2.97, "learning_rate": 0.00010836192167880991, "loss": 0.0045, "step": 14577 }, { "epoch": 2.97, "learning_rate": 0.0001083432984953392, "loss": 0.0167, "step": 14578 }, { "epoch": 2.97, "learning_rate": 0.00010832467600761409, "loss": 0.0135, "step": 14579 }, { "epoch": 2.97, "learning_rate": 0.00010830605421594552, "loss": 0.0019, "step": 14580 }, { "epoch": 2.97, "learning_rate": 0.00010828743312064459, "loss": 0.003, "step": 14581 }, { "epoch": 2.97, "learning_rate": 0.00010826881272202229, "loss": 0.0131, "step": 14582 }, { "epoch": 2.97, "learning_rate": 0.0001082501930203895, "loss": 0.0084, "step": 14583 }, { "epoch": 2.97, "learning_rate": 0.00010823157401605734, "loss": 0.0049, "step": 14584 }, { "epoch": 2.97, "learning_rate": 0.00010821295570933673, "loss": 0.0047, "step": 14585 }, { "epoch": 2.97, "learning_rate": 0.00010819433810053864, "loss": 0.0005, "step": 14586 }, { "epoch": 2.97, "learning_rate": 0.00010817572118997405, "loss": 0.0149, "step": 14587 }, { "epoch": 2.97, "learning_rate": 0.00010815710497795381, "loss": 0.0051, "step": 14588 }, { "epoch": 2.97, "learning_rate": 0.00010813848946478896, "loss": 0.0047, "step": 14589 }, { "epoch": 2.97, "learning_rate": 0.00010811987465079028, "loss": 0.0084, "step": 14590 }, { "epoch": 2.97, "learning_rate": 0.00010810126053626883, "loss": 0.0069, "step": 14591 }, { "epoch": 2.97, "learning_rate": 0.0001080826471215354, "loss": 0.0105, "step": 14592 }, { "epoch": 2.97, "learning_rate": 0.00010806403440690083, "loss": 0.0032, "step": 14593 }, { "epoch": 2.97, "learning_rate": 0.00010804542239267612, "loss": 0.0033, "step": 14594 }, { "epoch": 2.97, "learning_rate": 0.00010802681107917198, "loss": 0.0041, "step": 14595 }, { "epoch": 2.97, "learning_rate": 0.00010800820046669935, "loss": 0.0131, "step": 14596 }, { "epoch": 2.97, "learning_rate": 0.00010798959055556907, "loss": 0.0064, "step": 14597 }, { "epoch": 2.97, "learning_rate": 0.00010797098134609188, "loss": 0.0146, "step": 14598 }, { "epoch": 2.97, "learning_rate": 0.00010795237283857868, "loss": 0.005, "step": 14599 }, { "epoch": 2.97, "learning_rate": 0.00010793376503334017, "loss": 0.0005, "step": 14600 }, { "epoch": 2.97, "learning_rate": 0.00010791515793068726, "loss": 0.0146, "step": 14601 }, { "epoch": 2.97, "learning_rate": 0.00010789655153093065, "loss": 0.0026, "step": 14602 }, { "epoch": 2.97, "learning_rate": 0.00010787794583438103, "loss": 0.0048, "step": 14603 }, { "epoch": 2.97, "learning_rate": 0.00010785934084134931, "loss": 0.0064, "step": 14604 }, { "epoch": 2.97, "learning_rate": 0.0001078407365521461, "loss": 0.0033, "step": 14605 }, { "epoch": 2.97, "learning_rate": 0.00010782213296708217, "loss": 0.0039, "step": 14606 }, { "epoch": 2.97, "learning_rate": 0.00010780353008646823, "loss": 0.0119, "step": 14607 }, { "epoch": 2.97, "learning_rate": 0.00010778492791061496, "loss": 0.0206, "step": 14608 }, { "epoch": 2.97, "learning_rate": 0.00010776632643983316, "loss": 0.0078, "step": 14609 }, { "epoch": 2.97, "learning_rate": 0.00010774772567443341, "loss": 0.0097, "step": 14610 }, { "epoch": 2.98, "learning_rate": 0.00010772912561472633, "loss": 0.0028, "step": 14611 }, { "epoch": 2.98, "learning_rate": 0.00010771052626102273, "loss": 0.0083, "step": 14612 }, { "epoch": 2.98, "learning_rate": 0.0001076919276136331, "loss": 0.0042, "step": 14613 }, { "epoch": 2.98, "learning_rate": 0.0001076733296728682, "loss": 0.0039, "step": 14614 }, { "epoch": 2.98, "learning_rate": 0.00010765473243903856, "loss": 0.0071, "step": 14615 }, { "epoch": 2.98, "learning_rate": 0.00010763613591245482, "loss": 0.0089, "step": 14616 }, { "epoch": 2.98, "learning_rate": 0.00010761754009342758, "loss": 0.0056, "step": 14617 }, { "epoch": 2.98, "learning_rate": 0.00010759894498226743, "loss": 0.0112, "step": 14618 }, { "epoch": 2.98, "learning_rate": 0.0001075803505792849, "loss": 0.0067, "step": 14619 }, { "epoch": 2.98, "learning_rate": 0.00010756175688479065, "loss": 0.0123, "step": 14620 }, { "epoch": 2.98, "learning_rate": 0.00010754316389909513, "loss": 0.0159, "step": 14621 }, { "epoch": 2.98, "learning_rate": 0.00010752457162250893, "loss": 0.0026, "step": 14622 }, { "epoch": 2.98, "learning_rate": 0.00010750598005534253, "loss": 0.0093, "step": 14623 }, { "epoch": 2.98, "learning_rate": 0.00010748738919790652, "loss": 0.0083, "step": 14624 }, { "epoch": 2.98, "learning_rate": 0.00010746879905051137, "loss": 0.002, "step": 14625 }, { "epoch": 2.98, "learning_rate": 0.0001074502096134675, "loss": 0.0174, "step": 14626 }, { "epoch": 2.98, "learning_rate": 0.00010743162088708547, "loss": 0.0166, "step": 14627 }, { "epoch": 2.98, "learning_rate": 0.00010741303287167576, "loss": 0.0147, "step": 14628 }, { "epoch": 2.98, "learning_rate": 0.00010739444556754873, "loss": 0.0031, "step": 14629 }, { "epoch": 2.98, "learning_rate": 0.00010737585897501494, "loss": 0.003, "step": 14630 }, { "epoch": 2.98, "learning_rate": 0.0001073572730943847, "loss": 0.0036, "step": 14631 }, { "epoch": 2.98, "learning_rate": 0.00010733868792596856, "loss": 0.0044, "step": 14632 }, { "epoch": 2.98, "learning_rate": 0.00010732010347007686, "loss": 0.0111, "step": 14633 }, { "epoch": 2.98, "learning_rate": 0.00010730151972701992, "loss": 0.0336, "step": 14634 }, { "epoch": 2.98, "learning_rate": 0.00010728293669710829, "loss": 0.0009, "step": 14635 }, { "epoch": 2.98, "learning_rate": 0.00010726435438065216, "loss": 0.0185, "step": 14636 }, { "epoch": 2.98, "learning_rate": 0.00010724577277796203, "loss": 0.0055, "step": 14637 }, { "epoch": 2.98, "learning_rate": 0.00010722719188934822, "loss": 0.011, "step": 14638 }, { "epoch": 2.98, "learning_rate": 0.000107208611715121, "loss": 0.0029, "step": 14639 }, { "epoch": 2.98, "learning_rate": 0.00010719003225559079, "loss": 0.0139, "step": 14640 }, { "epoch": 2.98, "learning_rate": 0.00010717145351106778, "loss": 0.0141, "step": 14641 }, { "epoch": 2.98, "learning_rate": 0.00010715287548186241, "loss": 0.0049, "step": 14642 }, { "epoch": 2.98, "learning_rate": 0.00010713429816828491, "loss": 0.0107, "step": 14643 }, { "epoch": 2.98, "learning_rate": 0.00010711572157064549, "loss": 0.0049, "step": 14644 }, { "epoch": 2.98, "learning_rate": 0.00010709714568925449, "loss": 0.0029, "step": 14645 }, { "epoch": 2.98, "learning_rate": 0.00010707857052442212, "loss": 0.009, "step": 14646 }, { "epoch": 2.98, "learning_rate": 0.00010705999607645868, "loss": 0.0143, "step": 14647 }, { "epoch": 2.98, "learning_rate": 0.00010704142234567434, "loss": 0.007, "step": 14648 }, { "epoch": 2.98, "learning_rate": 0.0001070228493323793, "loss": 0.0165, "step": 14649 }, { "epoch": 2.98, "learning_rate": 0.00010700427703688388, "loss": 0.004, "step": 14650 }, { "epoch": 2.98, "learning_rate": 0.00010698570545949818, "loss": 0.0052, "step": 14651 }, { "epoch": 2.98, "learning_rate": 0.00010696713460053233, "loss": 0.0134, "step": 14652 }, { "epoch": 2.98, "learning_rate": 0.00010694856446029663, "loss": 0.0014, "step": 14653 }, { "epoch": 2.98, "learning_rate": 0.00010692999503910112, "loss": 0.0097, "step": 14654 }, { "epoch": 2.98, "learning_rate": 0.00010691142633725603, "loss": 0.004, "step": 14655 }, { "epoch": 2.98, "learning_rate": 0.00010689285835507145, "loss": 0.0024, "step": 14656 }, { "epoch": 2.98, "learning_rate": 0.00010687429109285747, "loss": 0.01, "step": 14657 }, { "epoch": 2.98, "learning_rate": 0.00010685572455092427, "loss": 0.0064, "step": 14658 }, { "epoch": 2.98, "learning_rate": 0.00010683715872958187, "loss": 0.0031, "step": 14659 }, { "epoch": 2.99, "learning_rate": 0.00010681859362914045, "loss": 0.0075, "step": 14660 }, { "epoch": 2.99, "learning_rate": 0.00010680002924991001, "loss": 0.011, "step": 14661 }, { "epoch": 2.99, "learning_rate": 0.00010678146559220058, "loss": 0.0049, "step": 14662 }, { "epoch": 2.99, "learning_rate": 0.00010676290265632232, "loss": 0.0076, "step": 14663 }, { "epoch": 2.99, "learning_rate": 0.00010674434044258514, "loss": 0.0225, "step": 14664 }, { "epoch": 2.99, "learning_rate": 0.0001067257789512992, "loss": 0.0157, "step": 14665 }, { "epoch": 2.99, "learning_rate": 0.00010670721818277443, "loss": 0.0049, "step": 14666 }, { "epoch": 2.99, "learning_rate": 0.00010668865813732076, "loss": 0.0044, "step": 14667 }, { "epoch": 2.99, "learning_rate": 0.00010667009881524832, "loss": 0.0012, "step": 14668 }, { "epoch": 2.99, "learning_rate": 0.00010665154021686699, "loss": 0.0029, "step": 14669 }, { "epoch": 2.99, "learning_rate": 0.00010663298234248678, "loss": 0.0046, "step": 14670 }, { "epoch": 2.99, "learning_rate": 0.00010661442519241764, "loss": 0.0018, "step": 14671 }, { "epoch": 2.99, "learning_rate": 0.00010659586876696943, "loss": 0.0173, "step": 14672 }, { "epoch": 2.99, "learning_rate": 0.00010657731306645222, "loss": 0.0008, "step": 14673 }, { "epoch": 2.99, "learning_rate": 0.0001065587580911758, "loss": 0.0024, "step": 14674 }, { "epoch": 2.99, "learning_rate": 0.00010654020384145017, "loss": 0.0018, "step": 14675 }, { "epoch": 2.99, "learning_rate": 0.00010652165031758516, "loss": 0.0278, "step": 14676 }, { "epoch": 2.99, "learning_rate": 0.00010650309751989061, "loss": 0.0064, "step": 14677 }, { "epoch": 2.99, "learning_rate": 0.00010648454544867649, "loss": 0.0023, "step": 14678 }, { "epoch": 2.99, "learning_rate": 0.00010646599410425257, "loss": 0.0049, "step": 14679 }, { "epoch": 2.99, "learning_rate": 0.00010644744348692872, "loss": 0.0224, "step": 14680 }, { "epoch": 2.99, "learning_rate": 0.0001064288935970148, "loss": 0.0123, "step": 14681 }, { "epoch": 2.99, "learning_rate": 0.00010641034443482056, "loss": 0.014, "step": 14682 }, { "epoch": 2.99, "learning_rate": 0.00010639179600065592, "loss": 0.0181, "step": 14683 }, { "epoch": 2.99, "learning_rate": 0.00010637324829483058, "loss": 0.0073, "step": 14684 }, { "epoch": 2.99, "learning_rate": 0.0001063547013176543, "loss": 0.0148, "step": 14685 }, { "epoch": 2.99, "learning_rate": 0.00010633615506943697, "loss": 0.0085, "step": 14686 }, { "epoch": 2.99, "learning_rate": 0.00010631760955048819, "loss": 0.0131, "step": 14687 }, { "epoch": 2.99, "learning_rate": 0.00010629906476111785, "loss": 0.0071, "step": 14688 }, { "epoch": 2.99, "learning_rate": 0.00010628052070163558, "loss": 0.0051, "step": 14689 }, { "epoch": 2.99, "learning_rate": 0.00010626197737235113, "loss": 0.0089, "step": 14690 }, { "epoch": 2.99, "learning_rate": 0.00010624343477357427, "loss": 0.0145, "step": 14691 }, { "epoch": 2.99, "learning_rate": 0.00010622489290561459, "loss": 0.0103, "step": 14692 }, { "epoch": 2.99, "learning_rate": 0.00010620635176878189, "loss": 0.0084, "step": 14693 }, { "epoch": 2.99, "learning_rate": 0.00010618781136338577, "loss": 0.0085, "step": 14694 }, { "epoch": 2.99, "learning_rate": 0.00010616927168973586, "loss": 0.007, "step": 14695 }, { "epoch": 2.99, "learning_rate": 0.00010615073274814189, "loss": 0.0107, "step": 14696 }, { "epoch": 2.99, "learning_rate": 0.0001061321945389134, "loss": 0.0111, "step": 14697 }, { "epoch": 2.99, "learning_rate": 0.00010611365706236013, "loss": 0.0066, "step": 14698 }, { "epoch": 2.99, "learning_rate": 0.00010609512031879161, "loss": 0.002, "step": 14699 }, { "epoch": 2.99, "learning_rate": 0.00010607658430851744, "loss": 0.0061, "step": 14700 }, { "epoch": 2.99, "learning_rate": 0.00010605804903184723, "loss": 0.0043, "step": 14701 }, { "epoch": 2.99, "learning_rate": 0.00010603951448909059, "loss": 0.0063, "step": 14702 }, { "epoch": 2.99, "learning_rate": 0.00010602098068055696, "loss": 0.0053, "step": 14703 }, { "epoch": 2.99, "learning_rate": 0.00010600244760655605, "loss": 0.0071, "step": 14704 }, { "epoch": 2.99, "learning_rate": 0.00010598391526739724, "loss": 0.0089, "step": 14705 }, { "epoch": 2.99, "learning_rate": 0.00010596538366339017, "loss": 0.0035, "step": 14706 }, { "epoch": 2.99, "learning_rate": 0.00010594685279484435, "loss": 0.0019, "step": 14707 }, { "epoch": 2.99, "learning_rate": 0.00010592832266206916, "loss": 0.0095, "step": 14708 }, { "epoch": 3.0, "learning_rate": 0.00010590979326537424, "loss": 0.0027, "step": 14709 }, { "epoch": 3.0, "learning_rate": 0.00010589126460506896, "loss": 0.0076, "step": 14710 }, { "epoch": 3.0, "learning_rate": 0.00010587273668146284, "loss": 0.0049, "step": 14711 }, { "epoch": 3.0, "learning_rate": 0.00010585420949486534, "loss": 0.002, "step": 14712 }, { "epoch": 3.0, "learning_rate": 0.0001058356830455858, "loss": 0.0011, "step": 14713 }, { "epoch": 3.0, "learning_rate": 0.00010581715733393378, "loss": 0.0095, "step": 14714 }, { "epoch": 3.0, "learning_rate": 0.00010579863236021861, "loss": 0.01, "step": 14715 }, { "epoch": 3.0, "learning_rate": 0.00010578010812474973, "loss": 0.011, "step": 14716 }, { "epoch": 3.0, "learning_rate": 0.00010576158462783654, "loss": 0.0074, "step": 14717 }, { "epoch": 3.0, "learning_rate": 0.00010574306186978831, "loss": 0.0023, "step": 14718 }, { "epoch": 3.0, "learning_rate": 0.00010572453985091459, "loss": 0.0131, "step": 14719 }, { "epoch": 3.0, "learning_rate": 0.00010570601857152453, "loss": 0.0149, "step": 14720 }, { "epoch": 3.0, "learning_rate": 0.00010568749803192762, "loss": 0.0015, "step": 14721 }, { "epoch": 3.0, "learning_rate": 0.00010566897823243317, "loss": 0.002, "step": 14722 }, { "epoch": 3.0, "learning_rate": 0.00010565045917335039, "loss": 0.004, "step": 14723 }, { "epoch": 3.0, "learning_rate": 0.00010563194085498875, "loss": 0.012, "step": 14724 }, { "epoch": 3.0, "learning_rate": 0.00010561342327765734, "loss": 0.0012, "step": 14725 }, { "epoch": 3.0, "learning_rate": 0.00010559490644166564, "loss": 0.0066, "step": 14726 }, { "epoch": 3.0, "learning_rate": 0.00010557639034732283, "loss": 0.0044, "step": 14727 }, { "epoch": 3.0, "learning_rate": 0.00010555787499493807, "loss": 0.0021, "step": 14728 }, { "epoch": 3.0, "learning_rate": 0.00010553936038482077, "loss": 0.0032, "step": 14729 }, { "epoch": 3.0, "learning_rate": 0.00010552084651728004, "loss": 0.0043, "step": 14730 }, { "epoch": 3.0, "learning_rate": 0.00010550233339262512, "loss": 0.0143, "step": 14731 }, { "epoch": 3.0, "learning_rate": 0.00010548382101116524, "loss": 0.0198, "step": 14732 }, { "epoch": 3.0, "learning_rate": 0.00010546530937320954, "loss": 0.0072, "step": 14733 }, { "epoch": 3.0, "learning_rate": 0.00010544679847906731, "loss": 0.0055, "step": 14734 }, { "epoch": 3.0, "learning_rate": 0.00010542828832904763, "loss": 0.0055, "step": 14735 }, { "epoch": 3.0, "learning_rate": 0.00010540977892345963, "loss": 0.0037, "step": 14736 }, { "epoch": 3.0, "learning_rate": 0.00010539127026261254, "loss": 0.002, "step": 14737 }, { "epoch": 3.0, "learning_rate": 0.00010537276234681537, "loss": 0.0088, "step": 14738 }, { "epoch": 3.0, "learning_rate": 0.0001053542551763774, "loss": 0.0055, "step": 14739 }, { "epoch": 3.0, "learning_rate": 0.0001053357487516076, "loss": 0.0069, "step": 14740 }, { "epoch": 3.0, "learning_rate": 0.0001053172430728151, "loss": 0.0009, "step": 14741 }, { "epoch": 3.0, "learning_rate": 0.00010529873814030897, "loss": 0.0082, "step": 14742 }, { "epoch": 3.0, "learning_rate": 0.00010528023395439829, "loss": 0.0043, "step": 14743 }, { "epoch": 3.0, "learning_rate": 0.00010526173051539218, "loss": 0.0052, "step": 14744 }, { "epoch": 3.0, "learning_rate": 0.0001052432278235996, "loss": 0.002, "step": 14745 }, { "epoch": 3.0, "learning_rate": 0.00010522472587932955, "loss": 0.006, "step": 14746 }, { "epoch": 3.0, "learning_rate": 0.00010520622468289116, "loss": 0.0022, "step": 14747 }, { "epoch": 3.0, "learning_rate": 0.00010518772423459331, "loss": 0.0098, "step": 14748 }, { "epoch": 3.0, "learning_rate": 0.00010516922453474511, "loss": 0.0042, "step": 14749 }, { "epoch": 3.0, "learning_rate": 0.00010515072558365546, "loss": 0.0052, "step": 14750 }, { "epoch": 3.0, "learning_rate": 0.00010513222738163333, "loss": 0.0083, "step": 14751 }, { "epoch": 3.0, "learning_rate": 0.00010511372992898772, "loss": 0.0031, "step": 14752 }, { "epoch": 3.0, "learning_rate": 0.00010509523322602757, "loss": 0.0095, "step": 14753 }, { "epoch": 3.0, "learning_rate": 0.00010507673727306173, "loss": 0.0069, "step": 14754 }, { "epoch": 3.0, "learning_rate": 0.00010505824207039924, "loss": 0.0061, "step": 14755 }, { "epoch": 3.0, "learning_rate": 0.00010503974761834887, "loss": 0.0037, "step": 14756 }, { "epoch": 3.0, "learning_rate": 0.00010502125391721967, "loss": 0.0036, "step": 14757 }, { "epoch": 3.01, "learning_rate": 0.00010500276096732042, "loss": 0.0065, "step": 14758 }, { "epoch": 3.01, "learning_rate": 0.00010498426876895994, "loss": 0.0061, "step": 14759 }, { "epoch": 3.01, "learning_rate": 0.00010496577732244718, "loss": 0.0014, "step": 14760 }, { "epoch": 3.01, "learning_rate": 0.0001049472866280909, "loss": 0.0044, "step": 14761 }, { "epoch": 3.01, "learning_rate": 0.00010492879668620003, "loss": 0.0104, "step": 14762 }, { "epoch": 3.01, "learning_rate": 0.00010491030749708333, "loss": 0.002, "step": 14763 }, { "epoch": 3.01, "learning_rate": 0.00010489181906104957, "loss": 0.0061, "step": 14764 }, { "epoch": 3.01, "learning_rate": 0.00010487333137840763, "loss": 0.0058, "step": 14765 }, { "epoch": 3.01, "learning_rate": 0.00010485484444946619, "loss": 0.0064, "step": 14766 }, { "epoch": 3.01, "learning_rate": 0.00010483635827453411, "loss": 0.0122, "step": 14767 }, { "epoch": 3.01, "learning_rate": 0.00010481787285392012, "loss": 0.0022, "step": 14768 }, { "epoch": 3.01, "learning_rate": 0.00010479938818793286, "loss": 0.003, "step": 14769 }, { "epoch": 3.01, "learning_rate": 0.00010478090427688122, "loss": 0.0038, "step": 14770 }, { "epoch": 3.01, "learning_rate": 0.00010476242112107375, "loss": 0.0032, "step": 14771 }, { "epoch": 3.01, "learning_rate": 0.00010474393872081931, "loss": 0.0004, "step": 14772 }, { "epoch": 3.01, "learning_rate": 0.00010472545707642648, "loss": 0.0148, "step": 14773 }, { "epoch": 3.01, "learning_rate": 0.00010470697618820397, "loss": 0.0045, "step": 14774 }, { "epoch": 3.01, "learning_rate": 0.00010468849605646051, "loss": 0.001, "step": 14775 }, { "epoch": 3.01, "learning_rate": 0.0001046700166815047, "loss": 0.0058, "step": 14776 }, { "epoch": 3.01, "learning_rate": 0.0001046515380636451, "loss": 0.0012, "step": 14777 }, { "epoch": 3.01, "learning_rate": 0.0001046330602031905, "loss": 0.0021, "step": 14778 }, { "epoch": 3.01, "learning_rate": 0.00010461458310044934, "loss": 0.0004, "step": 14779 }, { "epoch": 3.01, "learning_rate": 0.0001045961067557304, "loss": 0.0043, "step": 14780 }, { "epoch": 3.01, "learning_rate": 0.00010457763116934213, "loss": 0.0078, "step": 14781 }, { "epoch": 3.01, "learning_rate": 0.00010455915634159318, "loss": 0.0048, "step": 14782 }, { "epoch": 3.01, "learning_rate": 0.0001045406822727921, "loss": 0.003, "step": 14783 }, { "epoch": 3.01, "learning_rate": 0.00010452220896324742, "loss": 0.004, "step": 14784 }, { "epoch": 3.01, "learning_rate": 0.00010450373641326769, "loss": 0.0063, "step": 14785 }, { "epoch": 3.01, "learning_rate": 0.00010448526462316149, "loss": 0.0026, "step": 14786 }, { "epoch": 3.01, "learning_rate": 0.00010446679359323721, "loss": 0.0044, "step": 14787 }, { "epoch": 3.01, "learning_rate": 0.0001044483233238035, "loss": 0.0029, "step": 14788 }, { "epoch": 3.01, "learning_rate": 0.00010442985381516871, "loss": 0.006, "step": 14789 }, { "epoch": 3.01, "learning_rate": 0.00010441138506764144, "loss": 0.0031, "step": 14790 }, { "epoch": 3.01, "learning_rate": 0.0001043929170815301, "loss": 0.0066, "step": 14791 }, { "epoch": 3.01, "learning_rate": 0.00010437444985714306, "loss": 0.0052, "step": 14792 }, { "epoch": 3.01, "learning_rate": 0.00010435598339478889, "loss": 0.0087, "step": 14793 }, { "epoch": 3.01, "learning_rate": 0.00010433751769477592, "loss": 0.0055, "step": 14794 }, { "epoch": 3.01, "learning_rate": 0.00010431905275741263, "loss": 0.0058, "step": 14795 }, { "epoch": 3.01, "learning_rate": 0.00010430058858300739, "loss": 0.0078, "step": 14796 }, { "epoch": 3.01, "learning_rate": 0.00010428212517186855, "loss": 0.0126, "step": 14797 }, { "epoch": 3.01, "learning_rate": 0.00010426366252430457, "loss": 0.0028, "step": 14798 }, { "epoch": 3.01, "learning_rate": 0.00010424520064062368, "loss": 0.0013, "step": 14799 }, { "epoch": 3.01, "learning_rate": 0.00010422673952113441, "loss": 0.0027, "step": 14800 }, { "epoch": 3.01, "learning_rate": 0.00010420827916614496, "loss": 0.0096, "step": 14801 }, { "epoch": 3.01, "learning_rate": 0.00010418981957596363, "loss": 0.0021, "step": 14802 }, { "epoch": 3.01, "learning_rate": 0.00010417136075089884, "loss": 0.0004, "step": 14803 }, { "epoch": 3.01, "learning_rate": 0.00010415290269125882, "loss": 0.0012, "step": 14804 }, { "epoch": 3.01, "learning_rate": 0.00010413444539735183, "loss": 0.0032, "step": 14805 }, { "epoch": 3.01, "learning_rate": 0.00010411598886948624, "loss": 0.0079, "step": 14806 }, { "epoch": 3.01, "learning_rate": 0.00010409753310797018, "loss": 0.0015, "step": 14807 }, { "epoch": 3.02, "learning_rate": 0.00010407907811311203, "loss": 0.0012, "step": 14808 }, { "epoch": 3.02, "learning_rate": 0.00010406062388521998, "loss": 0.0019, "step": 14809 }, { "epoch": 3.02, "learning_rate": 0.00010404217042460213, "loss": 0.0011, "step": 14810 }, { "epoch": 3.02, "learning_rate": 0.00010402371773156686, "loss": 0.0046, "step": 14811 }, { "epoch": 3.02, "learning_rate": 0.00010400526580642223, "loss": 0.0009, "step": 14812 }, { "epoch": 3.02, "learning_rate": 0.00010398681464947654, "loss": 0.0043, "step": 14813 }, { "epoch": 3.02, "learning_rate": 0.00010396836426103788, "loss": 0.0037, "step": 14814 }, { "epoch": 3.02, "learning_rate": 0.0001039499146414144, "loss": 0.0141, "step": 14815 }, { "epoch": 3.02, "learning_rate": 0.00010393146579091432, "loss": 0.0052, "step": 14816 }, { "epoch": 3.02, "learning_rate": 0.00010391301770984567, "loss": 0.0018, "step": 14817 }, { "epoch": 3.02, "learning_rate": 0.00010389457039851669, "loss": 0.0072, "step": 14818 }, { "epoch": 3.02, "learning_rate": 0.00010387612385723539, "loss": 0.0052, "step": 14819 }, { "epoch": 3.02, "learning_rate": 0.00010385767808630983, "loss": 0.0126, "step": 14820 }, { "epoch": 3.02, "learning_rate": 0.00010383923308604822, "loss": 0.0092, "step": 14821 }, { "epoch": 3.02, "learning_rate": 0.00010382078885675849, "loss": 0.0146, "step": 14822 }, { "epoch": 3.02, "learning_rate": 0.0001038023453987488, "loss": 0.0083, "step": 14823 }, { "epoch": 3.02, "learning_rate": 0.00010378390271232712, "loss": 0.0084, "step": 14824 }, { "epoch": 3.02, "learning_rate": 0.00010376546079780152, "loss": 0.0033, "step": 14825 }, { "epoch": 3.02, "learning_rate": 0.00010374701965547998, "loss": 0.0237, "step": 14826 }, { "epoch": 3.02, "learning_rate": 0.00010372857928567057, "loss": 0.0005, "step": 14827 }, { "epoch": 3.02, "learning_rate": 0.00010371013968868115, "loss": 0.0032, "step": 14828 }, { "epoch": 3.02, "learning_rate": 0.00010369170086481986, "loss": 0.0047, "step": 14829 }, { "epoch": 3.02, "learning_rate": 0.0001036732628143945, "loss": 0.0017, "step": 14830 }, { "epoch": 3.02, "learning_rate": 0.00010365482553771315, "loss": 0.0061, "step": 14831 }, { "epoch": 3.02, "learning_rate": 0.00010363638903508372, "loss": 0.0086, "step": 14832 }, { "epoch": 3.02, "learning_rate": 0.00010361795330681404, "loss": 0.0011, "step": 14833 }, { "epoch": 3.02, "learning_rate": 0.00010359951835321211, "loss": 0.0012, "step": 14834 }, { "epoch": 3.02, "learning_rate": 0.00010358108417458581, "loss": 0.0023, "step": 14835 }, { "epoch": 3.02, "learning_rate": 0.00010356265077124306, "loss": 0.0063, "step": 14836 }, { "epoch": 3.02, "learning_rate": 0.00010354421814349171, "loss": 0.0067, "step": 14837 }, { "epoch": 3.02, "learning_rate": 0.00010352578629163953, "loss": 0.0033, "step": 14838 }, { "epoch": 3.02, "learning_rate": 0.00010350735521599451, "loss": 0.0078, "step": 14839 }, { "epoch": 3.02, "learning_rate": 0.00010348892491686437, "loss": 0.0043, "step": 14840 }, { "epoch": 3.02, "learning_rate": 0.00010347049539455707, "loss": 0.0034, "step": 14841 }, { "epoch": 3.02, "learning_rate": 0.00010345206664938028, "loss": 0.0026, "step": 14842 }, { "epoch": 3.02, "learning_rate": 0.0001034336386816418, "loss": 0.0009, "step": 14843 }, { "epoch": 3.02, "learning_rate": 0.00010341521149164952, "loss": 0.0141, "step": 14844 }, { "epoch": 3.02, "learning_rate": 0.00010339678507971108, "loss": 0.0077, "step": 14845 }, { "epoch": 3.02, "learning_rate": 0.0001033783594461343, "loss": 0.0026, "step": 14846 }, { "epoch": 3.02, "learning_rate": 0.000103359934591227, "loss": 0.0031, "step": 14847 }, { "epoch": 3.02, "learning_rate": 0.00010334151051529674, "loss": 0.0045, "step": 14848 }, { "epoch": 3.02, "learning_rate": 0.0001033230872186514, "loss": 0.0025, "step": 14849 }, { "epoch": 3.02, "learning_rate": 0.0001033046647015986, "loss": 0.0191, "step": 14850 }, { "epoch": 3.02, "learning_rate": 0.00010328624296444601, "loss": 0.005, "step": 14851 }, { "epoch": 3.02, "learning_rate": 0.00010326782200750137, "loss": 0.0018, "step": 14852 }, { "epoch": 3.02, "learning_rate": 0.00010324940183107227, "loss": 0.002, "step": 14853 }, { "epoch": 3.02, "learning_rate": 0.00010323098243546646, "loss": 0.0075, "step": 14854 }, { "epoch": 3.02, "learning_rate": 0.00010321256382099152, "loss": 0.0036, "step": 14855 }, { "epoch": 3.02, "learning_rate": 0.00010319414598795507, "loss": 0.0008, "step": 14856 }, { "epoch": 3.03, "learning_rate": 0.00010317572893666472, "loss": 0.0024, "step": 14857 }, { "epoch": 3.03, "learning_rate": 0.00010315731266742806, "loss": 0.0029, "step": 14858 }, { "epoch": 3.03, "learning_rate": 0.00010313889718055277, "loss": 0.0108, "step": 14859 }, { "epoch": 3.03, "learning_rate": 0.00010312048247634634, "loss": 0.0061, "step": 14860 }, { "epoch": 3.03, "learning_rate": 0.00010310206855511629, "loss": 0.0065, "step": 14861 }, { "epoch": 3.03, "learning_rate": 0.00010308365541717029, "loss": 0.0037, "step": 14862 }, { "epoch": 3.03, "learning_rate": 0.00010306524306281574, "loss": 0.0001, "step": 14863 }, { "epoch": 3.03, "learning_rate": 0.00010304683149236026, "loss": 0.0113, "step": 14864 }, { "epoch": 3.03, "learning_rate": 0.00010302842070611134, "loss": 0.0023, "step": 14865 }, { "epoch": 3.03, "learning_rate": 0.00010301001070437642, "loss": 0.0004, "step": 14866 }, { "epoch": 3.03, "learning_rate": 0.00010299160148746304, "loss": 0.0004, "step": 14867 }, { "epoch": 3.03, "learning_rate": 0.00010297319305567864, "loss": 0.0037, "step": 14868 }, { "epoch": 3.03, "learning_rate": 0.0001029547854093307, "loss": 0.0006, "step": 14869 }, { "epoch": 3.03, "learning_rate": 0.00010293637854872669, "loss": 0.0114, "step": 14870 }, { "epoch": 3.03, "learning_rate": 0.00010291797247417392, "loss": 0.0033, "step": 14871 }, { "epoch": 3.03, "learning_rate": 0.00010289956718597992, "loss": 0.0006, "step": 14872 }, { "epoch": 3.03, "learning_rate": 0.00010288116268445203, "loss": 0.0025, "step": 14873 }, { "epoch": 3.03, "learning_rate": 0.00010286275896989773, "loss": 0.0159, "step": 14874 }, { "epoch": 3.03, "learning_rate": 0.00010284435604262426, "loss": 0.0008, "step": 14875 }, { "epoch": 3.03, "learning_rate": 0.00010282595390293909, "loss": 0.0006, "step": 14876 }, { "epoch": 3.03, "learning_rate": 0.00010280755255114954, "loss": 0.0061, "step": 14877 }, { "epoch": 3.03, "learning_rate": 0.00010278915198756298, "loss": 0.0028, "step": 14878 }, { "epoch": 3.03, "learning_rate": 0.00010277075221248661, "loss": 0.0045, "step": 14879 }, { "epoch": 3.03, "learning_rate": 0.00010275235322622791, "loss": 0.0014, "step": 14880 }, { "epoch": 3.03, "learning_rate": 0.00010273395502909402, "loss": 0.0028, "step": 14881 }, { "epoch": 3.03, "learning_rate": 0.0001027155576213924, "loss": 0.0009, "step": 14882 }, { "epoch": 3.03, "learning_rate": 0.00010269716100343018, "loss": 0.0072, "step": 14883 }, { "epoch": 3.03, "learning_rate": 0.0001026787651755146, "loss": 0.0021, "step": 14884 }, { "epoch": 3.03, "learning_rate": 0.00010266037013795307, "loss": 0.0029, "step": 14885 }, { "epoch": 3.03, "learning_rate": 0.00010264197589105262, "loss": 0.0007, "step": 14886 }, { "epoch": 3.03, "learning_rate": 0.00010262358243512064, "loss": 0.0028, "step": 14887 }, { "epoch": 3.03, "learning_rate": 0.00010260518977046426, "loss": 0.011, "step": 14888 }, { "epoch": 3.03, "learning_rate": 0.00010258679789739061, "loss": 0.01, "step": 14889 }, { "epoch": 3.03, "learning_rate": 0.000102568406816207, "loss": 0.0017, "step": 14890 }, { "epoch": 3.03, "learning_rate": 0.00010255001652722048, "loss": 0.0059, "step": 14891 }, { "epoch": 3.03, "learning_rate": 0.0001025316270307383, "loss": 0.0225, "step": 14892 }, { "epoch": 3.03, "learning_rate": 0.00010251323832706755, "loss": 0.0061, "step": 14893 }, { "epoch": 3.03, "learning_rate": 0.0001024948504165153, "loss": 0.0049, "step": 14894 }, { "epoch": 3.03, "learning_rate": 0.00010247646329938879, "loss": 0.0104, "step": 14895 }, { "epoch": 3.03, "learning_rate": 0.000102458076975995, "loss": 0.0017, "step": 14896 }, { "epoch": 3.03, "learning_rate": 0.0001024396914466411, "loss": 0.0042, "step": 14897 }, { "epoch": 3.03, "learning_rate": 0.0001024213067116341, "loss": 0.006, "step": 14898 }, { "epoch": 3.03, "learning_rate": 0.00010240292277128107, "loss": 0.0058, "step": 14899 }, { "epoch": 3.03, "learning_rate": 0.00010238453962588914, "loss": 0.0054, "step": 14900 }, { "epoch": 3.03, "learning_rate": 0.00010236615727576528, "loss": 0.0058, "step": 14901 }, { "epoch": 3.03, "learning_rate": 0.00010234777572121643, "loss": 0.0045, "step": 14902 }, { "epoch": 3.03, "learning_rate": 0.00010232939496254976, "loss": 0.0005, "step": 14903 }, { "epoch": 3.03, "learning_rate": 0.00010231101500007211, "loss": 0.0003, "step": 14904 }, { "epoch": 3.03, "learning_rate": 0.00010229263583409058, "loss": 0.0051, "step": 14905 }, { "epoch": 3.04, "learning_rate": 0.00010227425746491205, "loss": 0.0003, "step": 14906 }, { "epoch": 3.04, "learning_rate": 0.00010225587989284353, "loss": 0.0019, "step": 14907 }, { "epoch": 3.04, "learning_rate": 0.00010223750311819191, "loss": 0.0074, "step": 14908 }, { "epoch": 3.04, "learning_rate": 0.00010221912714126417, "loss": 0.0076, "step": 14909 }, { "epoch": 3.04, "learning_rate": 0.0001022007519623672, "loss": 0.0003, "step": 14910 }, { "epoch": 3.04, "learning_rate": 0.00010218237758180793, "loss": 0.0061, "step": 14911 }, { "epoch": 3.04, "learning_rate": 0.00010216400399989314, "loss": 0.0035, "step": 14912 }, { "epoch": 3.04, "learning_rate": 0.00010214563121692986, "loss": 0.0049, "step": 14913 }, { "epoch": 3.04, "learning_rate": 0.0001021272592332248, "loss": 0.0064, "step": 14914 }, { "epoch": 3.04, "learning_rate": 0.00010210888804908493, "loss": 0.0002, "step": 14915 }, { "epoch": 3.04, "learning_rate": 0.00010209051766481705, "loss": 0.0155, "step": 14916 }, { "epoch": 3.04, "learning_rate": 0.00010207214808072786, "loss": 0.0061, "step": 14917 }, { "epoch": 3.04, "learning_rate": 0.00010205377929712434, "loss": 0.0063, "step": 14918 }, { "epoch": 3.04, "learning_rate": 0.0001020354113143132, "loss": 0.0131, "step": 14919 }, { "epoch": 3.04, "learning_rate": 0.00010201704413260123, "loss": 0.0063, "step": 14920 }, { "epoch": 3.04, "learning_rate": 0.00010199867775229523, "loss": 0.0007, "step": 14921 }, { "epoch": 3.04, "learning_rate": 0.00010198031217370184, "loss": 0.001, "step": 14922 }, { "epoch": 3.04, "learning_rate": 0.00010196194739712797, "loss": 0.0067, "step": 14923 }, { "epoch": 3.04, "learning_rate": 0.00010194358342288025, "loss": 0.0005, "step": 14924 }, { "epoch": 3.04, "learning_rate": 0.00010192522025126532, "loss": 0.0117, "step": 14925 }, { "epoch": 3.04, "learning_rate": 0.00010190685788259004, "loss": 0.0035, "step": 14926 }, { "epoch": 3.04, "learning_rate": 0.00010188849631716094, "loss": 0.0042, "step": 14927 }, { "epoch": 3.04, "learning_rate": 0.0001018701355552848, "loss": 0.0062, "step": 14928 }, { "epoch": 3.04, "learning_rate": 0.00010185177559726828, "loss": 0.0184, "step": 14929 }, { "epoch": 3.04, "learning_rate": 0.00010183341644341794, "loss": 0.0034, "step": 14930 }, { "epoch": 3.04, "learning_rate": 0.00010181505809404051, "loss": 0.002, "step": 14931 }, { "epoch": 3.04, "learning_rate": 0.00010179670054944254, "loss": 0.0039, "step": 14932 }, { "epoch": 3.04, "learning_rate": 0.00010177834380993068, "loss": 0.0044, "step": 14933 }, { "epoch": 3.04, "learning_rate": 0.00010175998787581152, "loss": 0.0078, "step": 14934 }, { "epoch": 3.04, "learning_rate": 0.00010174163274739157, "loss": 0.0177, "step": 14935 }, { "epoch": 3.04, "learning_rate": 0.0001017232784249775, "loss": 0.0144, "step": 14936 }, { "epoch": 3.04, "learning_rate": 0.00010170492490887577, "loss": 0.0011, "step": 14937 }, { "epoch": 3.04, "learning_rate": 0.00010168657219939299, "loss": 0.0047, "step": 14938 }, { "epoch": 3.04, "learning_rate": 0.00010166822029683563, "loss": 0.0069, "step": 14939 }, { "epoch": 3.04, "learning_rate": 0.00010164986920151018, "loss": 0.0013, "step": 14940 }, { "epoch": 3.04, "learning_rate": 0.00010163151891372327, "loss": 0.0039, "step": 14941 }, { "epoch": 3.04, "learning_rate": 0.00010161316943378122, "loss": 0.0086, "step": 14942 }, { "epoch": 3.04, "learning_rate": 0.00010159482076199064, "loss": 0.0046, "step": 14943 }, { "epoch": 3.04, "learning_rate": 0.00010157647289865794, "loss": 0.0069, "step": 14944 }, { "epoch": 3.04, "learning_rate": 0.00010155812584408945, "loss": 0.0002, "step": 14945 }, { "epoch": 3.04, "learning_rate": 0.00010153977959859177, "loss": 0.0018, "step": 14946 }, { "epoch": 3.04, "learning_rate": 0.00010152143416247121, "loss": 0.0064, "step": 14947 }, { "epoch": 3.04, "learning_rate": 0.00010150308953603426, "loss": 0.0022, "step": 14948 }, { "epoch": 3.04, "learning_rate": 0.00010148474571958722, "loss": 0.0039, "step": 14949 }, { "epoch": 3.04, "learning_rate": 0.00010146640271343651, "loss": 0.0063, "step": 14950 }, { "epoch": 3.04, "learning_rate": 0.00010144806051788849, "loss": 0.0032, "step": 14951 }, { "epoch": 3.04, "learning_rate": 0.00010142971913324954, "loss": 0.0061, "step": 14952 }, { "epoch": 3.04, "learning_rate": 0.00010141137855982591, "loss": 0.0026, "step": 14953 }, { "epoch": 3.04, "learning_rate": 0.000101393038797924, "loss": 0.0016, "step": 14954 }, { "epoch": 3.05, "learning_rate": 0.00010137469984785008, "loss": 0.0047, "step": 14955 }, { "epoch": 3.05, "learning_rate": 0.00010135636170991049, "loss": 0.0062, "step": 14956 }, { "epoch": 3.05, "learning_rate": 0.0001013380243844115, "loss": 0.0058, "step": 14957 }, { "epoch": 3.05, "learning_rate": 0.00010131968787165929, "loss": 0.0024, "step": 14958 }, { "epoch": 3.05, "learning_rate": 0.0001013013521719602, "loss": 0.0068, "step": 14959 }, { "epoch": 3.05, "learning_rate": 0.00010128301728562048, "loss": 0.0042, "step": 14960 }, { "epoch": 3.05, "learning_rate": 0.00010126468321294631, "loss": 0.0137, "step": 14961 }, { "epoch": 3.05, "learning_rate": 0.00010124634995424395, "loss": 0.0016, "step": 14962 }, { "epoch": 3.05, "learning_rate": 0.00010122801750981955, "loss": 0.0056, "step": 14963 }, { "epoch": 3.05, "learning_rate": 0.00010120968587997934, "loss": 0.0029, "step": 14964 }, { "epoch": 3.05, "learning_rate": 0.00010119135506502944, "loss": 0.0043, "step": 14965 }, { "epoch": 3.05, "learning_rate": 0.00010117302506527608, "loss": 0.0017, "step": 14966 }, { "epoch": 3.05, "learning_rate": 0.00010115469588102541, "loss": 0.0047, "step": 14967 }, { "epoch": 3.05, "learning_rate": 0.00010113636751258341, "loss": 0.0195, "step": 14968 }, { "epoch": 3.05, "learning_rate": 0.00010111803996025641, "loss": 0.003, "step": 14969 }, { "epoch": 3.05, "learning_rate": 0.00010109971322435032, "loss": 0.0071, "step": 14970 }, { "epoch": 3.05, "learning_rate": 0.00010108138730517139, "loss": 0.0094, "step": 14971 }, { "epoch": 3.05, "learning_rate": 0.00010106306220302564, "loss": 0.004, "step": 14972 }, { "epoch": 3.05, "learning_rate": 0.00010104473791821907, "loss": 0.004, "step": 14973 }, { "epoch": 3.05, "learning_rate": 0.00010102641445105786, "loss": 0.0042, "step": 14974 }, { "epoch": 3.05, "learning_rate": 0.00010100809180184795, "loss": 0.0022, "step": 14975 }, { "epoch": 3.05, "learning_rate": 0.00010098976997089533, "loss": 0.0091, "step": 14976 }, { "epoch": 3.05, "learning_rate": 0.00010097144895850613, "loss": 0.0018, "step": 14977 }, { "epoch": 3.05, "learning_rate": 0.00010095312876498623, "loss": 0.0059, "step": 14978 }, { "epoch": 3.05, "learning_rate": 0.0001009348093906417, "loss": 0.0089, "step": 14979 }, { "epoch": 3.05, "learning_rate": 0.00010091649083577847, "loss": 0.0003, "step": 14980 }, { "epoch": 3.05, "learning_rate": 0.00010089817310070244, "loss": 0.014, "step": 14981 }, { "epoch": 3.05, "learning_rate": 0.00010087985618571969, "loss": 0.0151, "step": 14982 }, { "epoch": 3.05, "learning_rate": 0.00010086154009113598, "loss": 0.0098, "step": 14983 }, { "epoch": 3.05, "learning_rate": 0.00010084322481725738, "loss": 0.003, "step": 14984 }, { "epoch": 3.05, "learning_rate": 0.00010082491036438972, "loss": 0.001, "step": 14985 }, { "epoch": 3.05, "learning_rate": 0.0001008065967328388, "loss": 0.0056, "step": 14986 }, { "epoch": 3.05, "learning_rate": 0.00010078828392291064, "loss": 0.0058, "step": 14987 }, { "epoch": 3.05, "learning_rate": 0.00010076997193491097, "loss": 0.0105, "step": 14988 }, { "epoch": 3.05, "learning_rate": 0.00010075166076914576, "loss": 0.0051, "step": 14989 }, { "epoch": 3.05, "learning_rate": 0.00010073335042592076, "loss": 0.0025, "step": 14990 }, { "epoch": 3.05, "learning_rate": 0.00010071504090554177, "loss": 0.0096, "step": 14991 }, { "epoch": 3.05, "learning_rate": 0.00010069673220831468, "loss": 0.0024, "step": 14992 }, { "epoch": 3.05, "learning_rate": 0.00010067842433454516, "loss": 0.0081, "step": 14993 }, { "epoch": 3.05, "learning_rate": 0.00010066011728453914, "loss": 0.0081, "step": 14994 }, { "epoch": 3.05, "learning_rate": 0.00010064181105860228, "loss": 0.0071, "step": 14995 }, { "epoch": 3.05, "learning_rate": 0.00010062350565704029, "loss": 0.0176, "step": 14996 }, { "epoch": 3.05, "learning_rate": 0.00010060520108015902, "loss": 0.0028, "step": 14997 }, { "epoch": 3.05, "learning_rate": 0.00010058689732826413, "loss": 0.0069, "step": 14998 }, { "epoch": 3.05, "learning_rate": 0.00010056859440166126, "loss": 0.0054, "step": 14999 }, { "epoch": 3.05, "learning_rate": 0.00010055029230065622, "loss": 0.02, "step": 15000 }, { "epoch": 3.05, "learning_rate": 0.00010053199102555463, "loss": 0.0066, "step": 15001 }, { "epoch": 3.05, "learning_rate": 0.00010051369057666218, "loss": 0.0036, "step": 15002 }, { "epoch": 3.05, "learning_rate": 0.00010049539095428452, "loss": 0.0028, "step": 15003 }, { "epoch": 3.06, "learning_rate": 0.00010047709215872724, "loss": 0.0035, "step": 15004 }, { "epoch": 3.06, "learning_rate": 0.00010045879419029605, "loss": 0.0061, "step": 15005 }, { "epoch": 3.06, "learning_rate": 0.00010044049704929644, "loss": 0.0039, "step": 15006 }, { "epoch": 3.06, "learning_rate": 0.00010042220073603417, "loss": 0.0008, "step": 15007 }, { "epoch": 3.06, "learning_rate": 0.00010040390525081472, "loss": 0.0055, "step": 15008 }, { "epoch": 3.06, "learning_rate": 0.0001003856105939436, "loss": 0.0049, "step": 15009 }, { "epoch": 3.06, "learning_rate": 0.00010036731676572649, "loss": 0.005, "step": 15010 }, { "epoch": 3.06, "learning_rate": 0.00010034902376646884, "loss": 0.0127, "step": 15011 }, { "epoch": 3.06, "learning_rate": 0.00010033073159647623, "loss": 0.0026, "step": 15012 }, { "epoch": 3.06, "learning_rate": 0.0001003124402560542, "loss": 0.0062, "step": 15013 }, { "epoch": 3.06, "learning_rate": 0.00010029414974550816, "loss": 0.0005, "step": 15014 }, { "epoch": 3.06, "learning_rate": 0.00010027586006514368, "loss": 0.0093, "step": 15015 }, { "epoch": 3.06, "learning_rate": 0.00010025757121526614, "loss": 0.0035, "step": 15016 }, { "epoch": 3.06, "learning_rate": 0.00010023928319618115, "loss": 0.0061, "step": 15017 }, { "epoch": 3.06, "learning_rate": 0.00010022099600819404, "loss": 0.001, "step": 15018 }, { "epoch": 3.06, "learning_rate": 0.00010020270965161018, "loss": 0.0103, "step": 15019 }, { "epoch": 3.06, "learning_rate": 0.00010018442412673514, "loss": 0.0012, "step": 15020 }, { "epoch": 3.06, "learning_rate": 0.0001001661394338742, "loss": 0.005, "step": 15021 }, { "epoch": 3.06, "learning_rate": 0.00010014785557333286, "loss": 0.0096, "step": 15022 }, { "epoch": 3.06, "learning_rate": 0.00010012957254541641, "loss": 0.0056, "step": 15023 }, { "epoch": 3.06, "learning_rate": 0.0001001112903504302, "loss": 0.0088, "step": 15024 }, { "epoch": 3.06, "learning_rate": 0.00010009300898867967, "loss": 0.0043, "step": 15025 }, { "epoch": 3.06, "learning_rate": 0.0001000747284604701, "loss": 0.0005, "step": 15026 }, { "epoch": 3.06, "learning_rate": 0.00010005644876610673, "loss": 0.0038, "step": 15027 }, { "epoch": 3.06, "learning_rate": 0.00010003816990589501, "loss": 0.0117, "step": 15028 }, { "epoch": 3.06, "learning_rate": 0.0001000198918801401, "loss": 0.0019, "step": 15029 }, { "epoch": 3.06, "learning_rate": 0.00010000161468914741, "loss": 0.001, "step": 15030 }, { "epoch": 3.06, "learning_rate": 9.99833383332221e-05, "loss": 0.0035, "step": 15031 }, { "epoch": 3.06, "learning_rate": 9.996506281266944e-05, "loss": 0.0088, "step": 15032 }, { "epoch": 3.06, "learning_rate": 9.99467881277947e-05, "loss": 0.0088, "step": 15033 }, { "epoch": 3.06, "learning_rate": 9.992851427890303e-05, "loss": 0.0023, "step": 15034 }, { "epoch": 3.06, "learning_rate": 9.991024126629976e-05, "loss": 0.0037, "step": 15035 }, { "epoch": 3.06, "learning_rate": 9.989196909029e-05, "loss": 0.0024, "step": 15036 }, { "epoch": 3.06, "learning_rate": 9.987369775117891e-05, "loss": 0.0037, "step": 15037 }, { "epoch": 3.06, "learning_rate": 9.985542724927171e-05, "loss": 0.0021, "step": 15038 }, { "epoch": 3.06, "learning_rate": 9.983715758487348e-05, "loss": 0.0018, "step": 15039 }, { "epoch": 3.06, "learning_rate": 9.981888875828948e-05, "loss": 0.0159, "step": 15040 }, { "epoch": 3.06, "learning_rate": 9.980062076982477e-05, "loss": 0.0039, "step": 15041 }, { "epoch": 3.06, "learning_rate": 9.978235361978438e-05, "loss": 0.0044, "step": 15042 }, { "epoch": 3.06, "learning_rate": 9.976408730847351e-05, "loss": 0.0037, "step": 15043 }, { "epoch": 3.06, "learning_rate": 9.974582183619719e-05, "loss": 0.0004, "step": 15044 }, { "epoch": 3.06, "learning_rate": 9.972755720326052e-05, "loss": 0.0052, "step": 15045 }, { "epoch": 3.06, "learning_rate": 9.970929340996858e-05, "loss": 0.0059, "step": 15046 }, { "epoch": 3.06, "learning_rate": 9.96910304566263e-05, "loss": 0.0044, "step": 15047 }, { "epoch": 3.06, "learning_rate": 9.967276834353885e-05, "loss": 0.007, "step": 15048 }, { "epoch": 3.06, "learning_rate": 9.965450707101115e-05, "loss": 0.0039, "step": 15049 }, { "epoch": 3.06, "learning_rate": 9.963624663934817e-05, "loss": 0.0078, "step": 15050 }, { "epoch": 3.06, "learning_rate": 9.961798704885497e-05, "loss": 0.006, "step": 15051 }, { "epoch": 3.06, "learning_rate": 9.959972829983645e-05, "loss": 0.0084, "step": 15052 }, { "epoch": 3.07, "learning_rate": 9.958147039259763e-05, "loss": 0.0061, "step": 15053 }, { "epoch": 3.07, "learning_rate": 9.956321332744347e-05, "loss": 0.0047, "step": 15054 }, { "epoch": 3.07, "learning_rate": 9.954495710467879e-05, "loss": 0.0006, "step": 15055 }, { "epoch": 3.07, "learning_rate": 9.952670172460862e-05, "loss": 0.0004, "step": 15056 }, { "epoch": 3.07, "learning_rate": 9.950844718753774e-05, "loss": 0.0028, "step": 15057 }, { "epoch": 3.07, "learning_rate": 9.949019349377116e-05, "loss": 0.0012, "step": 15058 }, { "epoch": 3.07, "learning_rate": 9.947194064361372e-05, "loss": 0.0005, "step": 15059 }, { "epoch": 3.07, "learning_rate": 9.945368863737018e-05, "loss": 0.0047, "step": 15060 }, { "epoch": 3.07, "learning_rate": 9.94354374753455e-05, "loss": 0.001, "step": 15061 }, { "epoch": 3.07, "learning_rate": 9.94171871578444e-05, "loss": 0.0074, "step": 15062 }, { "epoch": 3.07, "learning_rate": 9.939893768517183e-05, "loss": 0.0026, "step": 15063 }, { "epoch": 3.07, "learning_rate": 9.938068905763247e-05, "loss": 0.0186, "step": 15064 }, { "epoch": 3.07, "learning_rate": 9.936244127553113e-05, "loss": 0.0067, "step": 15065 }, { "epoch": 3.07, "learning_rate": 9.934419433917267e-05, "loss": 0.002, "step": 15066 }, { "epoch": 3.07, "learning_rate": 9.932594824886173e-05, "loss": 0.0009, "step": 15067 }, { "epoch": 3.07, "learning_rate": 9.930770300490315e-05, "loss": 0.0078, "step": 15068 }, { "epoch": 3.07, "learning_rate": 9.928945860760163e-05, "loss": 0.0073, "step": 15069 }, { "epoch": 3.07, "learning_rate": 9.927121505726183e-05, "loss": 0.0076, "step": 15070 }, { "epoch": 3.07, "learning_rate": 9.925297235418853e-05, "loss": 0.0065, "step": 15071 }, { "epoch": 3.07, "learning_rate": 9.923473049868635e-05, "loss": 0.0034, "step": 15072 }, { "epoch": 3.07, "learning_rate": 9.921648949106001e-05, "loss": 0.0066, "step": 15073 }, { "epoch": 3.07, "learning_rate": 9.919824933161416e-05, "loss": 0.003, "step": 15074 }, { "epoch": 3.07, "learning_rate": 9.918001002065345e-05, "loss": 0.0044, "step": 15075 }, { "epoch": 3.07, "learning_rate": 9.916177155848249e-05, "loss": 0.006, "step": 15076 }, { "epoch": 3.07, "learning_rate": 9.914353394540594e-05, "loss": 0.0125, "step": 15077 }, { "epoch": 3.07, "learning_rate": 9.91252971817283e-05, "loss": 0.0117, "step": 15078 }, { "epoch": 3.07, "learning_rate": 9.910706126775432e-05, "loss": 0.0055, "step": 15079 }, { "epoch": 3.07, "learning_rate": 9.908882620378839e-05, "loss": 0.002, "step": 15080 }, { "epoch": 3.07, "learning_rate": 9.907059199013526e-05, "loss": 0.005, "step": 15081 }, { "epoch": 3.07, "learning_rate": 9.905235862709934e-05, "loss": 0.0024, "step": 15082 }, { "epoch": 3.07, "learning_rate": 9.903412611498516e-05, "loss": 0.0058, "step": 15083 }, { "epoch": 3.07, "learning_rate": 9.90158944540973e-05, "loss": 0.0062, "step": 15084 }, { "epoch": 3.07, "learning_rate": 9.899766364474025e-05, "loss": 0.0037, "step": 15085 }, { "epoch": 3.07, "learning_rate": 9.897943368721849e-05, "loss": 0.0148, "step": 15086 }, { "epoch": 3.07, "learning_rate": 9.896120458183653e-05, "loss": 0.0013, "step": 15087 }, { "epoch": 3.07, "learning_rate": 9.894297632889872e-05, "loss": 0.014, "step": 15088 }, { "epoch": 3.07, "learning_rate": 9.892474892870966e-05, "loss": 0.0061, "step": 15089 }, { "epoch": 3.07, "learning_rate": 9.890652238157364e-05, "loss": 0.0022, "step": 15090 }, { "epoch": 3.07, "learning_rate": 9.888829668779521e-05, "loss": 0.0048, "step": 15091 }, { "epoch": 3.07, "learning_rate": 9.88700718476787e-05, "loss": 0.004, "step": 15092 }, { "epoch": 3.07, "learning_rate": 9.885184786152844e-05, "loss": 0.0142, "step": 15093 }, { "epoch": 3.07, "learning_rate": 9.883362472964893e-05, "loss": 0.0111, "step": 15094 }, { "epoch": 3.07, "learning_rate": 9.881540245234442e-05, "loss": 0.0046, "step": 15095 }, { "epoch": 3.07, "learning_rate": 9.879718102991932e-05, "loss": 0.0056, "step": 15096 }, { "epoch": 3.07, "learning_rate": 9.877896046267799e-05, "loss": 0.0098, "step": 15097 }, { "epoch": 3.07, "learning_rate": 9.876074075092464e-05, "loss": 0.0043, "step": 15098 }, { "epoch": 3.07, "learning_rate": 9.87425218949637e-05, "loss": 0.0036, "step": 15099 }, { "epoch": 3.07, "learning_rate": 9.87243038950994e-05, "loss": 0.0089, "step": 15100 }, { "epoch": 3.07, "learning_rate": 9.870608675163596e-05, "loss": 0.0086, "step": 15101 }, { "epoch": 3.08, "learning_rate": 9.868787046487778e-05, "loss": 0.0089, "step": 15102 }, { "epoch": 3.08, "learning_rate": 9.866965503512891e-05, "loss": 0.0086, "step": 15103 }, { "epoch": 3.08, "learning_rate": 9.865144046269377e-05, "loss": 0.0083, "step": 15104 }, { "epoch": 3.08, "learning_rate": 9.86332267478765e-05, "loss": 0.007, "step": 15105 }, { "epoch": 3.08, "learning_rate": 9.861501389098125e-05, "loss": 0.0126, "step": 15106 }, { "epoch": 3.08, "learning_rate": 9.859680189231233e-05, "loss": 0.0116, "step": 15107 }, { "epoch": 3.08, "learning_rate": 9.857859075217379e-05, "loss": 0.0023, "step": 15108 }, { "epoch": 3.08, "learning_rate": 9.85603804708699e-05, "loss": 0.003, "step": 15109 }, { "epoch": 3.08, "learning_rate": 9.854217104870477e-05, "loss": 0.0113, "step": 15110 }, { "epoch": 3.08, "learning_rate": 9.852396248598247e-05, "loss": 0.0095, "step": 15111 }, { "epoch": 3.08, "learning_rate": 9.850575478300719e-05, "loss": 0.0214, "step": 15112 }, { "epoch": 3.08, "learning_rate": 9.848754794008295e-05, "loss": 0.0071, "step": 15113 }, { "epoch": 3.08, "learning_rate": 9.846934195751396e-05, "loss": 0.0009, "step": 15114 }, { "epoch": 3.08, "learning_rate": 9.845113683560423e-05, "loss": 0.0086, "step": 15115 }, { "epoch": 3.08, "learning_rate": 9.843293257465779e-05, "loss": 0.0017, "step": 15116 }, { "epoch": 3.08, "learning_rate": 9.841472917497874e-05, "loss": 0.0044, "step": 15117 }, { "epoch": 3.08, "learning_rate": 9.839652663687103e-05, "loss": 0.0073, "step": 15118 }, { "epoch": 3.08, "learning_rate": 9.83783249606388e-05, "loss": 0.0016, "step": 15119 }, { "epoch": 3.08, "learning_rate": 9.8360124146586e-05, "loss": 0.009, "step": 15120 }, { "epoch": 3.08, "learning_rate": 9.834192419501654e-05, "loss": 0.0032, "step": 15121 }, { "epoch": 3.08, "learning_rate": 9.83237251062345e-05, "loss": 0.0021, "step": 15122 }, { "epoch": 3.08, "learning_rate": 9.830552688054382e-05, "loss": 0.0158, "step": 15123 }, { "epoch": 3.08, "learning_rate": 9.828732951824836e-05, "loss": 0.0068, "step": 15124 }, { "epoch": 3.08, "learning_rate": 9.826913301965211e-05, "loss": 0.0064, "step": 15125 }, { "epoch": 3.08, "learning_rate": 9.825093738505902e-05, "loss": 0.0135, "step": 15126 }, { "epoch": 3.08, "learning_rate": 9.823274261477296e-05, "loss": 0.0033, "step": 15127 }, { "epoch": 3.08, "learning_rate": 9.821454870909782e-05, "loss": 0.0008, "step": 15128 }, { "epoch": 3.08, "learning_rate": 9.819635566833743e-05, "loss": 0.0057, "step": 15129 }, { "epoch": 3.08, "learning_rate": 9.817816349279573e-05, "loss": 0.0076, "step": 15130 }, { "epoch": 3.08, "learning_rate": 9.815997218277648e-05, "loss": 0.0022, "step": 15131 }, { "epoch": 3.08, "learning_rate": 9.81417817385836e-05, "loss": 0.0017, "step": 15132 }, { "epoch": 3.08, "learning_rate": 9.812359216052085e-05, "loss": 0.0005, "step": 15133 }, { "epoch": 3.08, "learning_rate": 9.810540344889197e-05, "loss": 0.0004, "step": 15134 }, { "epoch": 3.08, "learning_rate": 9.808721560400088e-05, "loss": 0.0011, "step": 15135 }, { "epoch": 3.08, "learning_rate": 9.806902862615123e-05, "loss": 0.0052, "step": 15136 }, { "epoch": 3.08, "learning_rate": 9.805084251564683e-05, "loss": 0.0112, "step": 15137 }, { "epoch": 3.08, "learning_rate": 9.803265727279149e-05, "loss": 0.0032, "step": 15138 }, { "epoch": 3.08, "learning_rate": 9.801447289788878e-05, "loss": 0.0016, "step": 15139 }, { "epoch": 3.08, "learning_rate": 9.799628939124257e-05, "loss": 0.0012, "step": 15140 }, { "epoch": 3.08, "learning_rate": 9.797810675315642e-05, "loss": 0.0038, "step": 15141 }, { "epoch": 3.08, "learning_rate": 9.795992498393416e-05, "loss": 0.0031, "step": 15142 }, { "epoch": 3.08, "learning_rate": 9.79417440838794e-05, "loss": 0.0033, "step": 15143 }, { "epoch": 3.08, "learning_rate": 9.79235640532957e-05, "loss": 0.0022, "step": 15144 }, { "epoch": 3.08, "learning_rate": 9.790538489248685e-05, "loss": 0.0033, "step": 15145 }, { "epoch": 3.08, "learning_rate": 9.788720660175637e-05, "loss": 0.0055, "step": 15146 }, { "epoch": 3.08, "learning_rate": 9.786902918140792e-05, "loss": 0.0025, "step": 15147 }, { "epoch": 3.08, "learning_rate": 9.785085263174508e-05, "loss": 0.0065, "step": 15148 }, { "epoch": 3.08, "learning_rate": 9.78326769530714e-05, "loss": 0.0003, "step": 15149 }, { "epoch": 3.08, "learning_rate": 9.781450214569057e-05, "loss": 0.0052, "step": 15150 }, { "epoch": 3.09, "learning_rate": 9.779632820990604e-05, "loss": 0.0004, "step": 15151 }, { "epoch": 3.09, "learning_rate": 9.777815514602131e-05, "loss": 0.0051, "step": 15152 }, { "epoch": 3.09, "learning_rate": 9.775998295434003e-05, "loss": 0.0085, "step": 15153 }, { "epoch": 3.09, "learning_rate": 9.77418116351656e-05, "loss": 0.0016, "step": 15154 }, { "epoch": 3.09, "learning_rate": 9.772364118880161e-05, "loss": 0.0026, "step": 15155 }, { "epoch": 3.09, "learning_rate": 9.770547161555146e-05, "loss": 0.0024, "step": 15156 }, { "epoch": 3.09, "learning_rate": 9.768730291571865e-05, "loss": 0.0049, "step": 15157 }, { "epoch": 3.09, "learning_rate": 9.766913508960662e-05, "loss": 0.0099, "step": 15158 }, { "epoch": 3.09, "learning_rate": 9.765096813751878e-05, "loss": 0.0048, "step": 15159 }, { "epoch": 3.09, "learning_rate": 9.763280205975866e-05, "loss": 0.012, "step": 15160 }, { "epoch": 3.09, "learning_rate": 9.76146368566296e-05, "loss": 0.0063, "step": 15161 }, { "epoch": 3.09, "learning_rate": 9.759647252843492e-05, "loss": 0.0035, "step": 15162 }, { "epoch": 3.09, "learning_rate": 9.757830907547814e-05, "loss": 0.003, "step": 15163 }, { "epoch": 3.09, "learning_rate": 9.756014649806247e-05, "loss": 0.0122, "step": 15164 }, { "epoch": 3.09, "learning_rate": 9.75419847964914e-05, "loss": 0.0019, "step": 15165 }, { "epoch": 3.09, "learning_rate": 9.752382397106821e-05, "loss": 0.0032, "step": 15166 }, { "epoch": 3.09, "learning_rate": 9.750566402209619e-05, "loss": 0.0028, "step": 15167 }, { "epoch": 3.09, "learning_rate": 9.748750494987867e-05, "loss": 0.0072, "step": 15168 }, { "epoch": 3.09, "learning_rate": 9.746934675471894e-05, "loss": 0.0063, "step": 15169 }, { "epoch": 3.09, "learning_rate": 9.745118943692028e-05, "loss": 0.0144, "step": 15170 }, { "epoch": 3.09, "learning_rate": 9.743303299678598e-05, "loss": 0.0115, "step": 15171 }, { "epoch": 3.09, "learning_rate": 9.741487743461921e-05, "loss": 0.0146, "step": 15172 }, { "epoch": 3.09, "learning_rate": 9.73967227507233e-05, "loss": 0.0064, "step": 15173 }, { "epoch": 3.09, "learning_rate": 9.73785689454014e-05, "loss": 0.0051, "step": 15174 }, { "epoch": 3.09, "learning_rate": 9.736041601895667e-05, "loss": 0.0032, "step": 15175 }, { "epoch": 3.09, "learning_rate": 9.734226397169245e-05, "loss": 0.0031, "step": 15176 }, { "epoch": 3.09, "learning_rate": 9.732411280391174e-05, "loss": 0.0078, "step": 15177 }, { "epoch": 3.09, "learning_rate": 9.73059625159178e-05, "loss": 0.0026, "step": 15178 }, { "epoch": 3.09, "learning_rate": 9.72878131080138e-05, "loss": 0.0027, "step": 15179 }, { "epoch": 3.09, "learning_rate": 9.726966458050274e-05, "loss": 0.0005, "step": 15180 }, { "epoch": 3.09, "learning_rate": 9.725151693368791e-05, "loss": 0.0061, "step": 15181 }, { "epoch": 3.09, "learning_rate": 9.723337016787222e-05, "loss": 0.002, "step": 15182 }, { "epoch": 3.09, "learning_rate": 9.721522428335893e-05, "loss": 0.0162, "step": 15183 }, { "epoch": 3.09, "learning_rate": 9.719707928045103e-05, "loss": 0.0013, "step": 15184 }, { "epoch": 3.09, "learning_rate": 9.717893515945151e-05, "loss": 0.021, "step": 15185 }, { "epoch": 3.09, "learning_rate": 9.716079192066356e-05, "loss": 0.0044, "step": 15186 }, { "epoch": 3.09, "learning_rate": 9.714264956439005e-05, "loss": 0.0002, "step": 15187 }, { "epoch": 3.09, "learning_rate": 9.712450809093414e-05, "loss": 0.0021, "step": 15188 }, { "epoch": 3.09, "learning_rate": 9.710636750059872e-05, "loss": 0.0013, "step": 15189 }, { "epoch": 3.09, "learning_rate": 9.708822779368678e-05, "loss": 0.0054, "step": 15190 }, { "epoch": 3.09, "learning_rate": 9.707008897050135e-05, "loss": 0.0047, "step": 15191 }, { "epoch": 3.09, "learning_rate": 9.705195103134531e-05, "loss": 0.0008, "step": 15192 }, { "epoch": 3.09, "learning_rate": 9.70338139765217e-05, "loss": 0.002, "step": 15193 }, { "epoch": 3.09, "learning_rate": 9.701567780633336e-05, "loss": 0.0041, "step": 15194 }, { "epoch": 3.09, "learning_rate": 9.699754252108317e-05, "loss": 0.0071, "step": 15195 }, { "epoch": 3.09, "learning_rate": 9.697940812107412e-05, "loss": 0.0026, "step": 15196 }, { "epoch": 3.09, "learning_rate": 9.6961274606609e-05, "loss": 0.0053, "step": 15197 }, { "epoch": 3.09, "learning_rate": 9.694314197799072e-05, "loss": 0.0093, "step": 15198 }, { "epoch": 3.09, "learning_rate": 9.692501023552212e-05, "loss": 0.0003, "step": 15199 }, { "epoch": 3.1, "learning_rate": 9.690687937950603e-05, "loss": 0.0069, "step": 15200 }, { "epoch": 3.1, "learning_rate": 9.68887494102453e-05, "loss": 0.0031, "step": 15201 }, { "epoch": 3.1, "learning_rate": 9.687062032804272e-05, "loss": 0.0007, "step": 15202 }, { "epoch": 3.1, "learning_rate": 9.6852492133201e-05, "loss": 0.0119, "step": 15203 }, { "epoch": 3.1, "learning_rate": 9.683436482602307e-05, "loss": 0.0004, "step": 15204 }, { "epoch": 3.1, "learning_rate": 9.681623840681152e-05, "loss": 0.0025, "step": 15205 }, { "epoch": 3.1, "learning_rate": 9.679811287586926e-05, "loss": 0.0037, "step": 15206 }, { "epoch": 3.1, "learning_rate": 9.677998823349892e-05, "loss": 0.0156, "step": 15207 }, { "epoch": 3.1, "learning_rate": 9.676186448000318e-05, "loss": 0.019, "step": 15208 }, { "epoch": 3.1, "learning_rate": 9.674374161568484e-05, "loss": 0.0008, "step": 15209 }, { "epoch": 3.1, "learning_rate": 9.672561964084653e-05, "loss": 0.0019, "step": 15210 }, { "epoch": 3.1, "learning_rate": 9.670749855579095e-05, "loss": 0.0138, "step": 15211 }, { "epoch": 3.1, "learning_rate": 9.668937836082076e-05, "loss": 0.0004, "step": 15212 }, { "epoch": 3.1, "learning_rate": 9.667125905623853e-05, "loss": 0.0044, "step": 15213 }, { "epoch": 3.1, "learning_rate": 9.6653140642347e-05, "loss": 0.0059, "step": 15214 }, { "epoch": 3.1, "learning_rate": 9.663502311944864e-05, "loss": 0.0044, "step": 15215 }, { "epoch": 3.1, "learning_rate": 9.66169064878462e-05, "loss": 0.0037, "step": 15216 }, { "epoch": 3.1, "learning_rate": 9.65987907478422e-05, "loss": 0.0036, "step": 15217 }, { "epoch": 3.1, "learning_rate": 9.658067589973912e-05, "loss": 0.0066, "step": 15218 }, { "epoch": 3.1, "learning_rate": 9.656256194383962e-05, "loss": 0.0127, "step": 15219 }, { "epoch": 3.1, "learning_rate": 9.654444888044626e-05, "loss": 0.0073, "step": 15220 }, { "epoch": 3.1, "learning_rate": 9.652633670986141e-05, "loss": 0.009, "step": 15221 }, { "epoch": 3.1, "learning_rate": 9.650822543238777e-05, "loss": 0.013, "step": 15222 }, { "epoch": 3.1, "learning_rate": 9.649011504832766e-05, "loss": 0.0033, "step": 15223 }, { "epoch": 3.1, "learning_rate": 9.647200555798371e-05, "loss": 0.0046, "step": 15224 }, { "epoch": 3.1, "learning_rate": 9.645389696165829e-05, "loss": 0.0054, "step": 15225 }, { "epoch": 3.1, "learning_rate": 9.643578925965383e-05, "loss": 0.0075, "step": 15226 }, { "epoch": 3.1, "learning_rate": 9.641768245227284e-05, "loss": 0.0113, "step": 15227 }, { "epoch": 3.1, "learning_rate": 9.639957653981763e-05, "loss": 0.004, "step": 15228 }, { "epoch": 3.1, "learning_rate": 9.638147152259075e-05, "loss": 0.0022, "step": 15229 }, { "epoch": 3.1, "learning_rate": 9.636336740089447e-05, "loss": 0.0057, "step": 15230 }, { "epoch": 3.1, "learning_rate": 9.634526417503116e-05, "loss": 0.0096, "step": 15231 }, { "epoch": 3.1, "learning_rate": 9.632716184530327e-05, "loss": 0.0018, "step": 15232 }, { "epoch": 3.1, "learning_rate": 9.630906041201307e-05, "loss": 0.0058, "step": 15233 }, { "epoch": 3.1, "learning_rate": 9.629095987546294e-05, "loss": 0.0015, "step": 15234 }, { "epoch": 3.1, "learning_rate": 9.627286023595518e-05, "loss": 0.0017, "step": 15235 }, { "epoch": 3.1, "learning_rate": 9.6254761493792e-05, "loss": 0.0003, "step": 15236 }, { "epoch": 3.1, "learning_rate": 9.623666364927582e-05, "loss": 0.0008, "step": 15237 }, { "epoch": 3.1, "learning_rate": 9.621856670270876e-05, "loss": 0.0068, "step": 15238 }, { "epoch": 3.1, "learning_rate": 9.620047065439325e-05, "loss": 0.002, "step": 15239 }, { "epoch": 3.1, "learning_rate": 9.61823755046314e-05, "loss": 0.0065, "step": 15240 }, { "epoch": 3.1, "learning_rate": 9.616428125372546e-05, "loss": 0.0033, "step": 15241 }, { "epoch": 3.1, "learning_rate": 9.614618790197764e-05, "loss": 0.0011, "step": 15242 }, { "epoch": 3.1, "learning_rate": 9.61280954496901e-05, "loss": 0.005, "step": 15243 }, { "epoch": 3.1, "learning_rate": 9.611000389716513e-05, "loss": 0.0024, "step": 15244 }, { "epoch": 3.1, "learning_rate": 9.609191324470482e-05, "loss": 0.0077, "step": 15245 }, { "epoch": 3.1, "learning_rate": 9.607382349261126e-05, "loss": 0.0033, "step": 15246 }, { "epoch": 3.1, "learning_rate": 9.605573464118668e-05, "loss": 0.0097, "step": 15247 }, { "epoch": 3.1, "learning_rate": 9.603764669073318e-05, "loss": 0.0085, "step": 15248 }, { "epoch": 3.1, "learning_rate": 9.601955964155276e-05, "loss": 0.0051, "step": 15249 }, { "epoch": 3.11, "learning_rate": 9.600147349394763e-05, "loss": 0.0007, "step": 15250 }, { "epoch": 3.11, "learning_rate": 9.598338824821983e-05, "loss": 0.0078, "step": 15251 }, { "epoch": 3.11, "learning_rate": 9.596530390467141e-05, "loss": 0.009, "step": 15252 }, { "epoch": 3.11, "learning_rate": 9.594722046360444e-05, "loss": 0.0091, "step": 15253 }, { "epoch": 3.11, "learning_rate": 9.592913792532086e-05, "loss": 0.0033, "step": 15254 }, { "epoch": 3.11, "learning_rate": 9.59110562901228e-05, "loss": 0.0056, "step": 15255 }, { "epoch": 3.11, "learning_rate": 9.589297555831213e-05, "loss": 0.0124, "step": 15256 }, { "epoch": 3.11, "learning_rate": 9.587489573019099e-05, "loss": 0.0026, "step": 15257 }, { "epoch": 3.11, "learning_rate": 9.585681680606124e-05, "loss": 0.0041, "step": 15258 }, { "epoch": 3.11, "learning_rate": 9.58387387862248e-05, "loss": 0.0055, "step": 15259 }, { "epoch": 3.11, "learning_rate": 9.58206616709837e-05, "loss": 0.004, "step": 15260 }, { "epoch": 3.11, "learning_rate": 9.580258546063978e-05, "loss": 0.0044, "step": 15261 }, { "epoch": 3.11, "learning_rate": 9.578451015549501e-05, "loss": 0.0114, "step": 15262 }, { "epoch": 3.11, "learning_rate": 9.57664357558513e-05, "loss": 0.0104, "step": 15263 }, { "epoch": 3.11, "learning_rate": 9.574836226201042e-05, "loss": 0.0043, "step": 15264 }, { "epoch": 3.11, "learning_rate": 9.573028967427435e-05, "loss": 0.0066, "step": 15265 }, { "epoch": 3.11, "learning_rate": 9.571221799294482e-05, "loss": 0.0082, "step": 15266 }, { "epoch": 3.11, "learning_rate": 9.56941472183238e-05, "loss": 0.003, "step": 15267 }, { "epoch": 3.11, "learning_rate": 9.567607735071302e-05, "loss": 0.0016, "step": 15268 }, { "epoch": 3.11, "learning_rate": 9.565800839041423e-05, "loss": 0.0002, "step": 15269 }, { "epoch": 3.11, "learning_rate": 9.563994033772936e-05, "loss": 0.0047, "step": 15270 }, { "epoch": 3.11, "learning_rate": 9.562187319296006e-05, "loss": 0.0023, "step": 15271 }, { "epoch": 3.11, "learning_rate": 9.560380695640807e-05, "loss": 0.0037, "step": 15272 }, { "epoch": 3.11, "learning_rate": 9.558574162837526e-05, "loss": 0.0103, "step": 15273 }, { "epoch": 3.11, "learning_rate": 9.556767720916322e-05, "loss": 0.0044, "step": 15274 }, { "epoch": 3.11, "learning_rate": 9.554961369907378e-05, "loss": 0.0016, "step": 15275 }, { "epoch": 3.11, "learning_rate": 9.553155109840857e-05, "loss": 0.0036, "step": 15276 }, { "epoch": 3.11, "learning_rate": 9.551348940746921e-05, "loss": 0.0108, "step": 15277 }, { "epoch": 3.11, "learning_rate": 9.549542862655751e-05, "loss": 0.0039, "step": 15278 }, { "epoch": 3.11, "learning_rate": 9.547736875597495e-05, "loss": 0.0116, "step": 15279 }, { "epoch": 3.11, "learning_rate": 9.545930979602333e-05, "loss": 0.0019, "step": 15280 }, { "epoch": 3.11, "learning_rate": 9.544125174700414e-05, "loss": 0.0035, "step": 15281 }, { "epoch": 3.11, "learning_rate": 9.542319460921904e-05, "loss": 0.0053, "step": 15282 }, { "epoch": 3.11, "learning_rate": 9.540513838296962e-05, "loss": 0.0029, "step": 15283 }, { "epoch": 3.11, "learning_rate": 9.538708306855739e-05, "loss": 0.0027, "step": 15284 }, { "epoch": 3.11, "learning_rate": 9.536902866628406e-05, "loss": 0.0019, "step": 15285 }, { "epoch": 3.11, "learning_rate": 9.535097517645104e-05, "loss": 0.0049, "step": 15286 }, { "epoch": 3.11, "learning_rate": 9.533292259935984e-05, "loss": 0.0022, "step": 15287 }, { "epoch": 3.11, "learning_rate": 9.53148709353121e-05, "loss": 0.0086, "step": 15288 }, { "epoch": 3.11, "learning_rate": 9.529682018460916e-05, "loss": 0.0124, "step": 15289 }, { "epoch": 3.11, "learning_rate": 9.527877034755265e-05, "loss": 0.0048, "step": 15290 }, { "epoch": 3.11, "learning_rate": 9.526072142444394e-05, "loss": 0.0088, "step": 15291 }, { "epoch": 3.11, "learning_rate": 9.524267341558452e-05, "loss": 0.0068, "step": 15292 }, { "epoch": 3.11, "learning_rate": 9.52246263212758e-05, "loss": 0.0092, "step": 15293 }, { "epoch": 3.11, "learning_rate": 9.520658014181925e-05, "loss": 0.01, "step": 15294 }, { "epoch": 3.11, "learning_rate": 9.51885348775162e-05, "loss": 0.0004, "step": 15295 }, { "epoch": 3.11, "learning_rate": 9.517049052866813e-05, "loss": 0.0008, "step": 15296 }, { "epoch": 3.11, "learning_rate": 9.51524470955763e-05, "loss": 0.0084, "step": 15297 }, { "epoch": 3.11, "learning_rate": 9.51344045785422e-05, "loss": 0.0107, "step": 15298 }, { "epoch": 3.12, "learning_rate": 9.511636297786711e-05, "loss": 0.0043, "step": 15299 }, { "epoch": 3.12, "learning_rate": 9.509832229385228e-05, "loss": 0.0054, "step": 15300 }, { "epoch": 3.12, "learning_rate": 9.508028252679919e-05, "loss": 0.0005, "step": 15301 }, { "epoch": 3.12, "learning_rate": 9.506224367700897e-05, "loss": 0.0082, "step": 15302 }, { "epoch": 3.12, "learning_rate": 9.504420574478302e-05, "loss": 0.0009, "step": 15303 }, { "epoch": 3.12, "learning_rate": 9.502616873042261e-05, "loss": 0.0031, "step": 15304 }, { "epoch": 3.12, "learning_rate": 9.500813263422887e-05, "loss": 0.0032, "step": 15305 }, { "epoch": 3.12, "learning_rate": 9.49900974565032e-05, "loss": 0.0171, "step": 15306 }, { "epoch": 3.12, "learning_rate": 9.497206319754667e-05, "loss": 0.0004, "step": 15307 }, { "epoch": 3.12, "learning_rate": 9.495402985766063e-05, "loss": 0.0083, "step": 15308 }, { "epoch": 3.12, "learning_rate": 9.49359974371462e-05, "loss": 0.0088, "step": 15309 }, { "epoch": 3.12, "learning_rate": 9.491796593630448e-05, "loss": 0.0102, "step": 15310 }, { "epoch": 3.12, "learning_rate": 9.489993535543677e-05, "loss": 0.0011, "step": 15311 }, { "epoch": 3.12, "learning_rate": 9.488190569484408e-05, "loss": 0.0046, "step": 15312 }, { "epoch": 3.12, "learning_rate": 9.486387695482767e-05, "loss": 0.0006, "step": 15313 }, { "epoch": 3.12, "learning_rate": 9.484584913568857e-05, "loss": 0.0054, "step": 15314 }, { "epoch": 3.12, "learning_rate": 9.482782223772786e-05, "loss": 0.0017, "step": 15315 }, { "epoch": 3.12, "learning_rate": 9.480979626124672e-05, "loss": 0.0032, "step": 15316 }, { "epoch": 3.12, "learning_rate": 9.479177120654611e-05, "loss": 0.0006, "step": 15317 }, { "epoch": 3.12, "learning_rate": 9.47737470739272e-05, "loss": 0.0099, "step": 15318 }, { "epoch": 3.12, "learning_rate": 9.475572386369095e-05, "loss": 0.0036, "step": 15319 }, { "epoch": 3.12, "learning_rate": 9.473770157613834e-05, "loss": 0.0007, "step": 15320 }, { "epoch": 3.12, "learning_rate": 9.471968021157049e-05, "loss": 0.0067, "step": 15321 }, { "epoch": 3.12, "learning_rate": 9.47016597702883e-05, "loss": 0.0057, "step": 15322 }, { "epoch": 3.12, "learning_rate": 9.468364025259275e-05, "loss": 0.0034, "step": 15323 }, { "epoch": 3.12, "learning_rate": 9.466562165878486e-05, "loss": 0.0136, "step": 15324 }, { "epoch": 3.12, "learning_rate": 9.464760398916549e-05, "loss": 0.0081, "step": 15325 }, { "epoch": 3.12, "learning_rate": 9.462958724403568e-05, "loss": 0.0014, "step": 15326 }, { "epoch": 3.12, "learning_rate": 9.46115714236963e-05, "loss": 0.0002, "step": 15327 }, { "epoch": 3.12, "learning_rate": 9.459355652844814e-05, "loss": 0.0045, "step": 15328 }, { "epoch": 3.12, "learning_rate": 9.457554255859226e-05, "loss": 0.0038, "step": 15329 }, { "epoch": 3.12, "learning_rate": 9.455752951442936e-05, "loss": 0.0088, "step": 15330 }, { "epoch": 3.12, "learning_rate": 9.453951739626044e-05, "loss": 0.0015, "step": 15331 }, { "epoch": 3.12, "learning_rate": 9.452150620438627e-05, "loss": 0.0032, "step": 15332 }, { "epoch": 3.12, "learning_rate": 9.450349593910761e-05, "loss": 0.0045, "step": 15333 }, { "epoch": 3.12, "learning_rate": 9.448548660072536e-05, "loss": 0.0171, "step": 15334 }, { "epoch": 3.12, "learning_rate": 9.446747818954025e-05, "loss": 0.0031, "step": 15335 }, { "epoch": 3.12, "learning_rate": 9.444947070585311e-05, "loss": 0.0032, "step": 15336 }, { "epoch": 3.12, "learning_rate": 9.443146414996468e-05, "loss": 0.005, "step": 15337 }, { "epoch": 3.12, "learning_rate": 9.441345852217564e-05, "loss": 0.0033, "step": 15338 }, { "epoch": 3.12, "learning_rate": 9.439545382278682e-05, "loss": 0.0009, "step": 15339 }, { "epoch": 3.12, "learning_rate": 9.437745005209883e-05, "loss": 0.0012, "step": 15340 }, { "epoch": 3.12, "learning_rate": 9.435944721041248e-05, "loss": 0.0061, "step": 15341 }, { "epoch": 3.12, "learning_rate": 9.434144529802839e-05, "loss": 0.0037, "step": 15342 }, { "epoch": 3.12, "learning_rate": 9.432344431524718e-05, "loss": 0.0148, "step": 15343 }, { "epoch": 3.12, "learning_rate": 9.430544426236955e-05, "loss": 0.0066, "step": 15344 }, { "epoch": 3.12, "learning_rate": 9.428744513969618e-05, "loss": 0.003, "step": 15345 }, { "epoch": 3.12, "learning_rate": 9.426944694752756e-05, "loss": 0.0089, "step": 15346 }, { "epoch": 3.12, "learning_rate": 9.425144968616445e-05, "loss": 0.0071, "step": 15347 }, { "epoch": 3.13, "learning_rate": 9.42334533559073e-05, "loss": 0.0064, "step": 15348 }, { "epoch": 3.13, "learning_rate": 9.421545795705682e-05, "loss": 0.0036, "step": 15349 }, { "epoch": 3.13, "learning_rate": 9.419746348991347e-05, "loss": 0.0047, "step": 15350 }, { "epoch": 3.13, "learning_rate": 9.417946995477778e-05, "loss": 0.0013, "step": 15351 }, { "epoch": 3.13, "learning_rate": 9.416147735195035e-05, "loss": 0.0026, "step": 15352 }, { "epoch": 3.13, "learning_rate": 9.41434856817316e-05, "loss": 0.0021, "step": 15353 }, { "epoch": 3.13, "learning_rate": 9.412549494442213e-05, "loss": 0.0154, "step": 15354 }, { "epoch": 3.13, "learning_rate": 9.410750514032234e-05, "loss": 0.0077, "step": 15355 }, { "epoch": 3.13, "learning_rate": 9.408951626973268e-05, "loss": 0.0253, "step": 15356 }, { "epoch": 3.13, "learning_rate": 9.407152833295372e-05, "loss": 0.0014, "step": 15357 }, { "epoch": 3.13, "learning_rate": 9.405354133028572e-05, "loss": 0.0103, "step": 15358 }, { "epoch": 3.13, "learning_rate": 9.403555526202927e-05, "loss": 0.0015, "step": 15359 }, { "epoch": 3.13, "learning_rate": 9.401757012848467e-05, "loss": 0.0017, "step": 15360 }, { "epoch": 3.13, "learning_rate": 9.399958592995228e-05, "loss": 0.0015, "step": 15361 }, { "epoch": 3.13, "learning_rate": 9.398160266673255e-05, "loss": 0.0048, "step": 15362 }, { "epoch": 3.13, "learning_rate": 9.396362033912575e-05, "loss": 0.0024, "step": 15363 }, { "epoch": 3.13, "learning_rate": 9.394563894743234e-05, "loss": 0.0038, "step": 15364 }, { "epoch": 3.13, "learning_rate": 9.392765849195252e-05, "loss": 0.0061, "step": 15365 }, { "epoch": 3.13, "learning_rate": 9.390967897298666e-05, "loss": 0.0035, "step": 15366 }, { "epoch": 3.13, "learning_rate": 9.389170039083502e-05, "loss": 0.0058, "step": 15367 }, { "epoch": 3.13, "learning_rate": 9.387372274579789e-05, "loss": 0.0053, "step": 15368 }, { "epoch": 3.13, "learning_rate": 9.385574603817559e-05, "loss": 0.0141, "step": 15369 }, { "epoch": 3.13, "learning_rate": 9.38377702682683e-05, "loss": 0.0052, "step": 15370 }, { "epoch": 3.13, "learning_rate": 9.381979543637621e-05, "loss": 0.0021, "step": 15371 }, { "epoch": 3.13, "learning_rate": 9.380182154279964e-05, "loss": 0.0044, "step": 15372 }, { "epoch": 3.13, "learning_rate": 9.378384858783874e-05, "loss": 0.0029, "step": 15373 }, { "epoch": 3.13, "learning_rate": 9.37658765717936e-05, "loss": 0.0041, "step": 15374 }, { "epoch": 3.13, "learning_rate": 9.374790549496451e-05, "loss": 0.0044, "step": 15375 }, { "epoch": 3.13, "learning_rate": 9.372993535765159e-05, "loss": 0.0009, "step": 15376 }, { "epoch": 3.13, "learning_rate": 9.371196616015498e-05, "loss": 0.0053, "step": 15377 }, { "epoch": 3.13, "learning_rate": 9.36939979027748e-05, "loss": 0.0059, "step": 15378 }, { "epoch": 3.13, "learning_rate": 9.367603058581107e-05, "loss": 0.0029, "step": 15379 }, { "epoch": 3.13, "learning_rate": 9.365806420956402e-05, "loss": 0.0031, "step": 15380 }, { "epoch": 3.13, "learning_rate": 9.36400987743336e-05, "loss": 0.0055, "step": 15381 }, { "epoch": 3.13, "learning_rate": 9.362213428041997e-05, "loss": 0.007, "step": 15382 }, { "epoch": 3.13, "learning_rate": 9.36041707281231e-05, "loss": 0.0049, "step": 15383 }, { "epoch": 3.13, "learning_rate": 9.358620811774299e-05, "loss": 0.0016, "step": 15384 }, { "epoch": 3.13, "learning_rate": 9.356824644957976e-05, "loss": 0.0049, "step": 15385 }, { "epoch": 3.13, "learning_rate": 9.355028572393327e-05, "loss": 0.0161, "step": 15386 }, { "epoch": 3.13, "learning_rate": 9.35323259411036e-05, "loss": 0.0076, "step": 15387 }, { "epoch": 3.13, "learning_rate": 9.35143671013907e-05, "loss": 0.0049, "step": 15388 }, { "epoch": 3.13, "learning_rate": 9.349640920509444e-05, "loss": 0.0046, "step": 15389 }, { "epoch": 3.13, "learning_rate": 9.347845225251484e-05, "loss": 0.0071, "step": 15390 }, { "epoch": 3.13, "learning_rate": 9.346049624395175e-05, "loss": 0.0077, "step": 15391 }, { "epoch": 3.13, "learning_rate": 9.344254117970515e-05, "loss": 0.0069, "step": 15392 }, { "epoch": 3.13, "learning_rate": 9.342458706007487e-05, "loss": 0.0041, "step": 15393 }, { "epoch": 3.13, "learning_rate": 9.34066338853607e-05, "loss": 0.0021, "step": 15394 }, { "epoch": 3.13, "learning_rate": 9.338868165586268e-05, "loss": 0.004, "step": 15395 }, { "epoch": 3.13, "learning_rate": 9.337073037188046e-05, "loss": 0.0002, "step": 15396 }, { "epoch": 3.14, "learning_rate": 9.335278003371394e-05, "loss": 0.0153, "step": 15397 }, { "epoch": 3.14, "learning_rate": 9.333483064166295e-05, "loss": 0.001, "step": 15398 }, { "epoch": 3.14, "learning_rate": 9.331688219602721e-05, "loss": 0.0134, "step": 15399 }, { "epoch": 3.14, "learning_rate": 9.32989346971066e-05, "loss": 0.0133, "step": 15400 }, { "epoch": 3.14, "learning_rate": 9.328098814520081e-05, "loss": 0.0055, "step": 15401 }, { "epoch": 3.14, "learning_rate": 9.326304254060952e-05, "loss": 0.0056, "step": 15402 }, { "epoch": 3.14, "learning_rate": 9.324509788363257e-05, "loss": 0.0069, "step": 15403 }, { "epoch": 3.14, "learning_rate": 9.322715417456958e-05, "loss": 0.0149, "step": 15404 }, { "epoch": 3.14, "learning_rate": 9.32092114137203e-05, "loss": 0.0058, "step": 15405 }, { "epoch": 3.14, "learning_rate": 9.319126960138441e-05, "loss": 0.004, "step": 15406 }, { "epoch": 3.14, "learning_rate": 9.317332873786151e-05, "loss": 0.002, "step": 15407 }, { "epoch": 3.14, "learning_rate": 9.315538882345131e-05, "loss": 0.0019, "step": 15408 }, { "epoch": 3.14, "learning_rate": 9.31374498584534e-05, "loss": 0.0077, "step": 15409 }, { "epoch": 3.14, "learning_rate": 9.311951184316743e-05, "loss": 0.0016, "step": 15410 }, { "epoch": 3.14, "learning_rate": 9.310157477789302e-05, "loss": 0.0038, "step": 15411 }, { "epoch": 3.14, "learning_rate": 9.308363866292965e-05, "loss": 0.0074, "step": 15412 }, { "epoch": 3.14, "learning_rate": 9.3065703498577e-05, "loss": 0.0092, "step": 15413 }, { "epoch": 3.14, "learning_rate": 9.304776928513451e-05, "loss": 0.0089, "step": 15414 }, { "epoch": 3.14, "learning_rate": 9.302983602290186e-05, "loss": 0.0004, "step": 15415 }, { "epoch": 3.14, "learning_rate": 9.301190371217844e-05, "loss": 0.0014, "step": 15416 }, { "epoch": 3.14, "learning_rate": 9.29939723532638e-05, "loss": 0.0121, "step": 15417 }, { "epoch": 3.14, "learning_rate": 9.297604194645743e-05, "loss": 0.0066, "step": 15418 }, { "epoch": 3.14, "learning_rate": 9.295811249205884e-05, "loss": 0.0016, "step": 15419 }, { "epoch": 3.14, "learning_rate": 9.294018399036738e-05, "loss": 0.0043, "step": 15420 }, { "epoch": 3.14, "learning_rate": 9.29222564416826e-05, "loss": 0.0035, "step": 15421 }, { "epoch": 3.14, "learning_rate": 9.290432984630385e-05, "loss": 0.002, "step": 15422 }, { "epoch": 3.14, "learning_rate": 9.288640420453061e-05, "loss": 0.0028, "step": 15423 }, { "epoch": 3.14, "learning_rate": 9.286847951666222e-05, "loss": 0.0024, "step": 15424 }, { "epoch": 3.14, "learning_rate": 9.285055578299801e-05, "loss": 0.002, "step": 15425 }, { "epoch": 3.14, "learning_rate": 9.283263300383745e-05, "loss": 0.0016, "step": 15426 }, { "epoch": 3.14, "learning_rate": 9.281471117947979e-05, "loss": 0.0069, "step": 15427 }, { "epoch": 3.14, "learning_rate": 9.279679031022442e-05, "loss": 0.0061, "step": 15428 }, { "epoch": 3.14, "learning_rate": 9.277887039637066e-05, "loss": 0.0087, "step": 15429 }, { "epoch": 3.14, "learning_rate": 9.276095143821771e-05, "loss": 0.0077, "step": 15430 }, { "epoch": 3.14, "learning_rate": 9.274303343606497e-05, "loss": 0.0036, "step": 15431 }, { "epoch": 3.14, "learning_rate": 9.27251163902116e-05, "loss": 0.0099, "step": 15432 }, { "epoch": 3.14, "learning_rate": 9.270720030095698e-05, "loss": 0.0014, "step": 15433 }, { "epoch": 3.14, "learning_rate": 9.268928516860023e-05, "loss": 0.0036, "step": 15434 }, { "epoch": 3.14, "learning_rate": 9.267137099344058e-05, "loss": 0.0022, "step": 15435 }, { "epoch": 3.14, "learning_rate": 9.265345777577728e-05, "loss": 0.0073, "step": 15436 }, { "epoch": 3.14, "learning_rate": 9.263554551590943e-05, "loss": 0.005, "step": 15437 }, { "epoch": 3.14, "learning_rate": 9.261763421413631e-05, "loss": 0.0044, "step": 15438 }, { "epoch": 3.14, "learning_rate": 9.2599723870757e-05, "loss": 0.0027, "step": 15439 }, { "epoch": 3.14, "learning_rate": 9.258181448607062e-05, "loss": 0.0051, "step": 15440 }, { "epoch": 3.14, "learning_rate": 9.256390606037637e-05, "loss": 0.008, "step": 15441 }, { "epoch": 3.14, "learning_rate": 9.254599859397323e-05, "loss": 0.0013, "step": 15442 }, { "epoch": 3.14, "learning_rate": 9.252809208716047e-05, "loss": 0.0056, "step": 15443 }, { "epoch": 3.14, "learning_rate": 9.251018654023701e-05, "loss": 0.0026, "step": 15444 }, { "epoch": 3.14, "learning_rate": 9.249228195350192e-05, "loss": 0.0011, "step": 15445 }, { "epoch": 3.15, "learning_rate": 9.247437832725435e-05, "loss": 0.0001, "step": 15446 }, { "epoch": 3.15, "learning_rate": 9.24564756617932e-05, "loss": 0.0062, "step": 15447 }, { "epoch": 3.15, "learning_rate": 9.243857395741753e-05, "loss": 0.0058, "step": 15448 }, { "epoch": 3.15, "learning_rate": 9.242067321442634e-05, "loss": 0.0105, "step": 15449 }, { "epoch": 3.15, "learning_rate": 9.240277343311854e-05, "loss": 0.0022, "step": 15450 }, { "epoch": 3.15, "learning_rate": 9.238487461379323e-05, "loss": 0.0047, "step": 15451 }, { "epoch": 3.15, "learning_rate": 9.236697675674927e-05, "loss": 0.0032, "step": 15452 }, { "epoch": 3.15, "learning_rate": 9.234907986228552e-05, "loss": 0.005, "step": 15453 }, { "epoch": 3.15, "learning_rate": 9.233118393070103e-05, "loss": 0.0094, "step": 15454 }, { "epoch": 3.15, "learning_rate": 9.231328896229454e-05, "loss": 0.0011, "step": 15455 }, { "epoch": 3.15, "learning_rate": 9.22953949573651e-05, "loss": 0.0091, "step": 15456 }, { "epoch": 3.15, "learning_rate": 9.227750191621146e-05, "loss": 0.0103, "step": 15457 }, { "epoch": 3.15, "learning_rate": 9.225960983913248e-05, "loss": 0.0008, "step": 15458 }, { "epoch": 3.15, "learning_rate": 9.2241718726427e-05, "loss": 0.0049, "step": 15459 }, { "epoch": 3.15, "learning_rate": 9.222382857839387e-05, "loss": 0.0073, "step": 15460 }, { "epoch": 3.15, "learning_rate": 9.220593939533186e-05, "loss": 0.0006, "step": 15461 }, { "epoch": 3.15, "learning_rate": 9.218805117753979e-05, "loss": 0.0244, "step": 15462 }, { "epoch": 3.15, "learning_rate": 9.217016392531632e-05, "loss": 0.0089, "step": 15463 }, { "epoch": 3.15, "learning_rate": 9.215227763896033e-05, "loss": 0.002, "step": 15464 }, { "epoch": 3.15, "learning_rate": 9.213439231877046e-05, "loss": 0.0012, "step": 15465 }, { "epoch": 3.15, "learning_rate": 9.211650796504551e-05, "loss": 0.0045, "step": 15466 }, { "epoch": 3.15, "learning_rate": 9.209862457808414e-05, "loss": 0.0043, "step": 15467 }, { "epoch": 3.15, "learning_rate": 9.208074215818498e-05, "loss": 0.0116, "step": 15468 }, { "epoch": 3.15, "learning_rate": 9.206286070564678e-05, "loss": 0.0089, "step": 15469 }, { "epoch": 3.15, "learning_rate": 9.204498022076822e-05, "loss": 0.0055, "step": 15470 }, { "epoch": 3.15, "learning_rate": 9.20271007038478e-05, "loss": 0.0053, "step": 15471 }, { "epoch": 3.15, "learning_rate": 9.200922215518431e-05, "loss": 0.0186, "step": 15472 }, { "epoch": 3.15, "learning_rate": 9.19913445750762e-05, "loss": 0.0079, "step": 15473 }, { "epoch": 3.15, "learning_rate": 9.197346796382222e-05, "loss": 0.0093, "step": 15474 }, { "epoch": 3.15, "learning_rate": 9.195559232172083e-05, "loss": 0.0044, "step": 15475 }, { "epoch": 3.15, "learning_rate": 9.193771764907058e-05, "loss": 0.0054, "step": 15476 }, { "epoch": 3.15, "learning_rate": 9.191984394617008e-05, "loss": 0.0093, "step": 15477 }, { "epoch": 3.15, "learning_rate": 9.190197121331778e-05, "loss": 0.0022, "step": 15478 }, { "epoch": 3.15, "learning_rate": 9.188409945081228e-05, "loss": 0.002, "step": 15479 }, { "epoch": 3.15, "learning_rate": 9.186622865895199e-05, "loss": 0.0015, "step": 15480 }, { "epoch": 3.15, "learning_rate": 9.18483588380354e-05, "loss": 0.0068, "step": 15481 }, { "epoch": 3.15, "learning_rate": 9.183048998836102e-05, "loss": 0.0071, "step": 15482 }, { "epoch": 3.15, "learning_rate": 9.181262211022722e-05, "loss": 0.0044, "step": 15483 }, { "epoch": 3.15, "learning_rate": 9.179475520393252e-05, "loss": 0.0084, "step": 15484 }, { "epoch": 3.15, "learning_rate": 9.177688926977529e-05, "loss": 0.0016, "step": 15485 }, { "epoch": 3.15, "learning_rate": 9.175902430805385e-05, "loss": 0.0018, "step": 15486 }, { "epoch": 3.15, "learning_rate": 9.174116031906667e-05, "loss": 0.0059, "step": 15487 }, { "epoch": 3.15, "learning_rate": 9.172329730311206e-05, "loss": 0.006, "step": 15488 }, { "epoch": 3.15, "learning_rate": 9.170543526048844e-05, "loss": 0.0092, "step": 15489 }, { "epoch": 3.15, "learning_rate": 9.168757419149405e-05, "loss": 0.0041, "step": 15490 }, { "epoch": 3.15, "learning_rate": 9.166971409642727e-05, "loss": 0.0026, "step": 15491 }, { "epoch": 3.15, "learning_rate": 9.165185497558636e-05, "loss": 0.0033, "step": 15492 }, { "epoch": 3.15, "learning_rate": 9.163399682926962e-05, "loss": 0.0099, "step": 15493 }, { "epoch": 3.15, "learning_rate": 9.161613965777528e-05, "loss": 0.0082, "step": 15494 }, { "epoch": 3.16, "learning_rate": 9.159828346140164e-05, "loss": 0.0041, "step": 15495 }, { "epoch": 3.16, "learning_rate": 9.158042824044686e-05, "loss": 0.0028, "step": 15496 }, { "epoch": 3.16, "learning_rate": 9.156257399520928e-05, "loss": 0.0029, "step": 15497 }, { "epoch": 3.16, "learning_rate": 9.154472072598702e-05, "loss": 0.0111, "step": 15498 }, { "epoch": 3.16, "learning_rate": 9.15268684330782e-05, "loss": 0.0009, "step": 15499 }, { "epoch": 3.16, "learning_rate": 9.150901711678106e-05, "loss": 0.0035, "step": 15500 }, { "epoch": 3.16, "learning_rate": 9.149116677739377e-05, "loss": 0.007, "step": 15501 }, { "epoch": 3.16, "learning_rate": 9.147331741521443e-05, "loss": 0.0029, "step": 15502 }, { "epoch": 3.16, "learning_rate": 9.145546903054118e-05, "loss": 0.0064, "step": 15503 }, { "epoch": 3.16, "learning_rate": 9.143762162367208e-05, "loss": 0.0012, "step": 15504 }, { "epoch": 3.16, "learning_rate": 9.14197751949053e-05, "loss": 0.001, "step": 15505 }, { "epoch": 3.16, "learning_rate": 9.140192974453876e-05, "loss": 0.0021, "step": 15506 }, { "epoch": 3.16, "learning_rate": 9.138408527287069e-05, "loss": 0.0177, "step": 15507 }, { "epoch": 3.16, "learning_rate": 9.136624178019904e-05, "loss": 0.0022, "step": 15508 }, { "epoch": 3.16, "learning_rate": 9.134839926682179e-05, "loss": 0.0115, "step": 15509 }, { "epoch": 3.16, "learning_rate": 9.133055773303698e-05, "loss": 0.009, "step": 15510 }, { "epoch": 3.16, "learning_rate": 9.131271717914262e-05, "loss": 0.0066, "step": 15511 }, { "epoch": 3.16, "learning_rate": 9.129487760543664e-05, "loss": 0.0018, "step": 15512 }, { "epoch": 3.16, "learning_rate": 9.127703901221707e-05, "loss": 0.0047, "step": 15513 }, { "epoch": 3.16, "learning_rate": 9.125920139978174e-05, "loss": 0.0039, "step": 15514 }, { "epoch": 3.16, "learning_rate": 9.124136476842867e-05, "loss": 0.005, "step": 15515 }, { "epoch": 3.16, "learning_rate": 9.122352911845568e-05, "loss": 0.0098, "step": 15516 }, { "epoch": 3.16, "learning_rate": 9.120569445016075e-05, "loss": 0.0021, "step": 15517 }, { "epoch": 3.16, "learning_rate": 9.118786076384172e-05, "loss": 0.001, "step": 15518 }, { "epoch": 3.16, "learning_rate": 9.117002805979636e-05, "loss": 0.0069, "step": 15519 }, { "epoch": 3.16, "learning_rate": 9.115219633832265e-05, "loss": 0.0119, "step": 15520 }, { "epoch": 3.16, "learning_rate": 9.11343655997183e-05, "loss": 0.0084, "step": 15521 }, { "epoch": 3.16, "learning_rate": 9.111653584428114e-05, "loss": 0.0043, "step": 15522 }, { "epoch": 3.16, "learning_rate": 9.109870707230904e-05, "loss": 0.0028, "step": 15523 }, { "epoch": 3.16, "learning_rate": 9.108087928409965e-05, "loss": 0.0108, "step": 15524 }, { "epoch": 3.16, "learning_rate": 9.106305247995086e-05, "loss": 0.0119, "step": 15525 }, { "epoch": 3.16, "learning_rate": 9.104522666016033e-05, "loss": 0.0086, "step": 15526 }, { "epoch": 3.16, "learning_rate": 9.102740182502576e-05, "loss": 0.0027, "step": 15527 }, { "epoch": 3.16, "learning_rate": 9.100957797484495e-05, "loss": 0.0004, "step": 15528 }, { "epoch": 3.16, "learning_rate": 9.09917551099155e-05, "loss": 0.0076, "step": 15529 }, { "epoch": 3.16, "learning_rate": 9.097393323053517e-05, "loss": 0.0031, "step": 15530 }, { "epoch": 3.16, "learning_rate": 9.095611233700152e-05, "loss": 0.0043, "step": 15531 }, { "epoch": 3.16, "learning_rate": 9.093829242961228e-05, "loss": 0.0064, "step": 15532 }, { "epoch": 3.16, "learning_rate": 9.092047350866503e-05, "loss": 0.0044, "step": 15533 }, { "epoch": 3.16, "learning_rate": 9.090265557445737e-05, "loss": 0.0036, "step": 15534 }, { "epoch": 3.16, "learning_rate": 9.088483862728696e-05, "loss": 0.0004, "step": 15535 }, { "epoch": 3.16, "learning_rate": 9.086702266745135e-05, "loss": 0.0056, "step": 15536 }, { "epoch": 3.16, "learning_rate": 9.084920769524803e-05, "loss": 0.003, "step": 15537 }, { "epoch": 3.16, "learning_rate": 9.083139371097464e-05, "loss": 0.0182, "step": 15538 }, { "epoch": 3.16, "learning_rate": 9.081358071492862e-05, "loss": 0.0089, "step": 15539 }, { "epoch": 3.16, "learning_rate": 9.079576870740754e-05, "loss": 0.0015, "step": 15540 }, { "epoch": 3.16, "learning_rate": 9.07779576887089e-05, "loss": 0.0046, "step": 15541 }, { "epoch": 3.16, "learning_rate": 9.076014765913013e-05, "loss": 0.0069, "step": 15542 }, { "epoch": 3.16, "learning_rate": 9.074233861896874e-05, "loss": 0.005, "step": 15543 }, { "epoch": 3.17, "learning_rate": 9.072453056852215e-05, "loss": 0.0027, "step": 15544 }, { "epoch": 3.17, "learning_rate": 9.070672350808775e-05, "loss": 0.0072, "step": 15545 }, { "epoch": 3.17, "learning_rate": 9.068891743796305e-05, "loss": 0.0055, "step": 15546 }, { "epoch": 3.17, "learning_rate": 9.067111235844531e-05, "loss": 0.0112, "step": 15547 }, { "epoch": 3.17, "learning_rate": 9.065330826983207e-05, "loss": 0.004, "step": 15548 }, { "epoch": 3.17, "learning_rate": 9.06355051724206e-05, "loss": 0.0039, "step": 15549 }, { "epoch": 3.17, "learning_rate": 9.061770306650817e-05, "loss": 0.0027, "step": 15550 }, { "epoch": 3.17, "learning_rate": 9.059990195239227e-05, "loss": 0.0032, "step": 15551 }, { "epoch": 3.17, "learning_rate": 9.058210183037007e-05, "loss": 0.0107, "step": 15552 }, { "epoch": 3.17, "learning_rate": 9.056430270073895e-05, "loss": 0.0045, "step": 15553 }, { "epoch": 3.17, "learning_rate": 9.054650456379623e-05, "loss": 0.003, "step": 15554 }, { "epoch": 3.17, "learning_rate": 9.052870741983901e-05, "loss": 0.0173, "step": 15555 }, { "epoch": 3.17, "learning_rate": 9.051091126916471e-05, "loss": 0.0092, "step": 15556 }, { "epoch": 3.17, "learning_rate": 9.049311611207043e-05, "loss": 0.003, "step": 15557 }, { "epoch": 3.17, "learning_rate": 9.04753219488535e-05, "loss": 0.0026, "step": 15558 }, { "epoch": 3.17, "learning_rate": 9.045752877981105e-05, "loss": 0.0009, "step": 15559 }, { "epoch": 3.17, "learning_rate": 9.043973660524022e-05, "loss": 0.0056, "step": 15560 }, { "epoch": 3.17, "learning_rate": 9.042194542543825e-05, "loss": 0.0141, "step": 15561 }, { "epoch": 3.17, "learning_rate": 9.040415524070221e-05, "loss": 0.0081, "step": 15562 }, { "epoch": 3.17, "learning_rate": 9.038636605132929e-05, "loss": 0.0013, "step": 15563 }, { "epoch": 3.17, "learning_rate": 9.036857785761663e-05, "loss": 0.0025, "step": 15564 }, { "epoch": 3.17, "learning_rate": 9.035079065986122e-05, "loss": 0.006, "step": 15565 }, { "epoch": 3.17, "learning_rate": 9.033300445836025e-05, "loss": 0.0036, "step": 15566 }, { "epoch": 3.17, "learning_rate": 9.031521925341073e-05, "loss": 0.009, "step": 15567 }, { "epoch": 3.17, "learning_rate": 9.029743504530968e-05, "loss": 0.005, "step": 15568 }, { "epoch": 3.17, "learning_rate": 9.02796518343542e-05, "loss": 0.005, "step": 15569 }, { "epoch": 3.17, "learning_rate": 9.026186962084122e-05, "loss": 0.004, "step": 15570 }, { "epoch": 3.17, "learning_rate": 9.024408840506782e-05, "loss": 0.0084, "step": 15571 }, { "epoch": 3.17, "learning_rate": 9.02263081873309e-05, "loss": 0.002, "step": 15572 }, { "epoch": 3.17, "learning_rate": 9.02085289679275e-05, "loss": 0.0117, "step": 15573 }, { "epoch": 3.17, "learning_rate": 9.019075074715452e-05, "loss": 0.0012, "step": 15574 }, { "epoch": 3.17, "learning_rate": 9.017297352530887e-05, "loss": 0.0028, "step": 15575 }, { "epoch": 3.17, "learning_rate": 9.015519730268754e-05, "loss": 0.0012, "step": 15576 }, { "epoch": 3.17, "learning_rate": 9.013742207958741e-05, "loss": 0.0088, "step": 15577 }, { "epoch": 3.17, "learning_rate": 9.011964785630523e-05, "loss": 0.0024, "step": 15578 }, { "epoch": 3.17, "learning_rate": 9.010187463313805e-05, "loss": 0.0082, "step": 15579 }, { "epoch": 3.17, "learning_rate": 9.008410241038257e-05, "loss": 0.0037, "step": 15580 }, { "epoch": 3.17, "learning_rate": 9.006633118833572e-05, "loss": 0.0015, "step": 15581 }, { "epoch": 3.17, "learning_rate": 9.004856096729425e-05, "loss": 0.0034, "step": 15582 }, { "epoch": 3.17, "learning_rate": 9.003079174755499e-05, "loss": 0.005, "step": 15583 }, { "epoch": 3.17, "learning_rate": 9.001302352941471e-05, "loss": 0.0047, "step": 15584 }, { "epoch": 3.17, "learning_rate": 8.999525631317015e-05, "loss": 0.0007, "step": 15585 }, { "epoch": 3.17, "learning_rate": 8.997749009911808e-05, "loss": 0.0061, "step": 15586 }, { "epoch": 3.17, "learning_rate": 8.995972488755527e-05, "loss": 0.0011, "step": 15587 }, { "epoch": 3.17, "learning_rate": 8.99419606787783e-05, "loss": 0.0009, "step": 15588 }, { "epoch": 3.17, "learning_rate": 8.992419747308406e-05, "loss": 0.0007, "step": 15589 }, { "epoch": 3.17, "learning_rate": 8.990643527076902e-05, "loss": 0.0046, "step": 15590 }, { "epoch": 3.17, "learning_rate": 8.988867407213001e-05, "loss": 0.0074, "step": 15591 }, { "epoch": 3.17, "learning_rate": 8.987091387746366e-05, "loss": 0.0074, "step": 15592 }, { "epoch": 3.18, "learning_rate": 8.985315468706643e-05, "loss": 0.0132, "step": 15593 }, { "epoch": 3.18, "learning_rate": 8.983539650123512e-05, "loss": 0.0048, "step": 15594 }, { "epoch": 3.18, "learning_rate": 8.981763932026627e-05, "loss": 0.0042, "step": 15595 }, { "epoch": 3.18, "learning_rate": 8.979988314445638e-05, "loss": 0.0064, "step": 15596 }, { "epoch": 3.18, "learning_rate": 8.978212797410216e-05, "loss": 0.0014, "step": 15597 }, { "epoch": 3.18, "learning_rate": 8.97643738095e-05, "loss": 0.0019, "step": 15598 }, { "epoch": 3.18, "learning_rate": 8.974662065094655e-05, "loss": 0.0066, "step": 15599 }, { "epoch": 3.18, "learning_rate": 8.972886849873828e-05, "loss": 0.0029, "step": 15600 }, { "epoch": 3.18, "learning_rate": 8.971111735317162e-05, "loss": 0.0016, "step": 15601 }, { "epoch": 3.18, "learning_rate": 8.969336721454317e-05, "loss": 0.0015, "step": 15602 }, { "epoch": 3.18, "learning_rate": 8.967561808314923e-05, "loss": 0.007, "step": 15603 }, { "epoch": 3.18, "learning_rate": 8.965786995928644e-05, "loss": 0.0082, "step": 15604 }, { "epoch": 3.18, "learning_rate": 8.964012284325108e-05, "loss": 0.003, "step": 15605 }, { "epoch": 3.18, "learning_rate": 8.962237673533957e-05, "loss": 0.001, "step": 15606 }, { "epoch": 3.18, "learning_rate": 8.96046316358484e-05, "loss": 0.003, "step": 15607 }, { "epoch": 3.18, "learning_rate": 8.958688754507383e-05, "loss": 0.0043, "step": 15608 }, { "epoch": 3.18, "learning_rate": 8.956914446331232e-05, "loss": 0.0131, "step": 15609 }, { "epoch": 3.18, "learning_rate": 8.95514023908602e-05, "loss": 0.0014, "step": 15610 }, { "epoch": 3.18, "learning_rate": 8.95336613280137e-05, "loss": 0.0033, "step": 15611 }, { "epoch": 3.18, "learning_rate": 8.951592127506923e-05, "loss": 0.0141, "step": 15612 }, { "epoch": 3.18, "learning_rate": 8.949818223232301e-05, "loss": 0.0024, "step": 15613 }, { "epoch": 3.18, "learning_rate": 8.948044420007138e-05, "loss": 0.0015, "step": 15614 }, { "epoch": 3.18, "learning_rate": 8.946270717861058e-05, "loss": 0.0053, "step": 15615 }, { "epoch": 3.18, "learning_rate": 8.944497116823682e-05, "loss": 0.0018, "step": 15616 }, { "epoch": 3.18, "learning_rate": 8.942723616924635e-05, "loss": 0.0054, "step": 15617 }, { "epoch": 3.18, "learning_rate": 8.94095021819354e-05, "loss": 0.007, "step": 15618 }, { "epoch": 3.18, "learning_rate": 8.939176920660009e-05, "loss": 0.0068, "step": 15619 }, { "epoch": 3.18, "learning_rate": 8.93740372435367e-05, "loss": 0.0012, "step": 15620 }, { "epoch": 3.18, "learning_rate": 8.935630629304125e-05, "loss": 0.0079, "step": 15621 }, { "epoch": 3.18, "learning_rate": 8.933857635541003e-05, "loss": 0.0125, "step": 15622 }, { "epoch": 3.18, "learning_rate": 8.932084743093911e-05, "loss": 0.0079, "step": 15623 }, { "epoch": 3.18, "learning_rate": 8.93031195199245e-05, "loss": 0.0118, "step": 15624 }, { "epoch": 3.18, "learning_rate": 8.928539262266236e-05, "loss": 0.003, "step": 15625 }, { "epoch": 3.18, "learning_rate": 8.926766673944882e-05, "loss": 0.0091, "step": 15626 }, { "epoch": 3.18, "learning_rate": 8.924994187057987e-05, "loss": 0.0218, "step": 15627 }, { "epoch": 3.18, "learning_rate": 8.923221801635161e-05, "loss": 0.0035, "step": 15628 }, { "epoch": 3.18, "learning_rate": 8.921449517705994e-05, "loss": 0.0051, "step": 15629 }, { "epoch": 3.18, "learning_rate": 8.9196773353001e-05, "loss": 0.0096, "step": 15630 }, { "epoch": 3.18, "learning_rate": 8.917905254447067e-05, "loss": 0.0062, "step": 15631 }, { "epoch": 3.18, "learning_rate": 8.916133275176501e-05, "loss": 0.0048, "step": 15632 }, { "epoch": 3.18, "learning_rate": 8.914361397517995e-05, "loss": 0.0002, "step": 15633 }, { "epoch": 3.18, "learning_rate": 8.912589621501135e-05, "loss": 0.0002, "step": 15634 }, { "epoch": 3.18, "learning_rate": 8.910817947155523e-05, "loss": 0.0119, "step": 15635 }, { "epoch": 3.18, "learning_rate": 8.909046374510744e-05, "loss": 0.0082, "step": 15636 }, { "epoch": 3.18, "learning_rate": 8.907274903596387e-05, "loss": 0.0009, "step": 15637 }, { "epoch": 3.18, "learning_rate": 8.905503534442047e-05, "loss": 0.0087, "step": 15638 }, { "epoch": 3.18, "learning_rate": 8.903732267077292e-05, "loss": 0.0092, "step": 15639 }, { "epoch": 3.18, "learning_rate": 8.901961101531724e-05, "loss": 0.0081, "step": 15640 }, { "epoch": 3.18, "learning_rate": 8.900190037834915e-05, "loss": 0.014, "step": 15641 }, { "epoch": 3.19, "learning_rate": 8.89841907601644e-05, "loss": 0.0028, "step": 15642 }, { "epoch": 3.19, "learning_rate": 8.896648216105894e-05, "loss": 0.0033, "step": 15643 }, { "epoch": 3.19, "learning_rate": 8.894877458132833e-05, "loss": 0.0043, "step": 15644 }, { "epoch": 3.19, "learning_rate": 8.893106802126851e-05, "loss": 0.0031, "step": 15645 }, { "epoch": 3.19, "learning_rate": 8.891336248117509e-05, "loss": 0.0013, "step": 15646 }, { "epoch": 3.19, "learning_rate": 8.88956579613438e-05, "loss": 0.004, "step": 15647 }, { "epoch": 3.19, "learning_rate": 8.887795446207044e-05, "loss": 0.0004, "step": 15648 }, { "epoch": 3.19, "learning_rate": 8.886025198365054e-05, "loss": 0.0029, "step": 15649 }, { "epoch": 3.19, "learning_rate": 8.88425505263799e-05, "loss": 0.0011, "step": 15650 }, { "epoch": 3.19, "learning_rate": 8.882485009055412e-05, "loss": 0.0038, "step": 15651 }, { "epoch": 3.19, "learning_rate": 8.880715067646876e-05, "loss": 0.0013, "step": 15652 }, { "epoch": 3.19, "learning_rate": 8.878945228441954e-05, "loss": 0.0017, "step": 15653 }, { "epoch": 3.19, "learning_rate": 8.877175491470197e-05, "loss": 0.0014, "step": 15654 }, { "epoch": 3.19, "learning_rate": 8.87540585676117e-05, "loss": 0.0051, "step": 15655 }, { "epoch": 3.19, "learning_rate": 8.873636324344425e-05, "loss": 0.0012, "step": 15656 }, { "epoch": 3.19, "learning_rate": 8.871866894249516e-05, "loss": 0.0027, "step": 15657 }, { "epoch": 3.19, "learning_rate": 8.870097566505999e-05, "loss": 0.0021, "step": 15658 }, { "epoch": 3.19, "learning_rate": 8.868328341143423e-05, "loss": 0.0043, "step": 15659 }, { "epoch": 3.19, "learning_rate": 8.86655921819134e-05, "loss": 0.0031, "step": 15660 }, { "epoch": 3.19, "learning_rate": 8.864790197679299e-05, "loss": 0.0005, "step": 15661 }, { "epoch": 3.19, "learning_rate": 8.863021279636835e-05, "loss": 0.003, "step": 15662 }, { "epoch": 3.19, "learning_rate": 8.861252464093506e-05, "loss": 0.0051, "step": 15663 }, { "epoch": 3.19, "learning_rate": 8.859483751078842e-05, "loss": 0.0042, "step": 15664 }, { "epoch": 3.19, "learning_rate": 8.857715140622397e-05, "loss": 0.0009, "step": 15665 }, { "epoch": 3.19, "learning_rate": 8.855946632753701e-05, "loss": 0.0007, "step": 15666 }, { "epoch": 3.19, "learning_rate": 8.854178227502294e-05, "loss": 0.004, "step": 15667 }, { "epoch": 3.19, "learning_rate": 8.852409924897711e-05, "loss": 0.0211, "step": 15668 }, { "epoch": 3.19, "learning_rate": 8.85064172496949e-05, "loss": 0.0025, "step": 15669 }, { "epoch": 3.19, "learning_rate": 8.848873627747155e-05, "loss": 0.0033, "step": 15670 }, { "epoch": 3.19, "learning_rate": 8.847105633260247e-05, "loss": 0.0061, "step": 15671 }, { "epoch": 3.19, "learning_rate": 8.845337741538282e-05, "loss": 0.0018, "step": 15672 }, { "epoch": 3.19, "learning_rate": 8.8435699526108e-05, "loss": 0.002, "step": 15673 }, { "epoch": 3.19, "learning_rate": 8.841802266507322e-05, "loss": 0.0059, "step": 15674 }, { "epoch": 3.19, "learning_rate": 8.840034683257364e-05, "loss": 0.0152, "step": 15675 }, { "epoch": 3.19, "learning_rate": 8.838267202890462e-05, "loss": 0.0015, "step": 15676 }, { "epoch": 3.19, "learning_rate": 8.836499825436122e-05, "loss": 0.003, "step": 15677 }, { "epoch": 3.19, "learning_rate": 8.834732550923873e-05, "loss": 0.0072, "step": 15678 }, { "epoch": 3.19, "learning_rate": 8.832965379383229e-05, "loss": 0.0043, "step": 15679 }, { "epoch": 3.19, "learning_rate": 8.831198310843701e-05, "loss": 0.0003, "step": 15680 }, { "epoch": 3.19, "learning_rate": 8.82943134533481e-05, "loss": 0.0015, "step": 15681 }, { "epoch": 3.19, "learning_rate": 8.827664482886058e-05, "loss": 0.0005, "step": 15682 }, { "epoch": 3.19, "learning_rate": 8.825897723526966e-05, "loss": 0.0064, "step": 15683 }, { "epoch": 3.19, "learning_rate": 8.824131067287038e-05, "loss": 0.0084, "step": 15684 }, { "epoch": 3.19, "learning_rate": 8.82236451419577e-05, "loss": 0.005, "step": 15685 }, { "epoch": 3.19, "learning_rate": 8.820598064282683e-05, "loss": 0.01, "step": 15686 }, { "epoch": 3.19, "learning_rate": 8.818831717577267e-05, "loss": 0.0012, "step": 15687 }, { "epoch": 3.19, "learning_rate": 8.817065474109032e-05, "loss": 0.0064, "step": 15688 }, { "epoch": 3.19, "learning_rate": 8.815299333907478e-05, "loss": 0.0052, "step": 15689 }, { "epoch": 3.19, "learning_rate": 8.813533297002094e-05, "loss": 0.0074, "step": 15690 }, { "epoch": 3.19, "learning_rate": 8.811767363422387e-05, "loss": 0.0076, "step": 15691 }, { "epoch": 3.2, "learning_rate": 8.810001533197846e-05, "loss": 0.0053, "step": 15692 }, { "epoch": 3.2, "learning_rate": 8.808235806357956e-05, "loss": 0.001, "step": 15693 }, { "epoch": 3.2, "learning_rate": 8.806470182932224e-05, "loss": 0.0019, "step": 15694 }, { "epoch": 3.2, "learning_rate": 8.804704662950126e-05, "loss": 0.0055, "step": 15695 }, { "epoch": 3.2, "learning_rate": 8.802939246441159e-05, "loss": 0.0019, "step": 15696 }, { "epoch": 3.2, "learning_rate": 8.801173933434801e-05, "loss": 0.0111, "step": 15697 }, { "epoch": 3.2, "learning_rate": 8.79940872396054e-05, "loss": 0.0019, "step": 15698 }, { "epoch": 3.2, "learning_rate": 8.797643618047859e-05, "loss": 0.0068, "step": 15699 }, { "epoch": 3.2, "learning_rate": 8.795878615726234e-05, "loss": 0.0022, "step": 15700 }, { "epoch": 3.2, "learning_rate": 8.79411371702515e-05, "loss": 0.0023, "step": 15701 }, { "epoch": 3.2, "learning_rate": 8.792348921974085e-05, "loss": 0.0014, "step": 15702 }, { "epoch": 3.2, "learning_rate": 8.790584230602504e-05, "loss": 0.0084, "step": 15703 }, { "epoch": 3.2, "learning_rate": 8.788819642939893e-05, "loss": 0.0099, "step": 15704 }, { "epoch": 3.2, "learning_rate": 8.787055159015712e-05, "loss": 0.0068, "step": 15705 }, { "epoch": 3.2, "learning_rate": 8.785290778859446e-05, "loss": 0.0031, "step": 15706 }, { "epoch": 3.2, "learning_rate": 8.783526502500548e-05, "loss": 0.001, "step": 15707 }, { "epoch": 3.2, "learning_rate": 8.781762329968495e-05, "loss": 0.0034, "step": 15708 }, { "epoch": 3.2, "learning_rate": 8.779998261292748e-05, "loss": 0.0065, "step": 15709 }, { "epoch": 3.2, "learning_rate": 8.778234296502771e-05, "loss": 0.0019, "step": 15710 }, { "epoch": 3.2, "learning_rate": 8.776470435628026e-05, "loss": 0.0066, "step": 15711 }, { "epoch": 3.2, "learning_rate": 8.774706678697975e-05, "loss": 0.0014, "step": 15712 }, { "epoch": 3.2, "learning_rate": 8.772943025742067e-05, "loss": 0.0021, "step": 15713 }, { "epoch": 3.2, "learning_rate": 8.771179476789772e-05, "loss": 0.0069, "step": 15714 }, { "epoch": 3.2, "learning_rate": 8.769416031870538e-05, "loss": 0.0062, "step": 15715 }, { "epoch": 3.2, "learning_rate": 8.767652691013809e-05, "loss": 0.0011, "step": 15716 }, { "epoch": 3.2, "learning_rate": 8.765889454249053e-05, "loss": 0.0043, "step": 15717 }, { "epoch": 3.2, "learning_rate": 8.764126321605703e-05, "loss": 0.0024, "step": 15718 }, { "epoch": 3.2, "learning_rate": 8.76236329311322e-05, "loss": 0.0065, "step": 15719 }, { "epoch": 3.2, "learning_rate": 8.760600368801044e-05, "loss": 0.0053, "step": 15720 }, { "epoch": 3.2, "learning_rate": 8.758837548698616e-05, "loss": 0.0053, "step": 15721 }, { "epoch": 3.2, "learning_rate": 8.757074832835386e-05, "loss": 0.0072, "step": 15722 }, { "epoch": 3.2, "learning_rate": 8.755312221240788e-05, "loss": 0.0056, "step": 15723 }, { "epoch": 3.2, "learning_rate": 8.753549713944266e-05, "loss": 0.0027, "step": 15724 }, { "epoch": 3.2, "learning_rate": 8.751787310975253e-05, "loss": 0.0077, "step": 15725 }, { "epoch": 3.2, "learning_rate": 8.750025012363185e-05, "loss": 0.0079, "step": 15726 }, { "epoch": 3.2, "learning_rate": 8.748262818137499e-05, "loss": 0.0052, "step": 15727 }, { "epoch": 3.2, "learning_rate": 8.746500728327624e-05, "loss": 0.0025, "step": 15728 }, { "epoch": 3.2, "learning_rate": 8.744738742962991e-05, "loss": 0.0002, "step": 15729 }, { "epoch": 3.2, "learning_rate": 8.742976862073034e-05, "loss": 0.0028, "step": 15730 }, { "epoch": 3.2, "learning_rate": 8.741215085687165e-05, "loss": 0.0029, "step": 15731 }, { "epoch": 3.2, "learning_rate": 8.739453413834827e-05, "loss": 0.0003, "step": 15732 }, { "epoch": 3.2, "learning_rate": 8.737691846545426e-05, "loss": 0.0038, "step": 15733 }, { "epoch": 3.2, "learning_rate": 8.735930383848402e-05, "loss": 0.0029, "step": 15734 }, { "epoch": 3.2, "learning_rate": 8.734169025773159e-05, "loss": 0.0044, "step": 15735 }, { "epoch": 3.2, "learning_rate": 8.732407772349116e-05, "loss": 0.0047, "step": 15736 }, { "epoch": 3.2, "learning_rate": 8.730646623605704e-05, "loss": 0.0014, "step": 15737 }, { "epoch": 3.2, "learning_rate": 8.728885579572318e-05, "loss": 0.0072, "step": 15738 }, { "epoch": 3.2, "learning_rate": 8.72712464027839e-05, "loss": 0.0057, "step": 15739 }, { "epoch": 3.2, "learning_rate": 8.725363805753317e-05, "loss": 0.0008, "step": 15740 }, { "epoch": 3.21, "learning_rate": 8.723603076026512e-05, "loss": 0.0062, "step": 15741 }, { "epoch": 3.21, "learning_rate": 8.721842451127383e-05, "loss": 0.0146, "step": 15742 }, { "epoch": 3.21, "learning_rate": 8.720081931085338e-05, "loss": 0.0011, "step": 15743 }, { "epoch": 3.21, "learning_rate": 8.718321515929778e-05, "loss": 0.0042, "step": 15744 }, { "epoch": 3.21, "learning_rate": 8.716561205690105e-05, "loss": 0.0004, "step": 15745 }, { "epoch": 3.21, "learning_rate": 8.71480100039572e-05, "loss": 0.0084, "step": 15746 }, { "epoch": 3.21, "learning_rate": 8.713040900076025e-05, "loss": 0.002, "step": 15747 }, { "epoch": 3.21, "learning_rate": 8.711280904760418e-05, "loss": 0.0139, "step": 15748 }, { "epoch": 3.21, "learning_rate": 8.70952101447828e-05, "loss": 0.001, "step": 15749 }, { "epoch": 3.21, "learning_rate": 8.707761229259027e-05, "loss": 0.008, "step": 15750 }, { "epoch": 3.21, "learning_rate": 8.706001549132027e-05, "loss": 0.0034, "step": 15751 }, { "epoch": 3.21, "learning_rate": 8.704241974126696e-05, "loss": 0.0083, "step": 15752 }, { "epoch": 3.21, "learning_rate": 8.702482504272399e-05, "loss": 0.0036, "step": 15753 }, { "epoch": 3.21, "learning_rate": 8.700723139598532e-05, "loss": 0.0006, "step": 15754 }, { "epoch": 3.21, "learning_rate": 8.698963880134479e-05, "loss": 0.0014, "step": 15755 }, { "epoch": 3.21, "learning_rate": 8.697204725909626e-05, "loss": 0.0018, "step": 15756 }, { "epoch": 3.21, "learning_rate": 8.695445676953349e-05, "loss": 0.0087, "step": 15757 }, { "epoch": 3.21, "learning_rate": 8.693686733295029e-05, "loss": 0.0056, "step": 15758 }, { "epoch": 3.21, "learning_rate": 8.691927894964046e-05, "loss": 0.0067, "step": 15759 }, { "epoch": 3.21, "learning_rate": 8.690169161989775e-05, "loss": 0.0014, "step": 15760 }, { "epoch": 3.21, "learning_rate": 8.688410534401589e-05, "loss": 0.0012, "step": 15761 }, { "epoch": 3.21, "learning_rate": 8.686652012228861e-05, "loss": 0.0056, "step": 15762 }, { "epoch": 3.21, "learning_rate": 8.684893595500967e-05, "loss": 0.002, "step": 15763 }, { "epoch": 3.21, "learning_rate": 8.68313528424726e-05, "loss": 0.0041, "step": 15764 }, { "epoch": 3.21, "learning_rate": 8.681377078497129e-05, "loss": 0.0006, "step": 15765 }, { "epoch": 3.21, "learning_rate": 8.679618978279923e-05, "loss": 0.0099, "step": 15766 }, { "epoch": 3.21, "learning_rate": 8.677860983625004e-05, "loss": 0.0036, "step": 15767 }, { "epoch": 3.21, "learning_rate": 8.67610309456175e-05, "loss": 0.0049, "step": 15768 }, { "epoch": 3.21, "learning_rate": 8.674345311119503e-05, "loss": 0.0052, "step": 15769 }, { "epoch": 3.21, "learning_rate": 8.67258763332764e-05, "loss": 0.0042, "step": 15770 }, { "epoch": 3.21, "learning_rate": 8.670830061215503e-05, "loss": 0.0021, "step": 15771 }, { "epoch": 3.21, "learning_rate": 8.669072594812449e-05, "loss": 0.0078, "step": 15772 }, { "epoch": 3.21, "learning_rate": 8.667315234147836e-05, "loss": 0.0024, "step": 15773 }, { "epoch": 3.21, "learning_rate": 8.66555797925101e-05, "loss": 0.003, "step": 15774 }, { "epoch": 3.21, "learning_rate": 8.663800830151322e-05, "loss": 0.0036, "step": 15775 }, { "epoch": 3.21, "learning_rate": 8.662043786878123e-05, "loss": 0.0041, "step": 15776 }, { "epoch": 3.21, "learning_rate": 8.660286849460755e-05, "loss": 0.0072, "step": 15777 }, { "epoch": 3.21, "learning_rate": 8.658530017928564e-05, "loss": 0.0085, "step": 15778 }, { "epoch": 3.21, "learning_rate": 8.656773292310894e-05, "loss": 0.0001, "step": 15779 }, { "epoch": 3.21, "learning_rate": 8.655016672637079e-05, "loss": 0.0003, "step": 15780 }, { "epoch": 3.21, "learning_rate": 8.653260158936473e-05, "loss": 0.0008, "step": 15781 }, { "epoch": 3.21, "learning_rate": 8.651503751238389e-05, "loss": 0.0007, "step": 15782 }, { "epoch": 3.21, "learning_rate": 8.649747449572188e-05, "loss": 0.0025, "step": 15783 }, { "epoch": 3.21, "learning_rate": 8.64799125396718e-05, "loss": 0.0031, "step": 15784 }, { "epoch": 3.21, "learning_rate": 8.64623516445272e-05, "loss": 0.0063, "step": 15785 }, { "epoch": 3.21, "learning_rate": 8.644479181058119e-05, "loss": 0.0128, "step": 15786 }, { "epoch": 3.21, "learning_rate": 8.642723303812714e-05, "loss": 0.0053, "step": 15787 }, { "epoch": 3.21, "learning_rate": 8.640967532745832e-05, "loss": 0.0099, "step": 15788 }, { "epoch": 3.21, "learning_rate": 8.639211867886792e-05, "loss": 0.0053, "step": 15789 }, { "epoch": 3.22, "learning_rate": 8.637456309264925e-05, "loss": 0.0055, "step": 15790 }, { "epoch": 3.22, "learning_rate": 8.635700856909543e-05, "loss": 0.0078, "step": 15791 }, { "epoch": 3.22, "learning_rate": 8.633945510849972e-05, "loss": 0.0008, "step": 15792 }, { "epoch": 3.22, "learning_rate": 8.632190271115527e-05, "loss": 0.0052, "step": 15793 }, { "epoch": 3.22, "learning_rate": 8.630435137735532e-05, "loss": 0.0008, "step": 15794 }, { "epoch": 3.22, "learning_rate": 8.62868011073928e-05, "loss": 0.0024, "step": 15795 }, { "epoch": 3.22, "learning_rate": 8.626925190156105e-05, "loss": 0.0026, "step": 15796 }, { "epoch": 3.22, "learning_rate": 8.62517037601531e-05, "loss": 0.0028, "step": 15797 }, { "epoch": 3.22, "learning_rate": 8.623415668346202e-05, "loss": 0.0015, "step": 15798 }, { "epoch": 3.22, "learning_rate": 8.621661067178094e-05, "loss": 0.0026, "step": 15799 }, { "epoch": 3.22, "learning_rate": 8.619906572540273e-05, "loss": 0.0027, "step": 15800 }, { "epoch": 3.22, "learning_rate": 8.61815218446207e-05, "loss": 0.0044, "step": 15801 }, { "epoch": 3.22, "learning_rate": 8.61639790297276e-05, "loss": 0.0013, "step": 15802 }, { "epoch": 3.22, "learning_rate": 8.614643728101665e-05, "loss": 0.0036, "step": 15803 }, { "epoch": 3.22, "learning_rate": 8.612889659878069e-05, "loss": 0.0033, "step": 15804 }, { "epoch": 3.22, "learning_rate": 8.611135698331272e-05, "loss": 0.0016, "step": 15805 }, { "epoch": 3.22, "learning_rate": 8.609381843490567e-05, "loss": 0.0027, "step": 15806 }, { "epoch": 3.22, "learning_rate": 8.607628095385249e-05, "loss": 0.0031, "step": 15807 }, { "epoch": 3.22, "learning_rate": 8.60587445404461e-05, "loss": 0.003, "step": 15808 }, { "epoch": 3.22, "learning_rate": 8.604120919497936e-05, "loss": 0.0027, "step": 15809 }, { "epoch": 3.22, "learning_rate": 8.602367491774516e-05, "loss": 0.0002, "step": 15810 }, { "epoch": 3.22, "learning_rate": 8.600614170903633e-05, "loss": 0.0006, "step": 15811 }, { "epoch": 3.22, "learning_rate": 8.598860956914576e-05, "loss": 0.0036, "step": 15812 }, { "epoch": 3.22, "learning_rate": 8.597107849836623e-05, "loss": 0.0037, "step": 15813 }, { "epoch": 3.22, "learning_rate": 8.595354849699059e-05, "loss": 0.0066, "step": 15814 }, { "epoch": 3.22, "learning_rate": 8.59360195653115e-05, "loss": 0.0067, "step": 15815 }, { "epoch": 3.22, "learning_rate": 8.591849170362192e-05, "loss": 0.006, "step": 15816 }, { "epoch": 3.22, "learning_rate": 8.590096491221445e-05, "loss": 0.0101, "step": 15817 }, { "epoch": 3.22, "learning_rate": 8.588343919138185e-05, "loss": 0.0003, "step": 15818 }, { "epoch": 3.22, "learning_rate": 8.586591454141682e-05, "loss": 0.0058, "step": 15819 }, { "epoch": 3.22, "learning_rate": 8.584839096261204e-05, "loss": 0.0178, "step": 15820 }, { "epoch": 3.22, "learning_rate": 8.583086845526034e-05, "loss": 0.0012, "step": 15821 }, { "epoch": 3.22, "learning_rate": 8.58133470196542e-05, "loss": 0.0015, "step": 15822 }, { "epoch": 3.22, "learning_rate": 8.579582665608636e-05, "loss": 0.0058, "step": 15823 }, { "epoch": 3.22, "learning_rate": 8.577830736484937e-05, "loss": 0.0027, "step": 15824 }, { "epoch": 3.22, "learning_rate": 8.576078914623589e-05, "loss": 0.0111, "step": 15825 }, { "epoch": 3.22, "learning_rate": 8.574327200053849e-05, "loss": 0.0007, "step": 15826 }, { "epoch": 3.22, "learning_rate": 8.572575592804974e-05, "loss": 0.0067, "step": 15827 }, { "epoch": 3.22, "learning_rate": 8.570824092906217e-05, "loss": 0.0009, "step": 15828 }, { "epoch": 3.22, "learning_rate": 8.569072700386835e-05, "loss": 0.0016, "step": 15829 }, { "epoch": 3.22, "learning_rate": 8.56732141527608e-05, "loss": 0.0002, "step": 15830 }, { "epoch": 3.22, "learning_rate": 8.565570237603199e-05, "loss": 0.0069, "step": 15831 }, { "epoch": 3.22, "learning_rate": 8.563819167397447e-05, "loss": 0.0077, "step": 15832 }, { "epoch": 3.22, "learning_rate": 8.562068204688052e-05, "loss": 0.0054, "step": 15833 }, { "epoch": 3.22, "learning_rate": 8.560317349504281e-05, "loss": 0.0068, "step": 15834 }, { "epoch": 3.22, "learning_rate": 8.558566601875354e-05, "loss": 0.0067, "step": 15835 }, { "epoch": 3.22, "learning_rate": 8.556815961830538e-05, "loss": 0.0101, "step": 15836 }, { "epoch": 3.22, "learning_rate": 8.555065429399052e-05, "loss": 0.0093, "step": 15837 }, { "epoch": 3.22, "learning_rate": 8.553315004610137e-05, "loss": 0.0029, "step": 15838 }, { "epoch": 3.23, "learning_rate": 8.55156468749303e-05, "loss": 0.0096, "step": 15839 }, { "epoch": 3.23, "learning_rate": 8.549814478076966e-05, "loss": 0.0054, "step": 15840 }, { "epoch": 3.23, "learning_rate": 8.548064376391177e-05, "loss": 0.0055, "step": 15841 }, { "epoch": 3.23, "learning_rate": 8.54631438246489e-05, "loss": 0.005, "step": 15842 }, { "epoch": 3.23, "learning_rate": 8.544564496327336e-05, "loss": 0.0054, "step": 15843 }, { "epoch": 3.23, "learning_rate": 8.54281471800774e-05, "loss": 0.0057, "step": 15844 }, { "epoch": 3.23, "learning_rate": 8.541065047535332e-05, "loss": 0.0008, "step": 15845 }, { "epoch": 3.23, "learning_rate": 8.539315484939321e-05, "loss": 0.0027, "step": 15846 }, { "epoch": 3.23, "learning_rate": 8.537566030248945e-05, "loss": 0.0034, "step": 15847 }, { "epoch": 3.23, "learning_rate": 8.535816683493406e-05, "loss": 0.0028, "step": 15848 }, { "epoch": 3.23, "learning_rate": 8.534067444701936e-05, "loss": 0.0057, "step": 15849 }, { "epoch": 3.23, "learning_rate": 8.532318313903747e-05, "loss": 0.0048, "step": 15850 }, { "epoch": 3.23, "learning_rate": 8.530569291128045e-05, "loss": 0.0038, "step": 15851 }, { "epoch": 3.23, "learning_rate": 8.528820376404055e-05, "loss": 0.0023, "step": 15852 }, { "epoch": 3.23, "learning_rate": 8.52707156976097e-05, "loss": 0.0067, "step": 15853 }, { "epoch": 3.23, "learning_rate": 8.52532287122802e-05, "loss": 0.0099, "step": 15854 }, { "epoch": 3.23, "learning_rate": 8.523574280834393e-05, "loss": 0.0056, "step": 15855 }, { "epoch": 3.23, "learning_rate": 8.5218257986093e-05, "loss": 0.0023, "step": 15856 }, { "epoch": 3.23, "learning_rate": 8.520077424581947e-05, "loss": 0.0088, "step": 15857 }, { "epoch": 3.23, "learning_rate": 8.518329158781532e-05, "loss": 0.0068, "step": 15858 }, { "epoch": 3.23, "learning_rate": 8.516581001237255e-05, "loss": 0.0004, "step": 15859 }, { "epoch": 3.23, "learning_rate": 8.514832951978314e-05, "loss": 0.0057, "step": 15860 }, { "epoch": 3.23, "learning_rate": 8.513085011033904e-05, "loss": 0.0072, "step": 15861 }, { "epoch": 3.23, "learning_rate": 8.511337178433219e-05, "loss": 0.0056, "step": 15862 }, { "epoch": 3.23, "learning_rate": 8.509589454205456e-05, "loss": 0.0091, "step": 15863 }, { "epoch": 3.23, "learning_rate": 8.50784183837979e-05, "loss": 0.0181, "step": 15864 }, { "epoch": 3.23, "learning_rate": 8.506094330985432e-05, "loss": 0.011, "step": 15865 }, { "epoch": 3.23, "learning_rate": 8.504346932051545e-05, "loss": 0.0041, "step": 15866 }, { "epoch": 3.23, "learning_rate": 8.502599641607337e-05, "loss": 0.0026, "step": 15867 }, { "epoch": 3.23, "learning_rate": 8.500852459681974e-05, "loss": 0.0099, "step": 15868 }, { "epoch": 3.23, "learning_rate": 8.499105386304644e-05, "loss": 0.0074, "step": 15869 }, { "epoch": 3.23, "learning_rate": 8.497358421504524e-05, "loss": 0.0019, "step": 15870 }, { "epoch": 3.23, "learning_rate": 8.495611565310793e-05, "loss": 0.0118, "step": 15871 }, { "epoch": 3.23, "learning_rate": 8.493864817752627e-05, "loss": 0.0041, "step": 15872 }, { "epoch": 3.23, "learning_rate": 8.4921181788592e-05, "loss": 0.0082, "step": 15873 }, { "epoch": 3.23, "learning_rate": 8.490371648659684e-05, "loss": 0.0016, "step": 15874 }, { "epoch": 3.23, "learning_rate": 8.48862522718325e-05, "loss": 0.0018, "step": 15875 }, { "epoch": 3.23, "learning_rate": 8.486878914459063e-05, "loss": 0.0037, "step": 15876 }, { "epoch": 3.23, "learning_rate": 8.485132710516295e-05, "loss": 0.0029, "step": 15877 }, { "epoch": 3.23, "learning_rate": 8.483386615384115e-05, "loss": 0.0008, "step": 15878 }, { "epoch": 3.23, "learning_rate": 8.481640629091666e-05, "loss": 0.0109, "step": 15879 }, { "epoch": 3.23, "learning_rate": 8.479894751668128e-05, "loss": 0.006, "step": 15880 }, { "epoch": 3.23, "learning_rate": 8.478148983142657e-05, "loss": 0.0121, "step": 15881 }, { "epoch": 3.23, "learning_rate": 8.476403323544408e-05, "loss": 0.0093, "step": 15882 }, { "epoch": 3.23, "learning_rate": 8.474657772902545e-05, "loss": 0.0031, "step": 15883 }, { "epoch": 3.23, "learning_rate": 8.4729123312462e-05, "loss": 0.006, "step": 15884 }, { "epoch": 3.23, "learning_rate": 8.471166998604553e-05, "loss": 0.0086, "step": 15885 }, { "epoch": 3.23, "learning_rate": 8.46942177500673e-05, "loss": 0.004, "step": 15886 }, { "epoch": 3.23, "learning_rate": 8.467676660481903e-05, "loss": 0.0012, "step": 15887 }, { "epoch": 3.24, "learning_rate": 8.465931655059199e-05, "loss": 0.0044, "step": 15888 }, { "epoch": 3.24, "learning_rate": 8.46418675876777e-05, "loss": 0.0013, "step": 15889 }, { "epoch": 3.24, "learning_rate": 8.462441971636761e-05, "loss": 0.0044, "step": 15890 }, { "epoch": 3.24, "learning_rate": 8.460697293695311e-05, "loss": 0.0046, "step": 15891 }, { "epoch": 3.24, "learning_rate": 8.45895272497256e-05, "loss": 0.0199, "step": 15892 }, { "epoch": 3.24, "learning_rate": 8.457208265497645e-05, "loss": 0.0113, "step": 15893 }, { "epoch": 3.24, "learning_rate": 8.455463915299703e-05, "loss": 0.002, "step": 15894 }, { "epoch": 3.24, "learning_rate": 8.453719674407866e-05, "loss": 0.0019, "step": 15895 }, { "epoch": 3.24, "learning_rate": 8.451975542851275e-05, "loss": 0.0039, "step": 15896 }, { "epoch": 3.24, "learning_rate": 8.45023152065904e-05, "loss": 0.0007, "step": 15897 }, { "epoch": 3.24, "learning_rate": 8.448487607860314e-05, "loss": 0.0138, "step": 15898 }, { "epoch": 3.24, "learning_rate": 8.446743804484199e-05, "loss": 0.0036, "step": 15899 }, { "epoch": 3.24, "learning_rate": 8.445000110559846e-05, "loss": 0.0017, "step": 15900 }, { "epoch": 3.24, "learning_rate": 8.443256526116361e-05, "loss": 0.0053, "step": 15901 }, { "epoch": 3.24, "learning_rate": 8.44151305118286e-05, "loss": 0.0027, "step": 15902 }, { "epoch": 3.24, "learning_rate": 8.439769685788482e-05, "loss": 0.0014, "step": 15903 }, { "epoch": 3.24, "learning_rate": 8.438026429962323e-05, "loss": 0.0036, "step": 15904 }, { "epoch": 3.24, "learning_rate": 8.43628328373352e-05, "loss": 0.0025, "step": 15905 }, { "epoch": 3.24, "learning_rate": 8.434540247131171e-05, "loss": 0.0011, "step": 15906 }, { "epoch": 3.24, "learning_rate": 8.432797320184392e-05, "loss": 0.0005, "step": 15907 }, { "epoch": 3.24, "learning_rate": 8.431054502922296e-05, "loss": 0.0049, "step": 15908 }, { "epoch": 3.24, "learning_rate": 8.42931179537399e-05, "loss": 0.0049, "step": 15909 }, { "epoch": 3.24, "learning_rate": 8.427569197568579e-05, "loss": 0.0108, "step": 15910 }, { "epoch": 3.24, "learning_rate": 8.425826709535167e-05, "loss": 0.021, "step": 15911 }, { "epoch": 3.24, "learning_rate": 8.424084331302861e-05, "loss": 0.0089, "step": 15912 }, { "epoch": 3.24, "learning_rate": 8.422342062900759e-05, "loss": 0.0126, "step": 15913 }, { "epoch": 3.24, "learning_rate": 8.420599904357967e-05, "loss": 0.002, "step": 15914 }, { "epoch": 3.24, "learning_rate": 8.418857855703564e-05, "loss": 0.0063, "step": 15915 }, { "epoch": 3.24, "learning_rate": 8.417115916966668e-05, "loss": 0.0084, "step": 15916 }, { "epoch": 3.24, "learning_rate": 8.415374088176352e-05, "loss": 0.0039, "step": 15917 }, { "epoch": 3.24, "learning_rate": 8.41363236936173e-05, "loss": 0.0015, "step": 15918 }, { "epoch": 3.24, "learning_rate": 8.411890760551873e-05, "loss": 0.0006, "step": 15919 }, { "epoch": 3.24, "learning_rate": 8.410149261775879e-05, "loss": 0.0014, "step": 15920 }, { "epoch": 3.24, "learning_rate": 8.408407873062826e-05, "loss": 0.0021, "step": 15921 }, { "epoch": 3.24, "learning_rate": 8.406666594441809e-05, "loss": 0.0016, "step": 15922 }, { "epoch": 3.24, "learning_rate": 8.404925425941904e-05, "loss": 0.0005, "step": 15923 }, { "epoch": 3.24, "learning_rate": 8.403184367592194e-05, "loss": 0.008, "step": 15924 }, { "epoch": 3.24, "learning_rate": 8.401443419421757e-05, "loss": 0.0003, "step": 15925 }, { "epoch": 3.24, "learning_rate": 8.39970258145967e-05, "loss": 0.0078, "step": 15926 }, { "epoch": 3.24, "learning_rate": 8.39796185373501e-05, "loss": 0.009, "step": 15927 }, { "epoch": 3.24, "learning_rate": 8.396221236276849e-05, "loss": 0.0035, "step": 15928 }, { "epoch": 3.24, "learning_rate": 8.394480729114265e-05, "loss": 0.0041, "step": 15929 }, { "epoch": 3.24, "learning_rate": 8.39274033227631e-05, "loss": 0.0066, "step": 15930 }, { "epoch": 3.24, "learning_rate": 8.391000045792074e-05, "loss": 0.0051, "step": 15931 }, { "epoch": 3.24, "learning_rate": 8.3892598696906e-05, "loss": 0.0111, "step": 15932 }, { "epoch": 3.24, "learning_rate": 8.387519804000974e-05, "loss": 0.0036, "step": 15933 }, { "epoch": 3.24, "learning_rate": 8.385779848752253e-05, "loss": 0.0066, "step": 15934 }, { "epoch": 3.24, "learning_rate": 8.384040003973483e-05, "loss": 0.0213, "step": 15935 }, { "epoch": 3.24, "learning_rate": 8.382300269693744e-05, "loss": 0.0059, "step": 15936 }, { "epoch": 3.25, "learning_rate": 8.380560645942077e-05, "loss": 0.0039, "step": 15937 }, { "epoch": 3.25, "learning_rate": 8.378821132747543e-05, "loss": 0.0054, "step": 15938 }, { "epoch": 3.25, "learning_rate": 8.377081730139192e-05, "loss": 0.0028, "step": 15939 }, { "epoch": 3.25, "learning_rate": 8.375342438146078e-05, "loss": 0.0005, "step": 15940 }, { "epoch": 3.25, "learning_rate": 8.373603256797253e-05, "loss": 0.0033, "step": 15941 }, { "epoch": 3.25, "learning_rate": 8.37186418612176e-05, "loss": 0.0077, "step": 15942 }, { "epoch": 3.25, "learning_rate": 8.370125226148647e-05, "loss": 0.0066, "step": 15943 }, { "epoch": 3.25, "learning_rate": 8.36838637690696e-05, "loss": 0.0026, "step": 15944 }, { "epoch": 3.25, "learning_rate": 8.366647638425735e-05, "loss": 0.0114, "step": 15945 }, { "epoch": 3.25, "learning_rate": 8.364909010734015e-05, "loss": 0.0083, "step": 15946 }, { "epoch": 3.25, "learning_rate": 8.363170493860849e-05, "loss": 0.0018, "step": 15947 }, { "epoch": 3.25, "learning_rate": 8.36143208783525e-05, "loss": 0.0003, "step": 15948 }, { "epoch": 3.25, "learning_rate": 8.359693792686277e-05, "loss": 0.008, "step": 15949 }, { "epoch": 3.25, "learning_rate": 8.35795560844294e-05, "loss": 0.0106, "step": 15950 }, { "epoch": 3.25, "learning_rate": 8.356217535134295e-05, "loss": 0.0014, "step": 15951 }, { "epoch": 3.25, "learning_rate": 8.354479572789354e-05, "loss": 0.0036, "step": 15952 }, { "epoch": 3.25, "learning_rate": 8.352741721437146e-05, "loss": 0.0166, "step": 15953 }, { "epoch": 3.25, "learning_rate": 8.351003981106699e-05, "loss": 0.0072, "step": 15954 }, { "epoch": 3.25, "learning_rate": 8.349266351827034e-05, "loss": 0.0069, "step": 15955 }, { "epoch": 3.25, "learning_rate": 8.347528833627182e-05, "loss": 0.0075, "step": 15956 }, { "epoch": 3.25, "learning_rate": 8.345791426536152e-05, "loss": 0.0105, "step": 15957 }, { "epoch": 3.25, "learning_rate": 8.344054130582966e-05, "loss": 0.0154, "step": 15958 }, { "epoch": 3.25, "learning_rate": 8.342316945796641e-05, "loss": 0.0011, "step": 15959 }, { "epoch": 3.25, "learning_rate": 8.340579872206188e-05, "loss": 0.0036, "step": 15960 }, { "epoch": 3.25, "learning_rate": 8.338842909840623e-05, "loss": 0.0024, "step": 15961 }, { "epoch": 3.25, "learning_rate": 8.337106058728956e-05, "loss": 0.0034, "step": 15962 }, { "epoch": 3.25, "learning_rate": 8.335369318900193e-05, "loss": 0.01, "step": 15963 }, { "epoch": 3.25, "learning_rate": 8.333632690383345e-05, "loss": 0.0069, "step": 15964 }, { "epoch": 3.25, "learning_rate": 8.331896173207418e-05, "loss": 0.0007, "step": 15965 }, { "epoch": 3.25, "learning_rate": 8.330159767401403e-05, "loss": 0.001, "step": 15966 }, { "epoch": 3.25, "learning_rate": 8.328423472994319e-05, "loss": 0.0024, "step": 15967 }, { "epoch": 3.25, "learning_rate": 8.326687290015146e-05, "loss": 0.0081, "step": 15968 }, { "epoch": 3.25, "learning_rate": 8.324951218492905e-05, "loss": 0.0036, "step": 15969 }, { "epoch": 3.25, "learning_rate": 8.323215258456572e-05, "loss": 0.0006, "step": 15970 }, { "epoch": 3.25, "learning_rate": 8.321479409935145e-05, "loss": 0.0102, "step": 15971 }, { "epoch": 3.25, "learning_rate": 8.31974367295762e-05, "loss": 0.0058, "step": 15972 }, { "epoch": 3.25, "learning_rate": 8.318008047552989e-05, "loss": 0.01, "step": 15973 }, { "epoch": 3.25, "learning_rate": 8.316272533750233e-05, "loss": 0.004, "step": 15974 }, { "epoch": 3.25, "learning_rate": 8.314537131578344e-05, "loss": 0.0103, "step": 15975 }, { "epoch": 3.25, "learning_rate": 8.312801841066303e-05, "loss": 0.0128, "step": 15976 }, { "epoch": 3.25, "learning_rate": 8.311066662243096e-05, "loss": 0.0077, "step": 15977 }, { "epoch": 3.25, "learning_rate": 8.309331595137698e-05, "loss": 0.0015, "step": 15978 }, { "epoch": 3.25, "learning_rate": 8.307596639779096e-05, "loss": 0.0034, "step": 15979 }, { "epoch": 3.25, "learning_rate": 8.305861796196268e-05, "loss": 0.0041, "step": 15980 }, { "epoch": 3.25, "learning_rate": 8.304127064418171e-05, "loss": 0.0096, "step": 15981 }, { "epoch": 3.25, "learning_rate": 8.302392444473805e-05, "loss": 0.0033, "step": 15982 }, { "epoch": 3.25, "learning_rate": 8.300657936392116e-05, "loss": 0.0055, "step": 15983 }, { "epoch": 3.25, "learning_rate": 8.298923540202094e-05, "loss": 0.0015, "step": 15984 }, { "epoch": 3.25, "learning_rate": 8.297189255932695e-05, "loss": 0.0018, "step": 15985 }, { "epoch": 3.26, "learning_rate": 8.295455083612882e-05, "loss": 0.0037, "step": 15986 }, { "epoch": 3.26, "learning_rate": 8.293721023271636e-05, "loss": 0.0036, "step": 15987 }, { "epoch": 3.26, "learning_rate": 8.291987074937901e-05, "loss": 0.0029, "step": 15988 }, { "epoch": 3.26, "learning_rate": 8.290253238640646e-05, "loss": 0.0024, "step": 15989 }, { "epoch": 3.26, "learning_rate": 8.288519514408828e-05, "loss": 0.0007, "step": 15990 }, { "epoch": 3.26, "learning_rate": 8.2867859022714e-05, "loss": 0.0035, "step": 15991 }, { "epoch": 3.26, "learning_rate": 8.285052402257321e-05, "loss": 0.005, "step": 15992 }, { "epoch": 3.26, "learning_rate": 8.283319014395543e-05, "loss": 0.0027, "step": 15993 }, { "epoch": 3.26, "learning_rate": 8.281585738715014e-05, "loss": 0.0057, "step": 15994 }, { "epoch": 3.26, "learning_rate": 8.279852575244687e-05, "loss": 0.0092, "step": 15995 }, { "epoch": 3.26, "learning_rate": 8.278119524013507e-05, "loss": 0.0043, "step": 15996 }, { "epoch": 3.26, "learning_rate": 8.276386585050419e-05, "loss": 0.0044, "step": 15997 }, { "epoch": 3.26, "learning_rate": 8.274653758384372e-05, "loss": 0.0023, "step": 15998 }, { "epoch": 3.26, "learning_rate": 8.27292104404429e-05, "loss": 0.0004, "step": 15999 }, { "epoch": 3.26, "learning_rate": 8.27118844205914e-05, "loss": 0.018, "step": 16000 }, { "epoch": 3.26, "learning_rate": 8.269455952457831e-05, "loss": 0.0022, "step": 16001 }, { "epoch": 3.26, "learning_rate": 8.267723575269323e-05, "loss": 0.0008, "step": 16002 }, { "epoch": 3.26, "learning_rate": 8.265991310522534e-05, "loss": 0.0034, "step": 16003 }, { "epoch": 3.26, "learning_rate": 8.264259158246402e-05, "loss": 0.0049, "step": 16004 }, { "epoch": 3.26, "learning_rate": 8.262527118469855e-05, "loss": 0.0049, "step": 16005 }, { "epoch": 3.26, "learning_rate": 8.260795191221826e-05, "loss": 0.0133, "step": 16006 }, { "epoch": 3.26, "learning_rate": 8.259063376531236e-05, "loss": 0.0016, "step": 16007 }, { "epoch": 3.26, "learning_rate": 8.257331674427012e-05, "loss": 0.0012, "step": 16008 }, { "epoch": 3.26, "learning_rate": 8.255600084938079e-05, "loss": 0.0058, "step": 16009 }, { "epoch": 3.26, "learning_rate": 8.253868608093354e-05, "loss": 0.0075, "step": 16010 }, { "epoch": 3.26, "learning_rate": 8.252137243921761e-05, "loss": 0.0082, "step": 16011 }, { "epoch": 3.26, "learning_rate": 8.250405992452206e-05, "loss": 0.0051, "step": 16012 }, { "epoch": 3.26, "learning_rate": 8.248674853713621e-05, "loss": 0.0019, "step": 16013 }, { "epoch": 3.26, "learning_rate": 8.246943827734897e-05, "loss": 0.0053, "step": 16014 }, { "epoch": 3.26, "learning_rate": 8.245212914544968e-05, "loss": 0.0114, "step": 16015 }, { "epoch": 3.26, "learning_rate": 8.243482114172739e-05, "loss": 0.0026, "step": 16016 }, { "epoch": 3.26, "learning_rate": 8.241751426647098e-05, "loss": 0.0053, "step": 16017 }, { "epoch": 3.26, "learning_rate": 8.240020851996979e-05, "loss": 0.0008, "step": 16018 }, { "epoch": 3.26, "learning_rate": 8.23829039025126e-05, "loss": 0.0169, "step": 16019 }, { "epoch": 3.26, "learning_rate": 8.236560041438866e-05, "loss": 0.0023, "step": 16020 }, { "epoch": 3.26, "learning_rate": 8.234829805588681e-05, "loss": 0.003, "step": 16021 }, { "epoch": 3.26, "learning_rate": 8.233099682729609e-05, "loss": 0.0044, "step": 16022 }, { "epoch": 3.26, "learning_rate": 8.231369672890545e-05, "loss": 0.0036, "step": 16023 }, { "epoch": 3.26, "learning_rate": 8.229639776100386e-05, "loss": 0.0011, "step": 16024 }, { "epoch": 3.26, "learning_rate": 8.227909992388021e-05, "loss": 0.0083, "step": 16025 }, { "epoch": 3.26, "learning_rate": 8.226180321782342e-05, "loss": 0.0062, "step": 16026 }, { "epoch": 3.26, "learning_rate": 8.22445076431224e-05, "loss": 0.0019, "step": 16027 }, { "epoch": 3.26, "learning_rate": 8.222721320006598e-05, "loss": 0.005, "step": 16028 }, { "epoch": 3.26, "learning_rate": 8.220991988894303e-05, "loss": 0.0059, "step": 16029 }, { "epoch": 3.26, "learning_rate": 8.21926277100424e-05, "loss": 0.0111, "step": 16030 }, { "epoch": 3.26, "learning_rate": 8.217533666365292e-05, "loss": 0.0081, "step": 16031 }, { "epoch": 3.26, "learning_rate": 8.215804675006323e-05, "loss": 0.0085, "step": 16032 }, { "epoch": 3.26, "learning_rate": 8.214075796956236e-05, "loss": 0.0015, "step": 16033 }, { "epoch": 3.26, "learning_rate": 8.212347032243878e-05, "loss": 0.01, "step": 16034 }, { "epoch": 3.27, "learning_rate": 8.210618380898151e-05, "loss": 0.0008, "step": 16035 }, { "epoch": 3.27, "learning_rate": 8.208889842947905e-05, "loss": 0.0098, "step": 16036 }, { "epoch": 3.27, "learning_rate": 8.207161418422019e-05, "loss": 0.0029, "step": 16037 }, { "epoch": 3.27, "learning_rate": 8.20543310734936e-05, "loss": 0.0009, "step": 16038 }, { "epoch": 3.27, "learning_rate": 8.203704909758792e-05, "loss": 0.0012, "step": 16039 }, { "epoch": 3.27, "learning_rate": 8.201976825679183e-05, "loss": 0.0011, "step": 16040 }, { "epoch": 3.27, "learning_rate": 8.200248855139393e-05, "loss": 0.0028, "step": 16041 }, { "epoch": 3.27, "learning_rate": 8.198520998168282e-05, "loss": 0.0031, "step": 16042 }, { "epoch": 3.27, "learning_rate": 8.196793254794709e-05, "loss": 0.0099, "step": 16043 }, { "epoch": 3.27, "learning_rate": 8.195065625047536e-05, "loss": 0.0076, "step": 16044 }, { "epoch": 3.27, "learning_rate": 8.1933381089556e-05, "loss": 0.0191, "step": 16045 }, { "epoch": 3.27, "learning_rate": 8.191610706547776e-05, "loss": 0.0159, "step": 16046 }, { "epoch": 3.27, "learning_rate": 8.189883417852901e-05, "loss": 0.0041, "step": 16047 }, { "epoch": 3.27, "learning_rate": 8.188156242899828e-05, "loss": 0.0104, "step": 16048 }, { "epoch": 3.27, "learning_rate": 8.186429181717412e-05, "loss": 0.007, "step": 16049 }, { "epoch": 3.27, "learning_rate": 8.184702234334476e-05, "loss": 0.0039, "step": 16050 }, { "epoch": 3.27, "learning_rate": 8.18297540077989e-05, "loss": 0.0062, "step": 16051 }, { "epoch": 3.27, "learning_rate": 8.181248681082472e-05, "loss": 0.0015, "step": 16052 }, { "epoch": 3.27, "learning_rate": 8.179522075271084e-05, "loss": 0.0078, "step": 16053 }, { "epoch": 3.27, "learning_rate": 8.177795583374545e-05, "loss": 0.0025, "step": 16054 }, { "epoch": 3.27, "learning_rate": 8.176069205421698e-05, "loss": 0.0086, "step": 16055 }, { "epoch": 3.27, "learning_rate": 8.174342941441377e-05, "loss": 0.0036, "step": 16056 }, { "epoch": 3.27, "learning_rate": 8.172616791462412e-05, "loss": 0.0017, "step": 16057 }, { "epoch": 3.27, "learning_rate": 8.170890755513635e-05, "loss": 0.0062, "step": 16058 }, { "epoch": 3.27, "learning_rate": 8.169164833623874e-05, "loss": 0.0042, "step": 16059 }, { "epoch": 3.27, "learning_rate": 8.167439025821954e-05, "loss": 0.0078, "step": 16060 }, { "epoch": 3.27, "learning_rate": 8.165713332136699e-05, "loss": 0.0031, "step": 16061 }, { "epoch": 3.27, "learning_rate": 8.163987752596938e-05, "loss": 0.0006, "step": 16062 }, { "epoch": 3.27, "learning_rate": 8.162262287231473e-05, "loss": 0.0003, "step": 16063 }, { "epoch": 3.27, "learning_rate": 8.16053693606915e-05, "loss": 0.0073, "step": 16064 }, { "epoch": 3.27, "learning_rate": 8.158811699138754e-05, "loss": 0.0029, "step": 16065 }, { "epoch": 3.27, "learning_rate": 8.157086576469131e-05, "loss": 0.0044, "step": 16066 }, { "epoch": 3.27, "learning_rate": 8.155361568089073e-05, "loss": 0.003, "step": 16067 }, { "epoch": 3.27, "learning_rate": 8.153636674027389e-05, "loss": 0.0106, "step": 16068 }, { "epoch": 3.27, "learning_rate": 8.151911894312911e-05, "loss": 0.0068, "step": 16069 }, { "epoch": 3.27, "learning_rate": 8.150187228974418e-05, "loss": 0.0016, "step": 16070 }, { "epoch": 3.27, "learning_rate": 8.148462678040738e-05, "loss": 0.0125, "step": 16071 }, { "epoch": 3.27, "learning_rate": 8.146738241540662e-05, "loss": 0.0028, "step": 16072 }, { "epoch": 3.27, "learning_rate": 8.145013919502992e-05, "loss": 0.0071, "step": 16073 }, { "epoch": 3.27, "learning_rate": 8.14328971195653e-05, "loss": 0.0036, "step": 16074 }, { "epoch": 3.27, "learning_rate": 8.141565618930071e-05, "loss": 0.0052, "step": 16075 }, { "epoch": 3.27, "learning_rate": 8.139841640452414e-05, "loss": 0.0137, "step": 16076 }, { "epoch": 3.27, "learning_rate": 8.138117776552349e-05, "loss": 0.0028, "step": 16077 }, { "epoch": 3.27, "learning_rate": 8.136394027258672e-05, "loss": 0.0053, "step": 16078 }, { "epoch": 3.27, "learning_rate": 8.13467039260017e-05, "loss": 0.0102, "step": 16079 }, { "epoch": 3.27, "learning_rate": 8.132946872605632e-05, "loss": 0.0012, "step": 16080 }, { "epoch": 3.27, "learning_rate": 8.131223467303844e-05, "loss": 0.0022, "step": 16081 }, { "epoch": 3.27, "learning_rate": 8.129500176723596e-05, "loss": 0.0025, "step": 16082 }, { "epoch": 3.27, "learning_rate": 8.12777700089365e-05, "loss": 0.0039, "step": 16083 }, { "epoch": 3.28, "learning_rate": 8.126053939842812e-05, "loss": 0.0046, "step": 16084 }, { "epoch": 3.28, "learning_rate": 8.12433099359984e-05, "loss": 0.0175, "step": 16085 }, { "epoch": 3.28, "learning_rate": 8.12260816219353e-05, "loss": 0.006, "step": 16086 }, { "epoch": 3.28, "learning_rate": 8.120885445652639e-05, "loss": 0.0083, "step": 16087 }, { "epoch": 3.28, "learning_rate": 8.119162844005946e-05, "loss": 0.0025, "step": 16088 }, { "epoch": 3.28, "learning_rate": 8.117440357282223e-05, "loss": 0.0024, "step": 16089 }, { "epoch": 3.28, "learning_rate": 8.115717985510238e-05, "loss": 0.0082, "step": 16090 }, { "epoch": 3.28, "learning_rate": 8.113995728718756e-05, "loss": 0.0031, "step": 16091 }, { "epoch": 3.28, "learning_rate": 8.112273586936544e-05, "loss": 0.0078, "step": 16092 }, { "epoch": 3.28, "learning_rate": 8.110551560192365e-05, "loss": 0.0049, "step": 16093 }, { "epoch": 3.28, "learning_rate": 8.10882964851498e-05, "loss": 0.0075, "step": 16094 }, { "epoch": 3.28, "learning_rate": 8.107107851933154e-05, "loss": 0.0029, "step": 16095 }, { "epoch": 3.28, "learning_rate": 8.105386170475627e-05, "loss": 0.0074, "step": 16096 }, { "epoch": 3.28, "learning_rate": 8.103664604171176e-05, "loss": 0.0047, "step": 16097 }, { "epoch": 3.28, "learning_rate": 8.101943153048531e-05, "loss": 0.0042, "step": 16098 }, { "epoch": 3.28, "learning_rate": 8.100221817136464e-05, "loss": 0.0019, "step": 16099 }, { "epoch": 3.28, "learning_rate": 8.098500596463722e-05, "loss": 0.0017, "step": 16100 }, { "epoch": 3.28, "learning_rate": 8.096779491059037e-05, "loss": 0.0042, "step": 16101 }, { "epoch": 3.28, "learning_rate": 8.095058500951176e-05, "loss": 0.0049, "step": 16102 }, { "epoch": 3.28, "learning_rate": 8.09333762616886e-05, "loss": 0.0021, "step": 16103 }, { "epoch": 3.28, "learning_rate": 8.091616866740855e-05, "loss": 0.001, "step": 16104 }, { "epoch": 3.28, "learning_rate": 8.089896222695882e-05, "loss": 0.0204, "step": 16105 }, { "epoch": 3.28, "learning_rate": 8.088175694062686e-05, "loss": 0.0044, "step": 16106 }, { "epoch": 3.28, "learning_rate": 8.086455280870005e-05, "loss": 0.0046, "step": 16107 }, { "epoch": 3.28, "learning_rate": 8.08473498314657e-05, "loss": 0.0182, "step": 16108 }, { "epoch": 3.28, "learning_rate": 8.083014800921114e-05, "loss": 0.0091, "step": 16109 }, { "epoch": 3.28, "learning_rate": 8.081294734222367e-05, "loss": 0.0048, "step": 16110 }, { "epoch": 3.28, "learning_rate": 8.079574783079058e-05, "loss": 0.0018, "step": 16111 }, { "epoch": 3.28, "learning_rate": 8.077854947519915e-05, "loss": 0.0051, "step": 16112 }, { "epoch": 3.28, "learning_rate": 8.076135227573665e-05, "loss": 0.0044, "step": 16113 }, { "epoch": 3.28, "learning_rate": 8.074415623269015e-05, "loss": 0.0105, "step": 16114 }, { "epoch": 3.28, "learning_rate": 8.072696134634709e-05, "loss": 0.0005, "step": 16115 }, { "epoch": 3.28, "learning_rate": 8.070976761699443e-05, "loss": 0.008, "step": 16116 }, { "epoch": 3.28, "learning_rate": 8.069257504491957e-05, "loss": 0.0066, "step": 16117 }, { "epoch": 3.28, "learning_rate": 8.067538363040944e-05, "loss": 0.0015, "step": 16118 }, { "epoch": 3.28, "learning_rate": 8.065819337375127e-05, "loss": 0.0055, "step": 16119 }, { "epoch": 3.28, "learning_rate": 8.064100427523218e-05, "loss": 0.0013, "step": 16120 }, { "epoch": 3.28, "learning_rate": 8.062381633513918e-05, "loss": 0.0058, "step": 16121 }, { "epoch": 3.28, "learning_rate": 8.060662955375953e-05, "loss": 0.0101, "step": 16122 }, { "epoch": 3.28, "learning_rate": 8.058944393138007e-05, "loss": 0.0066, "step": 16123 }, { "epoch": 3.28, "learning_rate": 8.057225946828795e-05, "loss": 0.0015, "step": 16124 }, { "epoch": 3.28, "learning_rate": 8.055507616477013e-05, "loss": 0.0036, "step": 16125 }, { "epoch": 3.28, "learning_rate": 8.053789402111364e-05, "loss": 0.0079, "step": 16126 }, { "epoch": 3.28, "learning_rate": 8.052071303760541e-05, "loss": 0.0018, "step": 16127 }, { "epoch": 3.28, "learning_rate": 8.050353321453245e-05, "loss": 0.0034, "step": 16128 }, { "epoch": 3.28, "learning_rate": 8.048635455218166e-05, "loss": 0.0116, "step": 16129 }, { "epoch": 3.28, "learning_rate": 8.046917705083998e-05, "loss": 0.0022, "step": 16130 }, { "epoch": 3.28, "learning_rate": 8.045200071079427e-05, "loss": 0.0055, "step": 16131 }, { "epoch": 3.28, "learning_rate": 8.043482553233144e-05, "loss": 0.007, "step": 16132 }, { "epoch": 3.28, "learning_rate": 8.04176515157384e-05, "loss": 0.0035, "step": 16133 }, { "epoch": 3.29, "learning_rate": 8.040047866130179e-05, "loss": 0.0064, "step": 16134 }, { "epoch": 3.29, "learning_rate": 8.038330696930869e-05, "loss": 0.0016, "step": 16135 }, { "epoch": 3.29, "learning_rate": 8.036613644004574e-05, "loss": 0.0032, "step": 16136 }, { "epoch": 3.29, "learning_rate": 8.034896707379973e-05, "loss": 0.0018, "step": 16137 }, { "epoch": 3.29, "learning_rate": 8.033179887085745e-05, "loss": 0.0022, "step": 16138 }, { "epoch": 3.29, "learning_rate": 8.031463183150563e-05, "loss": 0.0012, "step": 16139 }, { "epoch": 3.29, "learning_rate": 8.029746595603101e-05, "loss": 0.0023, "step": 16140 }, { "epoch": 3.29, "learning_rate": 8.028030124472027e-05, "loss": 0.0088, "step": 16141 }, { "epoch": 3.29, "learning_rate": 8.026313769786011e-05, "loss": 0.0031, "step": 16142 }, { "epoch": 3.29, "learning_rate": 8.02459753157372e-05, "loss": 0.0086, "step": 16143 }, { "epoch": 3.29, "learning_rate": 8.022881409863817e-05, "loss": 0.0055, "step": 16144 }, { "epoch": 3.29, "learning_rate": 8.021165404684963e-05, "loss": 0.0053, "step": 16145 }, { "epoch": 3.29, "learning_rate": 8.019449516065827e-05, "loss": 0.0035, "step": 16146 }, { "epoch": 3.29, "learning_rate": 8.01773374403505e-05, "loss": 0.002, "step": 16147 }, { "epoch": 3.29, "learning_rate": 8.01601808862131e-05, "loss": 0.0047, "step": 16148 }, { "epoch": 3.29, "learning_rate": 8.01430254985324e-05, "loss": 0.0005, "step": 16149 }, { "epoch": 3.29, "learning_rate": 8.012587127759515e-05, "loss": 0.001, "step": 16150 }, { "epoch": 3.29, "learning_rate": 8.010871822368769e-05, "loss": 0.0095, "step": 16151 }, { "epoch": 3.29, "learning_rate": 8.009156633709651e-05, "loss": 0.0045, "step": 16152 }, { "epoch": 3.29, "learning_rate": 8.007441561810825e-05, "loss": 0.011, "step": 16153 }, { "epoch": 3.29, "learning_rate": 8.00572660670091e-05, "loss": 0.0034, "step": 16154 }, { "epoch": 3.29, "learning_rate": 8.00401176840858e-05, "loss": 0.0014, "step": 16155 }, { "epoch": 3.29, "learning_rate": 8.002297046962452e-05, "loss": 0.0048, "step": 16156 }, { "epoch": 3.29, "learning_rate": 8.00058244239117e-05, "loss": 0.0047, "step": 16157 }, { "epoch": 3.29, "learning_rate": 7.998867954723374e-05, "loss": 0.0063, "step": 16158 }, { "epoch": 3.29, "learning_rate": 7.997153583987698e-05, "loss": 0.0029, "step": 16159 }, { "epoch": 3.29, "learning_rate": 7.995439330212779e-05, "loss": 0.0085, "step": 16160 }, { "epoch": 3.29, "learning_rate": 7.993725193427244e-05, "loss": 0.0117, "step": 16161 }, { "epoch": 3.29, "learning_rate": 7.992011173659722e-05, "loss": 0.0008, "step": 16162 }, { "epoch": 3.29, "learning_rate": 7.990297270938844e-05, "loss": 0.0052, "step": 16163 }, { "epoch": 3.29, "learning_rate": 7.988583485293239e-05, "loss": 0.0139, "step": 16164 }, { "epoch": 3.29, "learning_rate": 7.986869816751512e-05, "loss": 0.0027, "step": 16165 }, { "epoch": 3.29, "learning_rate": 7.98515626534231e-05, "loss": 0.007, "step": 16166 }, { "epoch": 3.29, "learning_rate": 7.983442831094226e-05, "loss": 0.0064, "step": 16167 }, { "epoch": 3.29, "learning_rate": 7.981729514035906e-05, "loss": 0.0026, "step": 16168 }, { "epoch": 3.29, "learning_rate": 7.980016314195944e-05, "loss": 0.0032, "step": 16169 }, { "epoch": 3.29, "learning_rate": 7.97830323160296e-05, "loss": 0.0084, "step": 16170 }, { "epoch": 3.29, "learning_rate": 7.976590266285567e-05, "loss": 0.003, "step": 16171 }, { "epoch": 3.29, "learning_rate": 7.974877418272376e-05, "loss": 0.0119, "step": 16172 }, { "epoch": 3.29, "learning_rate": 7.973164687591991e-05, "loss": 0.0044, "step": 16173 }, { "epoch": 3.29, "learning_rate": 7.971452074273019e-05, "loss": 0.0059, "step": 16174 }, { "epoch": 3.29, "learning_rate": 7.969739578344064e-05, "loss": 0.0008, "step": 16175 }, { "epoch": 3.29, "learning_rate": 7.968027199833732e-05, "loss": 0.0005, "step": 16176 }, { "epoch": 3.29, "learning_rate": 7.966314938770617e-05, "loss": 0.0019, "step": 16177 }, { "epoch": 3.29, "learning_rate": 7.96460279518332e-05, "loss": 0.0003, "step": 16178 }, { "epoch": 3.29, "learning_rate": 7.962890769100444e-05, "loss": 0.0028, "step": 16179 }, { "epoch": 3.29, "learning_rate": 7.961178860550563e-05, "loss": 0.0002, "step": 16180 }, { "epoch": 3.29, "learning_rate": 7.959467069562287e-05, "loss": 0.0146, "step": 16181 }, { "epoch": 3.29, "learning_rate": 7.957755396164201e-05, "loss": 0.0026, "step": 16182 }, { "epoch": 3.3, "learning_rate": 7.956043840384893e-05, "loss": 0.0036, "step": 16183 }, { "epoch": 3.3, "learning_rate": 7.954332402252956e-05, "loss": 0.0073, "step": 16184 }, { "epoch": 3.3, "learning_rate": 7.952621081796955e-05, "loss": 0.0236, "step": 16185 }, { "epoch": 3.3, "learning_rate": 7.950909879045497e-05, "loss": 0.003, "step": 16186 }, { "epoch": 3.3, "learning_rate": 7.949198794027144e-05, "loss": 0.002, "step": 16187 }, { "epoch": 3.3, "learning_rate": 7.947487826770478e-05, "loss": 0.0034, "step": 16188 }, { "epoch": 3.3, "learning_rate": 7.945776977304082e-05, "loss": 0.0021, "step": 16189 }, { "epoch": 3.3, "learning_rate": 7.944066245656524e-05, "loss": 0.0082, "step": 16190 }, { "epoch": 3.3, "learning_rate": 7.942355631856381e-05, "loss": 0.0007, "step": 16191 }, { "epoch": 3.3, "learning_rate": 7.940645135932218e-05, "loss": 0.0024, "step": 16192 }, { "epoch": 3.3, "learning_rate": 7.938934757912608e-05, "loss": 0.0009, "step": 16193 }, { "epoch": 3.3, "learning_rate": 7.937224497826117e-05, "loss": 0.0035, "step": 16194 }, { "epoch": 3.3, "learning_rate": 7.93551435570131e-05, "loss": 0.0153, "step": 16195 }, { "epoch": 3.3, "learning_rate": 7.933804331566745e-05, "loss": 0.0075, "step": 16196 }, { "epoch": 3.3, "learning_rate": 7.932094425450993e-05, "loss": 0.0038, "step": 16197 }, { "epoch": 3.3, "learning_rate": 7.930384637382595e-05, "loss": 0.0039, "step": 16198 }, { "epoch": 3.3, "learning_rate": 7.92867496739013e-05, "loss": 0.0029, "step": 16199 }, { "epoch": 3.3, "learning_rate": 7.926965415502128e-05, "loss": 0.0017, "step": 16200 }, { "epoch": 3.3, "learning_rate": 7.925255981747168e-05, "loss": 0.0028, "step": 16201 }, { "epoch": 3.3, "learning_rate": 7.923546666153782e-05, "loss": 0.0049, "step": 16202 }, { "epoch": 3.3, "learning_rate": 7.921837468750524e-05, "loss": 0.0047, "step": 16203 }, { "epoch": 3.3, "learning_rate": 7.920128389565941e-05, "loss": 0.003, "step": 16204 }, { "epoch": 3.3, "learning_rate": 7.918419428628571e-05, "loss": 0.006, "step": 16205 }, { "epoch": 3.3, "learning_rate": 7.916710585966978e-05, "loss": 0.0038, "step": 16206 }, { "epoch": 3.3, "learning_rate": 7.915001861609684e-05, "loss": 0.0016, "step": 16207 }, { "epoch": 3.3, "learning_rate": 7.91329325558523e-05, "loss": 0.0082, "step": 16208 }, { "epoch": 3.3, "learning_rate": 7.911584767922155e-05, "loss": 0.0047, "step": 16209 }, { "epoch": 3.3, "learning_rate": 7.909876398649003e-05, "loss": 0.0026, "step": 16210 }, { "epoch": 3.3, "learning_rate": 7.908168147794285e-05, "loss": 0.0038, "step": 16211 }, { "epoch": 3.3, "learning_rate": 7.906460015386554e-05, "loss": 0.0006, "step": 16212 }, { "epoch": 3.3, "learning_rate": 7.904752001454328e-05, "loss": 0.001, "step": 16213 }, { "epoch": 3.3, "learning_rate": 7.90304410602614e-05, "loss": 0.0023, "step": 16214 }, { "epoch": 3.3, "learning_rate": 7.901336329130514e-05, "loss": 0.0017, "step": 16215 }, { "epoch": 3.3, "learning_rate": 7.899628670795963e-05, "loss": 0.0091, "step": 16216 }, { "epoch": 3.3, "learning_rate": 7.897921131051026e-05, "loss": 0.0022, "step": 16217 }, { "epoch": 3.3, "learning_rate": 7.8962137099242e-05, "loss": 0.0184, "step": 16218 }, { "epoch": 3.3, "learning_rate": 7.894506407444028e-05, "loss": 0.006, "step": 16219 }, { "epoch": 3.3, "learning_rate": 7.892799223639003e-05, "loss": 0.0067, "step": 16220 }, { "epoch": 3.3, "learning_rate": 7.89109215853765e-05, "loss": 0.0124, "step": 16221 }, { "epoch": 3.3, "learning_rate": 7.889385212168473e-05, "loss": 0.0042, "step": 16222 }, { "epoch": 3.3, "learning_rate": 7.887678384559989e-05, "loss": 0.0016, "step": 16223 }, { "epoch": 3.3, "learning_rate": 7.885971675740699e-05, "loss": 0.0049, "step": 16224 }, { "epoch": 3.3, "learning_rate": 7.884265085739111e-05, "loss": 0.0025, "step": 16225 }, { "epoch": 3.3, "learning_rate": 7.882558614583729e-05, "loss": 0.0005, "step": 16226 }, { "epoch": 3.3, "learning_rate": 7.880852262303053e-05, "loss": 0.0037, "step": 16227 }, { "epoch": 3.3, "learning_rate": 7.879146028925582e-05, "loss": 0.0008, "step": 16228 }, { "epoch": 3.3, "learning_rate": 7.877439914479815e-05, "loss": 0.0044, "step": 16229 }, { "epoch": 3.3, "learning_rate": 7.87573391899425e-05, "loss": 0.0076, "step": 16230 }, { "epoch": 3.3, "learning_rate": 7.874028042497366e-05, "loss": 0.0046, "step": 16231 }, { "epoch": 3.31, "learning_rate": 7.872322285017676e-05, "loss": 0.0022, "step": 16232 }, { "epoch": 3.31, "learning_rate": 7.870616646583648e-05, "loss": 0.0149, "step": 16233 }, { "epoch": 3.31, "learning_rate": 7.86891112722379e-05, "loss": 0.0032, "step": 16234 }, { "epoch": 3.31, "learning_rate": 7.867205726966573e-05, "loss": 0.006, "step": 16235 }, { "epoch": 3.31, "learning_rate": 7.865500445840477e-05, "loss": 0.0108, "step": 16236 }, { "epoch": 3.31, "learning_rate": 7.863795283874004e-05, "loss": 0.0086, "step": 16237 }, { "epoch": 3.31, "learning_rate": 7.862090241095612e-05, "loss": 0.0014, "step": 16238 }, { "epoch": 3.31, "learning_rate": 7.860385317533789e-05, "loss": 0.0043, "step": 16239 }, { "epoch": 3.31, "learning_rate": 7.858680513217008e-05, "loss": 0.0043, "step": 16240 }, { "epoch": 3.31, "learning_rate": 7.856975828173741e-05, "loss": 0.0077, "step": 16241 }, { "epoch": 3.31, "learning_rate": 7.855271262432464e-05, "loss": 0.0069, "step": 16242 }, { "epoch": 3.31, "learning_rate": 7.85356681602164e-05, "loss": 0.0079, "step": 16243 }, { "epoch": 3.31, "learning_rate": 7.851862488969741e-05, "loss": 0.0003, "step": 16244 }, { "epoch": 3.31, "learning_rate": 7.850158281305233e-05, "loss": 0.0043, "step": 16245 }, { "epoch": 3.31, "learning_rate": 7.848454193056576e-05, "loss": 0.0021, "step": 16246 }, { "epoch": 3.31, "learning_rate": 7.846750224252236e-05, "loss": 0.0013, "step": 16247 }, { "epoch": 3.31, "learning_rate": 7.845046374920674e-05, "loss": 0.0059, "step": 16248 }, { "epoch": 3.31, "learning_rate": 7.843342645090333e-05, "loss": 0.0008, "step": 16249 }, { "epoch": 3.31, "learning_rate": 7.84163903478969e-05, "loss": 0.0011, "step": 16250 }, { "epoch": 3.31, "learning_rate": 7.839935544047174e-05, "loss": 0.0003, "step": 16251 }, { "epoch": 3.31, "learning_rate": 7.838232172891265e-05, "loss": 0.0198, "step": 16252 }, { "epoch": 3.31, "learning_rate": 7.836528921350391e-05, "loss": 0.001, "step": 16253 }, { "epoch": 3.31, "learning_rate": 7.834825789453005e-05, "loss": 0.0075, "step": 16254 }, { "epoch": 3.31, "learning_rate": 7.833122777227551e-05, "loss": 0.0032, "step": 16255 }, { "epoch": 3.31, "learning_rate": 7.831419884702478e-05, "loss": 0.0071, "step": 16256 }, { "epoch": 3.31, "learning_rate": 7.829717111906225e-05, "loss": 0.0064, "step": 16257 }, { "epoch": 3.31, "learning_rate": 7.82801445886723e-05, "loss": 0.0042, "step": 16258 }, { "epoch": 3.31, "learning_rate": 7.826311925613931e-05, "loss": 0.0009, "step": 16259 }, { "epoch": 3.31, "learning_rate": 7.824609512174766e-05, "loss": 0.0063, "step": 16260 }, { "epoch": 3.31, "learning_rate": 7.822907218578171e-05, "loss": 0.0052, "step": 16261 }, { "epoch": 3.31, "learning_rate": 7.821205044852562e-05, "loss": 0.009, "step": 16262 }, { "epoch": 3.31, "learning_rate": 7.81950299102639e-05, "loss": 0.0055, "step": 16263 }, { "epoch": 3.31, "learning_rate": 7.817801057128065e-05, "loss": 0.001, "step": 16264 }, { "epoch": 3.31, "learning_rate": 7.81609924318602e-05, "loss": 0.002, "step": 16265 }, { "epoch": 3.31, "learning_rate": 7.814397549228688e-05, "loss": 0.0051, "step": 16266 }, { "epoch": 3.31, "learning_rate": 7.812695975284469e-05, "loss": 0.0025, "step": 16267 }, { "epoch": 3.31, "learning_rate": 7.810994521381803e-05, "loss": 0.0084, "step": 16268 }, { "epoch": 3.31, "learning_rate": 7.809293187549089e-05, "loss": 0.0023, "step": 16269 }, { "epoch": 3.31, "learning_rate": 7.807591973814764e-05, "loss": 0.0028, "step": 16270 }, { "epoch": 3.31, "learning_rate": 7.805890880207223e-05, "loss": 0.0032, "step": 16271 }, { "epoch": 3.31, "learning_rate": 7.804189906754884e-05, "loss": 0.0045, "step": 16272 }, { "epoch": 3.31, "learning_rate": 7.802489053486158e-05, "loss": 0.0094, "step": 16273 }, { "epoch": 3.31, "learning_rate": 7.800788320429448e-05, "loss": 0.0147, "step": 16274 }, { "epoch": 3.31, "learning_rate": 7.799087707613166e-05, "loss": 0.0113, "step": 16275 }, { "epoch": 3.31, "learning_rate": 7.79738721506571e-05, "loss": 0.0043, "step": 16276 }, { "epoch": 3.31, "learning_rate": 7.795686842815482e-05, "loss": 0.0109, "step": 16277 }, { "epoch": 3.31, "learning_rate": 7.793986590890887e-05, "loss": 0.0052, "step": 16278 }, { "epoch": 3.31, "learning_rate": 7.792286459320315e-05, "loss": 0.0029, "step": 16279 }, { "epoch": 3.31, "learning_rate": 7.790586448132167e-05, "loss": 0.0109, "step": 16280 }, { "epoch": 3.32, "learning_rate": 7.788886557354837e-05, "loss": 0.0048, "step": 16281 }, { "epoch": 3.32, "learning_rate": 7.787186787016704e-05, "loss": 0.0027, "step": 16282 }, { "epoch": 3.32, "learning_rate": 7.785487137146178e-05, "loss": 0.0076, "step": 16283 }, { "epoch": 3.32, "learning_rate": 7.783787607771628e-05, "loss": 0.0049, "step": 16284 }, { "epoch": 3.32, "learning_rate": 7.782088198921448e-05, "loss": 0.0122, "step": 16285 }, { "epoch": 3.32, "learning_rate": 7.78038891062402e-05, "loss": 0.0023, "step": 16286 }, { "epoch": 3.32, "learning_rate": 7.778689742907725e-05, "loss": 0.0056, "step": 16287 }, { "epoch": 3.32, "learning_rate": 7.776990695800941e-05, "loss": 0.001, "step": 16288 }, { "epoch": 3.32, "learning_rate": 7.775291769332047e-05, "loss": 0.0032, "step": 16289 }, { "epoch": 3.32, "learning_rate": 7.77359296352942e-05, "loss": 0.0012, "step": 16290 }, { "epoch": 3.32, "learning_rate": 7.771894278421431e-05, "loss": 0.0004, "step": 16291 }, { "epoch": 3.32, "learning_rate": 7.77019571403645e-05, "loss": 0.0021, "step": 16292 }, { "epoch": 3.32, "learning_rate": 7.768497270402849e-05, "loss": 0.0154, "step": 16293 }, { "epoch": 3.32, "learning_rate": 7.766798947548999e-05, "loss": 0.0031, "step": 16294 }, { "epoch": 3.32, "learning_rate": 7.76510074550325e-05, "loss": 0.0006, "step": 16295 }, { "epoch": 3.32, "learning_rate": 7.763402664293979e-05, "loss": 0.0011, "step": 16296 }, { "epoch": 3.32, "learning_rate": 7.761704703949545e-05, "loss": 0.0029, "step": 16297 }, { "epoch": 3.32, "learning_rate": 7.760006864498305e-05, "loss": 0.002, "step": 16298 }, { "epoch": 3.32, "learning_rate": 7.758309145968624e-05, "loss": 0.0048, "step": 16299 }, { "epoch": 3.32, "learning_rate": 7.756611548388837e-05, "loss": 0.0104, "step": 16300 }, { "epoch": 3.32, "learning_rate": 7.754914071787323e-05, "loss": 0.0047, "step": 16301 }, { "epoch": 3.32, "learning_rate": 7.753216716192406e-05, "loss": 0.0002, "step": 16302 }, { "epoch": 3.32, "learning_rate": 7.751519481632462e-05, "loss": 0.0034, "step": 16303 }, { "epoch": 3.32, "learning_rate": 7.749822368135821e-05, "loss": 0.0048, "step": 16304 }, { "epoch": 3.32, "learning_rate": 7.74812537573083e-05, "loss": 0.0023, "step": 16305 }, { "epoch": 3.32, "learning_rate": 7.746428504445835e-05, "loss": 0.0061, "step": 16306 }, { "epoch": 3.32, "learning_rate": 7.744731754309176e-05, "loss": 0.0096, "step": 16307 }, { "epoch": 3.32, "learning_rate": 7.743035125349192e-05, "loss": 0.0087, "step": 16308 }, { "epoch": 3.32, "learning_rate": 7.74133861759422e-05, "loss": 0.0165, "step": 16309 }, { "epoch": 3.32, "learning_rate": 7.739642231072594e-05, "loss": 0.0022, "step": 16310 }, { "epoch": 3.32, "learning_rate": 7.737945965812648e-05, "loss": 0.0004, "step": 16311 }, { "epoch": 3.32, "learning_rate": 7.736249821842719e-05, "loss": 0.007, "step": 16312 }, { "epoch": 3.32, "learning_rate": 7.734553799191118e-05, "loss": 0.0099, "step": 16313 }, { "epoch": 3.32, "learning_rate": 7.732857897886193e-05, "loss": 0.0026, "step": 16314 }, { "epoch": 3.32, "learning_rate": 7.731162117956246e-05, "loss": 0.0031, "step": 16315 }, { "epoch": 3.32, "learning_rate": 7.729466459429629e-05, "loss": 0.0026, "step": 16316 }, { "epoch": 3.32, "learning_rate": 7.727770922334638e-05, "loss": 0.0087, "step": 16317 }, { "epoch": 3.32, "learning_rate": 7.726075506699592e-05, "loss": 0.0031, "step": 16318 }, { "epoch": 3.32, "learning_rate": 7.72438021255283e-05, "loss": 0.0017, "step": 16319 }, { "epoch": 3.32, "learning_rate": 7.722685039922639e-05, "loss": 0.0011, "step": 16320 }, { "epoch": 3.32, "learning_rate": 7.720989988837356e-05, "loss": 0.002, "step": 16321 }, { "epoch": 3.32, "learning_rate": 7.719295059325274e-05, "loss": 0.0034, "step": 16322 }, { "epoch": 3.32, "learning_rate": 7.71760025141471e-05, "loss": 0.0027, "step": 16323 }, { "epoch": 3.32, "learning_rate": 7.715905565133968e-05, "loss": 0.0019, "step": 16324 }, { "epoch": 3.32, "learning_rate": 7.714211000511353e-05, "loss": 0.0043, "step": 16325 }, { "epoch": 3.32, "learning_rate": 7.712516557575164e-05, "loss": 0.0126, "step": 16326 }, { "epoch": 3.32, "learning_rate": 7.710822236353707e-05, "loss": 0.0005, "step": 16327 }, { "epoch": 3.32, "learning_rate": 7.709128036875279e-05, "loss": 0.0002, "step": 16328 }, { "epoch": 3.32, "learning_rate": 7.707433959168173e-05, "loss": 0.0049, "step": 16329 }, { "epoch": 3.33, "learning_rate": 7.705740003260687e-05, "loss": 0.0061, "step": 16330 }, { "epoch": 3.33, "learning_rate": 7.704046169181112e-05, "loss": 0.0003, "step": 16331 }, { "epoch": 3.33, "learning_rate": 7.702352456957743e-05, "loss": 0.0042, "step": 16332 }, { "epoch": 3.33, "learning_rate": 7.700658866618851e-05, "loss": 0.0033, "step": 16333 }, { "epoch": 3.33, "learning_rate": 7.698965398192748e-05, "loss": 0.0008, "step": 16334 }, { "epoch": 3.33, "learning_rate": 7.697272051707697e-05, "loss": 0.0056, "step": 16335 }, { "epoch": 3.33, "learning_rate": 7.695578827191988e-05, "loss": 0.0106, "step": 16336 }, { "epoch": 3.33, "learning_rate": 7.693885724673902e-05, "loss": 0.0004, "step": 16337 }, { "epoch": 3.33, "learning_rate": 7.692192744181716e-05, "loss": 0.0021, "step": 16338 }, { "epoch": 3.33, "learning_rate": 7.690499885743704e-05, "loss": 0.0009, "step": 16339 }, { "epoch": 3.33, "learning_rate": 7.688807149388143e-05, "loss": 0.0021, "step": 16340 }, { "epoch": 3.33, "learning_rate": 7.6871145351433e-05, "loss": 0.0003, "step": 16341 }, { "epoch": 3.33, "learning_rate": 7.685422043037451e-05, "loss": 0.0149, "step": 16342 }, { "epoch": 3.33, "learning_rate": 7.683729673098861e-05, "loss": 0.0029, "step": 16343 }, { "epoch": 3.33, "learning_rate": 7.682037425355795e-05, "loss": 0.0016, "step": 16344 }, { "epoch": 3.33, "learning_rate": 7.680345299836524e-05, "loss": 0.0329, "step": 16345 }, { "epoch": 3.33, "learning_rate": 7.678653296569292e-05, "loss": 0.0062, "step": 16346 }, { "epoch": 3.33, "learning_rate": 7.676961415582382e-05, "loss": 0.0033, "step": 16347 }, { "epoch": 3.33, "learning_rate": 7.675269656904027e-05, "loss": 0.0077, "step": 16348 }, { "epoch": 3.33, "learning_rate": 7.6735780205625e-05, "loss": 0.0034, "step": 16349 }, { "epoch": 3.33, "learning_rate": 7.671886506586057e-05, "loss": 0.001, "step": 16350 }, { "epoch": 3.33, "learning_rate": 7.670195115002931e-05, "loss": 0.0066, "step": 16351 }, { "epoch": 3.33, "learning_rate": 7.668503845841393e-05, "loss": 0.0017, "step": 16352 }, { "epoch": 3.33, "learning_rate": 7.66681269912967e-05, "loss": 0.0008, "step": 16353 }, { "epoch": 3.33, "learning_rate": 7.665121674896026e-05, "loss": 0.0006, "step": 16354 }, { "epoch": 3.33, "learning_rate": 7.663430773168693e-05, "loss": 0.0049, "step": 16355 }, { "epoch": 3.33, "learning_rate": 7.661739993975914e-05, "loss": 0.0003, "step": 16356 }, { "epoch": 3.33, "learning_rate": 7.660049337345927e-05, "loss": 0.0025, "step": 16357 }, { "epoch": 3.33, "learning_rate": 7.658358803306974e-05, "loss": 0.0135, "step": 16358 }, { "epoch": 3.33, "learning_rate": 7.656668391887287e-05, "loss": 0.0004, "step": 16359 }, { "epoch": 3.33, "learning_rate": 7.654978103115097e-05, "loss": 0.0074, "step": 16360 }, { "epoch": 3.33, "learning_rate": 7.653287937018637e-05, "loss": 0.0112, "step": 16361 }, { "epoch": 3.33, "learning_rate": 7.651597893626138e-05, "loss": 0.0082, "step": 16362 }, { "epoch": 3.33, "learning_rate": 7.649907972965833e-05, "loss": 0.0032, "step": 16363 }, { "epoch": 3.33, "learning_rate": 7.648218175065925e-05, "loss": 0.0019, "step": 16364 }, { "epoch": 3.33, "learning_rate": 7.646528499954663e-05, "loss": 0.0056, "step": 16365 }, { "epoch": 3.33, "learning_rate": 7.644838947660244e-05, "loss": 0.0012, "step": 16366 }, { "epoch": 3.33, "learning_rate": 7.64314951821091e-05, "loss": 0.0009, "step": 16367 }, { "epoch": 3.33, "learning_rate": 7.64146021163486e-05, "loss": 0.0002, "step": 16368 }, { "epoch": 3.33, "learning_rate": 7.639771027960317e-05, "loss": 0.0058, "step": 16369 }, { "epoch": 3.33, "learning_rate": 7.63808196721549e-05, "loss": 0.0016, "step": 16370 }, { "epoch": 3.33, "learning_rate": 7.636393029428583e-05, "loss": 0.0145, "step": 16371 }, { "epoch": 3.33, "learning_rate": 7.634704214627825e-05, "loss": 0.0017, "step": 16372 }, { "epoch": 3.33, "learning_rate": 7.633015522841405e-05, "loss": 0.0015, "step": 16373 }, { "epoch": 3.33, "learning_rate": 7.631326954097531e-05, "loss": 0.0068, "step": 16374 }, { "epoch": 3.33, "learning_rate": 7.629638508424406e-05, "loss": 0.0092, "step": 16375 }, { "epoch": 3.33, "learning_rate": 7.62795018585023e-05, "loss": 0.003, "step": 16376 }, { "epoch": 3.33, "learning_rate": 7.626261986403203e-05, "loss": 0.004, "step": 16377 }, { "epoch": 3.33, "learning_rate": 7.62457391011152e-05, "loss": 0.0048, "step": 16378 }, { "epoch": 3.34, "learning_rate": 7.622885957003372e-05, "loss": 0.0072, "step": 16379 }, { "epoch": 3.34, "learning_rate": 7.621198127106956e-05, "loss": 0.0027, "step": 16380 }, { "epoch": 3.34, "learning_rate": 7.61951042045046e-05, "loss": 0.0233, "step": 16381 }, { "epoch": 3.34, "learning_rate": 7.617822837062071e-05, "loss": 0.0048, "step": 16382 }, { "epoch": 3.34, "learning_rate": 7.616135376969982e-05, "loss": 0.01, "step": 16383 }, { "epoch": 3.34, "learning_rate": 7.614448040202359e-05, "loss": 0.0009, "step": 16384 }, { "epoch": 3.34, "learning_rate": 7.612760826787406e-05, "loss": 0.0056, "step": 16385 }, { "epoch": 3.34, "learning_rate": 7.611073736753284e-05, "loss": 0.002, "step": 16386 }, { "epoch": 3.34, "learning_rate": 7.609386770128179e-05, "loss": 0.0136, "step": 16387 }, { "epoch": 3.34, "learning_rate": 7.607699926940268e-05, "loss": 0.0005, "step": 16388 }, { "epoch": 3.34, "learning_rate": 7.606013207217718e-05, "loss": 0.0018, "step": 16389 }, { "epoch": 3.34, "learning_rate": 7.604326610988709e-05, "loss": 0.0197, "step": 16390 }, { "epoch": 3.34, "learning_rate": 7.602640138281404e-05, "loss": 0.0004, "step": 16391 }, { "epoch": 3.34, "learning_rate": 7.600953789123971e-05, "loss": 0.0056, "step": 16392 }, { "epoch": 3.34, "learning_rate": 7.599267563544577e-05, "loss": 0.0033, "step": 16393 }, { "epoch": 3.34, "learning_rate": 7.597581461571385e-05, "loss": 0.0044, "step": 16394 }, { "epoch": 3.34, "learning_rate": 7.595895483232556e-05, "loss": 0.007, "step": 16395 }, { "epoch": 3.34, "learning_rate": 7.594209628556254e-05, "loss": 0.0042, "step": 16396 }, { "epoch": 3.34, "learning_rate": 7.59252389757062e-05, "loss": 0.0058, "step": 16397 }, { "epoch": 3.34, "learning_rate": 7.590838290303829e-05, "loss": 0.0137, "step": 16398 }, { "epoch": 3.34, "learning_rate": 7.589152806784016e-05, "loss": 0.0014, "step": 16399 }, { "epoch": 3.34, "learning_rate": 7.587467447039349e-05, "loss": 0.008, "step": 16400 }, { "epoch": 3.34, "learning_rate": 7.585782211097962e-05, "loss": 0.001, "step": 16401 }, { "epoch": 3.34, "learning_rate": 7.584097098988003e-05, "loss": 0.0065, "step": 16402 }, { "epoch": 3.34, "learning_rate": 7.582412110737632e-05, "loss": 0.0027, "step": 16403 }, { "epoch": 3.34, "learning_rate": 7.580727246374968e-05, "loss": 0.0028, "step": 16404 }, { "epoch": 3.34, "learning_rate": 7.579042505928176e-05, "loss": 0.0056, "step": 16405 }, { "epoch": 3.34, "learning_rate": 7.577357889425376e-05, "loss": 0.0072, "step": 16406 }, { "epoch": 3.34, "learning_rate": 7.575673396894711e-05, "loss": 0.0074, "step": 16407 }, { "epoch": 3.34, "learning_rate": 7.573989028364317e-05, "loss": 0.0095, "step": 16408 }, { "epoch": 3.34, "learning_rate": 7.572304783862319e-05, "loss": 0.0054, "step": 16409 }, { "epoch": 3.34, "learning_rate": 7.570620663416857e-05, "loss": 0.0032, "step": 16410 }, { "epoch": 3.34, "learning_rate": 7.568936667056049e-05, "loss": 0.0097, "step": 16411 }, { "epoch": 3.34, "learning_rate": 7.567252794808029e-05, "loss": 0.0018, "step": 16412 }, { "epoch": 3.34, "learning_rate": 7.565569046700918e-05, "loss": 0.0006, "step": 16413 }, { "epoch": 3.34, "learning_rate": 7.563885422762841e-05, "loss": 0.0056, "step": 16414 }, { "epoch": 3.34, "learning_rate": 7.562201923021902e-05, "loss": 0.0221, "step": 16415 }, { "epoch": 3.34, "learning_rate": 7.560518547506245e-05, "loss": 0.0027, "step": 16416 }, { "epoch": 3.34, "learning_rate": 7.558835296243959e-05, "loss": 0.0003, "step": 16417 }, { "epoch": 3.34, "learning_rate": 7.55715216926318e-05, "loss": 0.014, "step": 16418 }, { "epoch": 3.34, "learning_rate": 7.555469166592003e-05, "loss": 0.0024, "step": 16419 }, { "epoch": 3.34, "learning_rate": 7.553786288258547e-05, "loss": 0.0024, "step": 16420 }, { "epoch": 3.34, "learning_rate": 7.552103534290913e-05, "loss": 0.0011, "step": 16421 }, { "epoch": 3.34, "learning_rate": 7.550420904717208e-05, "loss": 0.0061, "step": 16422 }, { "epoch": 3.34, "learning_rate": 7.548738399565537e-05, "loss": 0.0056, "step": 16423 }, { "epoch": 3.34, "learning_rate": 7.547056018864002e-05, "loss": 0.0057, "step": 16424 }, { "epoch": 3.34, "learning_rate": 7.545373762640697e-05, "loss": 0.0285, "step": 16425 }, { "epoch": 3.34, "learning_rate": 7.543691630923723e-05, "loss": 0.0061, "step": 16426 }, { "epoch": 3.34, "learning_rate": 7.542009623741172e-05, "loss": 0.0035, "step": 16427 }, { "epoch": 3.35, "learning_rate": 7.54032774112114e-05, "loss": 0.0045, "step": 16428 }, { "epoch": 3.35, "learning_rate": 7.538645983091721e-05, "loss": 0.0049, "step": 16429 }, { "epoch": 3.35, "learning_rate": 7.536964349680988e-05, "loss": 0.0031, "step": 16430 }, { "epoch": 3.35, "learning_rate": 7.535282840917042e-05, "loss": 0.0085, "step": 16431 }, { "epoch": 3.35, "learning_rate": 7.53360145682797e-05, "loss": 0.0062, "step": 16432 }, { "epoch": 3.35, "learning_rate": 7.531920197441834e-05, "loss": 0.0035, "step": 16433 }, { "epoch": 3.35, "learning_rate": 7.530239062786742e-05, "loss": 0.0031, "step": 16434 }, { "epoch": 3.35, "learning_rate": 7.528558052890744e-05, "loss": 0.0041, "step": 16435 }, { "epoch": 3.35, "learning_rate": 7.526877167781943e-05, "loss": 0.0074, "step": 16436 }, { "epoch": 3.35, "learning_rate": 7.525196407488395e-05, "loss": 0.0029, "step": 16437 }, { "epoch": 3.35, "learning_rate": 7.523515772038175e-05, "loss": 0.0052, "step": 16438 }, { "epoch": 3.35, "learning_rate": 7.521835261459354e-05, "loss": 0.0025, "step": 16439 }, { "epoch": 3.35, "learning_rate": 7.520154875780001e-05, "loss": 0.0008, "step": 16440 }, { "epoch": 3.35, "learning_rate": 7.518474615028181e-05, "loss": 0.0041, "step": 16441 }, { "epoch": 3.35, "learning_rate": 7.516794479231957e-05, "loss": 0.0217, "step": 16442 }, { "epoch": 3.35, "learning_rate": 7.51511446841939e-05, "loss": 0.0025, "step": 16443 }, { "epoch": 3.35, "learning_rate": 7.513434582618541e-05, "loss": 0.0033, "step": 16444 }, { "epoch": 3.35, "learning_rate": 7.511754821857467e-05, "loss": 0.001, "step": 16445 }, { "epoch": 3.35, "learning_rate": 7.510075186164221e-05, "loss": 0.002, "step": 16446 }, { "epoch": 3.35, "learning_rate": 7.508395675566864e-05, "loss": 0.0027, "step": 16447 }, { "epoch": 3.35, "learning_rate": 7.506716290093431e-05, "loss": 0.0053, "step": 16448 }, { "epoch": 3.35, "learning_rate": 7.505037029771989e-05, "loss": 0.0056, "step": 16449 }, { "epoch": 3.35, "learning_rate": 7.503357894630566e-05, "loss": 0.0074, "step": 16450 }, { "epoch": 3.35, "learning_rate": 7.501678884697227e-05, "loss": 0.006, "step": 16451 }, { "epoch": 3.35, "learning_rate": 7.500000000000002e-05, "loss": 0.0017, "step": 16452 }, { "epoch": 3.35, "learning_rate": 7.498321240566933e-05, "loss": 0.0015, "step": 16453 }, { "epoch": 3.35, "learning_rate": 7.496642606426059e-05, "loss": 0.0026, "step": 16454 }, { "epoch": 3.35, "learning_rate": 7.494964097605412e-05, "loss": 0.0014, "step": 16455 }, { "epoch": 3.35, "learning_rate": 7.493285714133043e-05, "loss": 0.0032, "step": 16456 }, { "epoch": 3.35, "learning_rate": 7.491607456036968e-05, "loss": 0.0148, "step": 16457 }, { "epoch": 3.35, "learning_rate": 7.489929323345218e-05, "loss": 0.0009, "step": 16458 }, { "epoch": 3.35, "learning_rate": 7.488251316085828e-05, "loss": 0.0038, "step": 16459 }, { "epoch": 3.35, "learning_rate": 7.486573434286823e-05, "loss": 0.0026, "step": 16460 }, { "epoch": 3.35, "learning_rate": 7.484895677976216e-05, "loss": 0.004, "step": 16461 }, { "epoch": 3.35, "learning_rate": 7.483218047182041e-05, "loss": 0.0119, "step": 16462 }, { "epoch": 3.35, "learning_rate": 7.481540541932315e-05, "loss": 0.0022, "step": 16463 }, { "epoch": 3.35, "learning_rate": 7.479863162255051e-05, "loss": 0.0093, "step": 16464 }, { "epoch": 3.35, "learning_rate": 7.478185908178276e-05, "loss": 0.0044, "step": 16465 }, { "epoch": 3.35, "learning_rate": 7.476508779729982e-05, "loss": 0.0062, "step": 16466 }, { "epoch": 3.35, "learning_rate": 7.474831776938205e-05, "loss": 0.014, "step": 16467 }, { "epoch": 3.35, "learning_rate": 7.473154899830931e-05, "loss": 0.0074, "step": 16468 }, { "epoch": 3.35, "learning_rate": 7.471478148436189e-05, "loss": 0.0017, "step": 16469 }, { "epoch": 3.35, "learning_rate": 7.469801522781967e-05, "loss": 0.0066, "step": 16470 }, { "epoch": 3.35, "learning_rate": 7.468125022896274e-05, "loss": 0.0043, "step": 16471 }, { "epoch": 3.35, "learning_rate": 7.46644864880711e-05, "loss": 0.0016, "step": 16472 }, { "epoch": 3.35, "learning_rate": 7.464772400542476e-05, "loss": 0.0029, "step": 16473 }, { "epoch": 3.35, "learning_rate": 7.463096278130365e-05, "loss": 0.0016, "step": 16474 }, { "epoch": 3.35, "learning_rate": 7.461420281598773e-05, "loss": 0.001, "step": 16475 }, { "epoch": 3.35, "learning_rate": 7.459744410975694e-05, "loss": 0.0087, "step": 16476 }, { "epoch": 3.36, "learning_rate": 7.458068666289116e-05, "loss": 0.0066, "step": 16477 }, { "epoch": 3.36, "learning_rate": 7.456393047567025e-05, "loss": 0.0028, "step": 16478 }, { "epoch": 3.36, "learning_rate": 7.454717554837413e-05, "loss": 0.0031, "step": 16479 }, { "epoch": 3.36, "learning_rate": 7.453042188128265e-05, "loss": 0.0069, "step": 16480 }, { "epoch": 3.36, "learning_rate": 7.451366947467547e-05, "loss": 0.0089, "step": 16481 }, { "epoch": 3.36, "learning_rate": 7.449691832883261e-05, "loss": 0.0089, "step": 16482 }, { "epoch": 3.36, "learning_rate": 7.448016844403368e-05, "loss": 0.0008, "step": 16483 }, { "epoch": 3.36, "learning_rate": 7.446341982055844e-05, "loss": 0.0014, "step": 16484 }, { "epoch": 3.36, "learning_rate": 7.44466724586868e-05, "loss": 0.0035, "step": 16485 }, { "epoch": 3.36, "learning_rate": 7.44299263586982e-05, "loss": 0.0009, "step": 16486 }, { "epoch": 3.36, "learning_rate": 7.441318152087261e-05, "loss": 0.0047, "step": 16487 }, { "epoch": 3.36, "learning_rate": 7.439643794548952e-05, "loss": 0.0116, "step": 16488 }, { "epoch": 3.36, "learning_rate": 7.437969563282863e-05, "loss": 0.0039, "step": 16489 }, { "epoch": 3.36, "learning_rate": 7.436295458316955e-05, "loss": 0.0047, "step": 16490 }, { "epoch": 3.36, "learning_rate": 7.434621479679191e-05, "loss": 0.0026, "step": 16491 }, { "epoch": 3.36, "learning_rate": 7.432947627397528e-05, "loss": 0.0035, "step": 16492 }, { "epoch": 3.36, "learning_rate": 7.431273901499926e-05, "loss": 0.0061, "step": 16493 }, { "epoch": 3.36, "learning_rate": 7.429600302014335e-05, "loss": 0.001, "step": 16494 }, { "epoch": 3.36, "learning_rate": 7.42792682896871e-05, "loss": 0.0079, "step": 16495 }, { "epoch": 3.36, "learning_rate": 7.426253482391e-05, "loss": 0.0037, "step": 16496 }, { "epoch": 3.36, "learning_rate": 7.424580262309152e-05, "loss": 0.0055, "step": 16497 }, { "epoch": 3.36, "learning_rate": 7.42290716875112e-05, "loss": 0.0027, "step": 16498 }, { "epoch": 3.36, "learning_rate": 7.421234201744828e-05, "loss": 0.0032, "step": 16499 }, { "epoch": 3.36, "learning_rate": 7.419561361318245e-05, "loss": 0.006, "step": 16500 }, { "epoch": 3.36, "learning_rate": 7.417888647499284e-05, "loss": 0.0209, "step": 16501 }, { "epoch": 3.36, "learning_rate": 7.416216060315905e-05, "loss": 0.0015, "step": 16502 }, { "epoch": 3.36, "learning_rate": 7.414543599796029e-05, "loss": 0.0005, "step": 16503 }, { "epoch": 3.36, "learning_rate": 7.412871265967593e-05, "loss": 0.006, "step": 16504 }, { "epoch": 3.36, "learning_rate": 7.411199058858529e-05, "loss": 0.0103, "step": 16505 }, { "epoch": 3.36, "learning_rate": 7.409526978496764e-05, "loss": 0.0015, "step": 16506 }, { "epoch": 3.36, "learning_rate": 7.407855024910228e-05, "loss": 0.0023, "step": 16507 }, { "epoch": 3.36, "learning_rate": 7.406183198126843e-05, "loss": 0.0101, "step": 16508 }, { "epoch": 3.36, "learning_rate": 7.404511498174534e-05, "loss": 0.0024, "step": 16509 }, { "epoch": 3.36, "learning_rate": 7.402839925081221e-05, "loss": 0.0048, "step": 16510 }, { "epoch": 3.36, "learning_rate": 7.401168478874827e-05, "loss": 0.0087, "step": 16511 }, { "epoch": 3.36, "learning_rate": 7.399497159583253e-05, "loss": 0.004, "step": 16512 }, { "epoch": 3.36, "learning_rate": 7.397825967234433e-05, "loss": 0.009, "step": 16513 }, { "epoch": 3.36, "learning_rate": 7.396154901856258e-05, "loss": 0.0112, "step": 16514 }, { "epoch": 3.36, "learning_rate": 7.394483963476655e-05, "loss": 0.0015, "step": 16515 }, { "epoch": 3.36, "learning_rate": 7.392813152123534e-05, "loss": 0.0015, "step": 16516 }, { "epoch": 3.36, "learning_rate": 7.391142467824779e-05, "loss": 0.0096, "step": 16517 }, { "epoch": 3.36, "learning_rate": 7.38947191060832e-05, "loss": 0.002, "step": 16518 }, { "epoch": 3.36, "learning_rate": 7.387801480502034e-05, "loss": 0.0092, "step": 16519 }, { "epoch": 3.36, "learning_rate": 7.386131177533846e-05, "loss": 0.0002, "step": 16520 }, { "epoch": 3.36, "learning_rate": 7.38446100173163e-05, "loss": 0.0047, "step": 16521 }, { "epoch": 3.36, "learning_rate": 7.382790953123293e-05, "loss": 0.0028, "step": 16522 }, { "epoch": 3.36, "learning_rate": 7.381121031736727e-05, "loss": 0.006, "step": 16523 }, { "epoch": 3.36, "learning_rate": 7.379451237599819e-05, "loss": 0.006, "step": 16524 }, { "epoch": 3.36, "learning_rate": 7.377781570740461e-05, "loss": 0.0003, "step": 16525 }, { "epoch": 3.37, "learning_rate": 7.376112031186538e-05, "loss": 0.0013, "step": 16526 }, { "epoch": 3.37, "learning_rate": 7.374442618965937e-05, "loss": 0.0258, "step": 16527 }, { "epoch": 3.37, "learning_rate": 7.372773334106537e-05, "loss": 0.0009, "step": 16528 }, { "epoch": 3.37, "learning_rate": 7.371104176636219e-05, "loss": 0.0048, "step": 16529 }, { "epoch": 3.37, "learning_rate": 7.369435146582864e-05, "loss": 0.0067, "step": 16530 }, { "epoch": 3.37, "learning_rate": 7.36776624397435e-05, "loss": 0.003, "step": 16531 }, { "epoch": 3.37, "learning_rate": 7.366097468838536e-05, "loss": 0.0043, "step": 16532 }, { "epoch": 3.37, "learning_rate": 7.364428821203314e-05, "loss": 0.0018, "step": 16533 }, { "epoch": 3.37, "learning_rate": 7.36276030109654e-05, "loss": 0.003, "step": 16534 }, { "epoch": 3.37, "learning_rate": 7.361091908546085e-05, "loss": 0.0078, "step": 16535 }, { "epoch": 3.37, "learning_rate": 7.359423643579815e-05, "loss": 0.0076, "step": 16536 }, { "epoch": 3.37, "learning_rate": 7.357755506225586e-05, "loss": 0.0053, "step": 16537 }, { "epoch": 3.37, "learning_rate": 7.356087496511277e-05, "loss": 0.0058, "step": 16538 }, { "epoch": 3.37, "learning_rate": 7.35441961446473e-05, "loss": 0.0026, "step": 16539 }, { "epoch": 3.37, "learning_rate": 7.352751860113808e-05, "loss": 0.0014, "step": 16540 }, { "epoch": 3.37, "learning_rate": 7.351084233486366e-05, "loss": 0.0003, "step": 16541 }, { "epoch": 3.37, "learning_rate": 7.349416734610255e-05, "loss": 0.0063, "step": 16542 }, { "epoch": 3.37, "learning_rate": 7.347749363513326e-05, "loss": 0.0006, "step": 16543 }, { "epoch": 3.37, "learning_rate": 7.346082120223427e-05, "loss": 0.002, "step": 16544 }, { "epoch": 3.37, "learning_rate": 7.344415004768403e-05, "loss": 0.0024, "step": 16545 }, { "epoch": 3.37, "learning_rate": 7.342748017176102e-05, "loss": 0.0067, "step": 16546 }, { "epoch": 3.37, "learning_rate": 7.341081157474362e-05, "loss": 0.0062, "step": 16547 }, { "epoch": 3.37, "learning_rate": 7.339414425691025e-05, "loss": 0.0006, "step": 16548 }, { "epoch": 3.37, "learning_rate": 7.337747821853932e-05, "loss": 0.0007, "step": 16549 }, { "epoch": 3.37, "learning_rate": 7.336081345990903e-05, "loss": 0.0013, "step": 16550 }, { "epoch": 3.37, "learning_rate": 7.334414998129792e-05, "loss": 0.0036, "step": 16551 }, { "epoch": 3.37, "learning_rate": 7.332748778298411e-05, "loss": 0.0029, "step": 16552 }, { "epoch": 3.37, "learning_rate": 7.331082686524609e-05, "loss": 0.0076, "step": 16553 }, { "epoch": 3.37, "learning_rate": 7.329416722836197e-05, "loss": 0.0074, "step": 16554 }, { "epoch": 3.37, "learning_rate": 7.327750887261003e-05, "loss": 0.004, "step": 16555 }, { "epoch": 3.37, "learning_rate": 7.326085179826854e-05, "loss": 0.0044, "step": 16556 }, { "epoch": 3.37, "learning_rate": 7.324419600561567e-05, "loss": 0.0053, "step": 16557 }, { "epoch": 3.37, "learning_rate": 7.322754149492962e-05, "loss": 0.0015, "step": 16558 }, { "epoch": 3.37, "learning_rate": 7.321088826648853e-05, "loss": 0.0032, "step": 16559 }, { "epoch": 3.37, "learning_rate": 7.319423632057057e-05, "loss": 0.0007, "step": 16560 }, { "epoch": 3.37, "learning_rate": 7.317758565745384e-05, "loss": 0.0255, "step": 16561 }, { "epoch": 3.37, "learning_rate": 7.316093627741649e-05, "loss": 0.0032, "step": 16562 }, { "epoch": 3.37, "learning_rate": 7.314428818073645e-05, "loss": 0.0059, "step": 16563 }, { "epoch": 3.37, "learning_rate": 7.312764136769198e-05, "loss": 0.0089, "step": 16564 }, { "epoch": 3.37, "learning_rate": 7.31109958385609e-05, "loss": 0.0023, "step": 16565 }, { "epoch": 3.37, "learning_rate": 7.309435159362143e-05, "loss": 0.0055, "step": 16566 }, { "epoch": 3.37, "learning_rate": 7.30777086331514e-05, "loss": 0.0036, "step": 16567 }, { "epoch": 3.37, "learning_rate": 7.306106695742879e-05, "loss": 0.0093, "step": 16568 }, { "epoch": 3.37, "learning_rate": 7.304442656673171e-05, "loss": 0.0058, "step": 16569 }, { "epoch": 3.37, "learning_rate": 7.302778746133784e-05, "loss": 0.0072, "step": 16570 }, { "epoch": 3.37, "learning_rate": 7.301114964152534e-05, "loss": 0.0106, "step": 16571 }, { "epoch": 3.37, "learning_rate": 7.29945131075719e-05, "loss": 0.0034, "step": 16572 }, { "epoch": 3.37, "learning_rate": 7.297787785975547e-05, "loss": 0.0003, "step": 16573 }, { "epoch": 3.37, "learning_rate": 7.296124389835386e-05, "loss": 0.0072, "step": 16574 }, { "epoch": 3.37, "learning_rate": 7.29446112236449e-05, "loss": 0.0068, "step": 16575 }, { "epoch": 3.38, "learning_rate": 7.292797983590638e-05, "loss": 0.0015, "step": 16576 }, { "epoch": 3.38, "learning_rate": 7.291134973541608e-05, "loss": 0.0058, "step": 16577 }, { "epoch": 3.38, "learning_rate": 7.289472092245175e-05, "loss": 0.0045, "step": 16578 }, { "epoch": 3.38, "learning_rate": 7.287809339729114e-05, "loss": 0.0047, "step": 16579 }, { "epoch": 3.38, "learning_rate": 7.286146716021198e-05, "loss": 0.0077, "step": 16580 }, { "epoch": 3.38, "learning_rate": 7.284484221149184e-05, "loss": 0.0062, "step": 16581 }, { "epoch": 3.38, "learning_rate": 7.28282185514086e-05, "loss": 0.0009, "step": 16582 }, { "epoch": 3.38, "learning_rate": 7.281159618023963e-05, "loss": 0.0004, "step": 16583 }, { "epoch": 3.38, "learning_rate": 7.279497509826284e-05, "loss": 0.0029, "step": 16584 }, { "epoch": 3.38, "learning_rate": 7.277835530575564e-05, "loss": 0.0023, "step": 16585 }, { "epoch": 3.38, "learning_rate": 7.276173680299568e-05, "loss": 0.0183, "step": 16586 }, { "epoch": 3.38, "learning_rate": 7.274511959026051e-05, "loss": 0.0062, "step": 16587 }, { "epoch": 3.38, "learning_rate": 7.272850366782767e-05, "loss": 0.0038, "step": 16588 }, { "epoch": 3.38, "learning_rate": 7.27118890359747e-05, "loss": 0.0027, "step": 16589 }, { "epoch": 3.38, "learning_rate": 7.269527569497905e-05, "loss": 0.0029, "step": 16590 }, { "epoch": 3.38, "learning_rate": 7.267866364511821e-05, "loss": 0.0042, "step": 16591 }, { "epoch": 3.38, "learning_rate": 7.266205288666966e-05, "loss": 0.0431, "step": 16592 }, { "epoch": 3.38, "learning_rate": 7.264544341991081e-05, "loss": 0.0045, "step": 16593 }, { "epoch": 3.38, "learning_rate": 7.262883524511908e-05, "loss": 0.0059, "step": 16594 }, { "epoch": 3.38, "learning_rate": 7.261222836257188e-05, "loss": 0.0033, "step": 16595 }, { "epoch": 3.38, "learning_rate": 7.259562277254646e-05, "loss": 0.0087, "step": 16596 }, { "epoch": 3.38, "learning_rate": 7.25790184753203e-05, "loss": 0.0052, "step": 16597 }, { "epoch": 3.38, "learning_rate": 7.256241547117067e-05, "loss": 0.0043, "step": 16598 }, { "epoch": 3.38, "learning_rate": 7.254581376037488e-05, "loss": 0.004, "step": 16599 }, { "epoch": 3.38, "learning_rate": 7.252921334321025e-05, "loss": 0.0024, "step": 16600 }, { "epoch": 3.38, "learning_rate": 7.25126142199539e-05, "loss": 0.0058, "step": 16601 }, { "epoch": 3.38, "learning_rate": 7.249601639088326e-05, "loss": 0.0081, "step": 16602 }, { "epoch": 3.38, "learning_rate": 7.247941985627532e-05, "loss": 0.0021, "step": 16603 }, { "epoch": 3.38, "learning_rate": 7.246282461640753e-05, "loss": 0.0067, "step": 16604 }, { "epoch": 3.38, "learning_rate": 7.244623067155687e-05, "loss": 0.0024, "step": 16605 }, { "epoch": 3.38, "learning_rate": 7.242963802200056e-05, "loss": 0.0023, "step": 16606 }, { "epoch": 3.38, "learning_rate": 7.241304666801572e-05, "loss": 0.0127, "step": 16607 }, { "epoch": 3.38, "learning_rate": 7.239645660987944e-05, "loss": 0.0031, "step": 16608 }, { "epoch": 3.38, "learning_rate": 7.237986784786882e-05, "loss": 0.0039, "step": 16609 }, { "epoch": 3.38, "learning_rate": 7.236328038226095e-05, "loss": 0.0026, "step": 16610 }, { "epoch": 3.38, "learning_rate": 7.234669421333283e-05, "loss": 0.0019, "step": 16611 }, { "epoch": 3.38, "learning_rate": 7.233010934136149e-05, "loss": 0.0044, "step": 16612 }, { "epoch": 3.38, "learning_rate": 7.2313525766624e-05, "loss": 0.0025, "step": 16613 }, { "epoch": 3.38, "learning_rate": 7.229694348939718e-05, "loss": 0.002, "step": 16614 }, { "epoch": 3.38, "learning_rate": 7.228036250995816e-05, "loss": 0.0029, "step": 16615 }, { "epoch": 3.38, "learning_rate": 7.226378282858369e-05, "loss": 0.0063, "step": 16616 }, { "epoch": 3.38, "learning_rate": 7.22472044455509e-05, "loss": 0.0083, "step": 16617 }, { "epoch": 3.38, "learning_rate": 7.223062736113653e-05, "loss": 0.0084, "step": 16618 }, { "epoch": 3.38, "learning_rate": 7.221405157561746e-05, "loss": 0.008, "step": 16619 }, { "epoch": 3.38, "learning_rate": 7.219747708927056e-05, "loss": 0.0063, "step": 16620 }, { "epoch": 3.38, "learning_rate": 7.218090390237259e-05, "loss": 0.0023, "step": 16621 }, { "epoch": 3.38, "learning_rate": 7.216433201520055e-05, "loss": 0.0062, "step": 16622 }, { "epoch": 3.38, "learning_rate": 7.214776142803102e-05, "loss": 0.0138, "step": 16623 }, { "epoch": 3.38, "learning_rate": 7.213119214114083e-05, "loss": 0.0004, "step": 16624 }, { "epoch": 3.39, "learning_rate": 7.211462415480673e-05, "loss": 0.0113, "step": 16625 }, { "epoch": 3.39, "learning_rate": 7.209805746930544e-05, "loss": 0.0051, "step": 16626 }, { "epoch": 3.39, "learning_rate": 7.20814920849136e-05, "loss": 0.0019, "step": 16627 }, { "epoch": 3.39, "learning_rate": 7.206492800190796e-05, "loss": 0.0102, "step": 16628 }, { "epoch": 3.39, "learning_rate": 7.20483652205651e-05, "loss": 0.0039, "step": 16629 }, { "epoch": 3.39, "learning_rate": 7.203180374116172e-05, "loss": 0.0075, "step": 16630 }, { "epoch": 3.39, "learning_rate": 7.201524356397444e-05, "loss": 0.0022, "step": 16631 }, { "epoch": 3.39, "learning_rate": 7.199868468927969e-05, "loss": 0.0119, "step": 16632 }, { "epoch": 3.39, "learning_rate": 7.198212711735424e-05, "loss": 0.0121, "step": 16633 }, { "epoch": 3.39, "learning_rate": 7.196557084847444e-05, "loss": 0.0069, "step": 16634 }, { "epoch": 3.39, "learning_rate": 7.194901588291701e-05, "loss": 0.0026, "step": 16635 }, { "epoch": 3.39, "learning_rate": 7.193246222095829e-05, "loss": 0.0066, "step": 16636 }, { "epoch": 3.39, "learning_rate": 7.191590986287481e-05, "loss": 0.0006, "step": 16637 }, { "epoch": 3.39, "learning_rate": 7.189935880894303e-05, "loss": 0.0043, "step": 16638 }, { "epoch": 3.39, "learning_rate": 7.18828090594394e-05, "loss": 0.0032, "step": 16639 }, { "epoch": 3.39, "learning_rate": 7.18662606146403e-05, "loss": 0.004, "step": 16640 }, { "epoch": 3.39, "learning_rate": 7.184971347482215e-05, "loss": 0.0014, "step": 16641 }, { "epoch": 3.39, "learning_rate": 7.183316764026128e-05, "loss": 0.0064, "step": 16642 }, { "epoch": 3.39, "learning_rate": 7.181662311123408e-05, "loss": 0.0013, "step": 16643 }, { "epoch": 3.39, "learning_rate": 7.180007988801685e-05, "loss": 0.0056, "step": 16644 }, { "epoch": 3.39, "learning_rate": 7.178353797088591e-05, "loss": 0.0043, "step": 16645 }, { "epoch": 3.39, "learning_rate": 7.176699736011757e-05, "loss": 0.0036, "step": 16646 }, { "epoch": 3.39, "learning_rate": 7.175045805598794e-05, "loss": 0.0003, "step": 16647 }, { "epoch": 3.39, "learning_rate": 7.173392005877347e-05, "loss": 0.0026, "step": 16648 }, { "epoch": 3.39, "learning_rate": 7.171738336875018e-05, "loss": 0.0015, "step": 16649 }, { "epoch": 3.39, "learning_rate": 7.17008479861944e-05, "loss": 0.0065, "step": 16650 }, { "epoch": 3.39, "learning_rate": 7.168431391138232e-05, "loss": 0.0024, "step": 16651 }, { "epoch": 3.39, "learning_rate": 7.166778114458992e-05, "loss": 0.0032, "step": 16652 }, { "epoch": 3.39, "learning_rate": 7.165124968609356e-05, "loss": 0.0023, "step": 16653 }, { "epoch": 3.39, "learning_rate": 7.163471953616914e-05, "loss": 0.0089, "step": 16654 }, { "epoch": 3.39, "learning_rate": 7.161819069509286e-05, "loss": 0.0023, "step": 16655 }, { "epoch": 3.39, "learning_rate": 7.160166316314073e-05, "loss": 0.0027, "step": 16656 }, { "epoch": 3.39, "learning_rate": 7.15851369405888e-05, "loss": 0.0091, "step": 16657 }, { "epoch": 3.39, "learning_rate": 7.156861202771311e-05, "loss": 0.0136, "step": 16658 }, { "epoch": 3.39, "learning_rate": 7.155208842478968e-05, "loss": 0.0094, "step": 16659 }, { "epoch": 3.39, "learning_rate": 7.153556613209444e-05, "loss": 0.0086, "step": 16660 }, { "epoch": 3.39, "learning_rate": 7.151904514990334e-05, "loss": 0.0111, "step": 16661 }, { "epoch": 3.39, "learning_rate": 7.150252547849232e-05, "loss": 0.0122, "step": 16662 }, { "epoch": 3.39, "learning_rate": 7.148600711813734e-05, "loss": 0.0102, "step": 16663 }, { "epoch": 3.39, "learning_rate": 7.146949006911427e-05, "loss": 0.0167, "step": 16664 }, { "epoch": 3.39, "learning_rate": 7.145297433169885e-05, "loss": 0.0068, "step": 16665 }, { "epoch": 3.39, "learning_rate": 7.143645990616714e-05, "loss": 0.0021, "step": 16666 }, { "epoch": 3.39, "learning_rate": 7.141994679279473e-05, "loss": 0.0016, "step": 16667 }, { "epoch": 3.39, "learning_rate": 7.140343499185766e-05, "loss": 0.0009, "step": 16668 }, { "epoch": 3.39, "learning_rate": 7.138692450363154e-05, "loss": 0.0104, "step": 16669 }, { "epoch": 3.39, "learning_rate": 7.137041532839215e-05, "loss": 0.0017, "step": 16670 }, { "epoch": 3.39, "learning_rate": 7.135390746641526e-05, "loss": 0.0046, "step": 16671 }, { "epoch": 3.39, "learning_rate": 7.133740091797658e-05, "loss": 0.0026, "step": 16672 }, { "epoch": 3.39, "learning_rate": 7.132089568335178e-05, "loss": 0.004, "step": 16673 }, { "epoch": 3.4, "learning_rate": 7.130439176281653e-05, "loss": 0.0018, "step": 16674 }, { "epoch": 3.4, "learning_rate": 7.128788915664649e-05, "loss": 0.0009, "step": 16675 }, { "epoch": 3.4, "learning_rate": 7.12713878651173e-05, "loss": 0.002, "step": 16676 }, { "epoch": 3.4, "learning_rate": 7.125488788850452e-05, "loss": 0.0018, "step": 16677 }, { "epoch": 3.4, "learning_rate": 7.123838922708378e-05, "loss": 0.0036, "step": 16678 }, { "epoch": 3.4, "learning_rate": 7.122189188113065e-05, "loss": 0.0017, "step": 16679 }, { "epoch": 3.4, "learning_rate": 7.120539585092052e-05, "loss": 0.0056, "step": 16680 }, { "epoch": 3.4, "learning_rate": 7.118890113672908e-05, "loss": 0.0033, "step": 16681 }, { "epoch": 3.4, "learning_rate": 7.11724077388318e-05, "loss": 0.0027, "step": 16682 }, { "epoch": 3.4, "learning_rate": 7.115591565750401e-05, "loss": 0.005, "step": 16683 }, { "epoch": 3.4, "learning_rate": 7.113942489302135e-05, "loss": 0.014, "step": 16684 }, { "epoch": 3.4, "learning_rate": 7.112293544565905e-05, "loss": 0.007, "step": 16685 }, { "epoch": 3.4, "learning_rate": 7.110644731569273e-05, "loss": 0.0016, "step": 16686 }, { "epoch": 3.4, "learning_rate": 7.108996050339763e-05, "loss": 0.004, "step": 16687 }, { "epoch": 3.4, "learning_rate": 7.10734750090491e-05, "loss": 0.009, "step": 16688 }, { "epoch": 3.4, "learning_rate": 7.105699083292256e-05, "loss": 0.0079, "step": 16689 }, { "epoch": 3.4, "learning_rate": 7.104050797529328e-05, "loss": 0.0065, "step": 16690 }, { "epoch": 3.4, "learning_rate": 7.102402643643655e-05, "loss": 0.0043, "step": 16691 }, { "epoch": 3.4, "learning_rate": 7.100754621662765e-05, "loss": 0.0074, "step": 16692 }, { "epoch": 3.4, "learning_rate": 7.099106731614185e-05, "loss": 0.001, "step": 16693 }, { "epoch": 3.4, "learning_rate": 7.097458973525438e-05, "loss": 0.0071, "step": 16694 }, { "epoch": 3.4, "learning_rate": 7.095811347424041e-05, "loss": 0.0076, "step": 16695 }, { "epoch": 3.4, "learning_rate": 7.094163853337515e-05, "loss": 0.002, "step": 16696 }, { "epoch": 3.4, "learning_rate": 7.092516491293383e-05, "loss": 0.012, "step": 16697 }, { "epoch": 3.4, "learning_rate": 7.09086926131914e-05, "loss": 0.002, "step": 16698 }, { "epoch": 3.4, "learning_rate": 7.08922216344232e-05, "loss": 0.0095, "step": 16699 }, { "epoch": 3.4, "learning_rate": 7.087575197690413e-05, "loss": 0.0006, "step": 16700 }, { "epoch": 3.4, "learning_rate": 7.085928364090947e-05, "loss": 0.0018, "step": 16701 }, { "epoch": 3.4, "learning_rate": 7.08428166267141e-05, "loss": 0.0153, "step": 16702 }, { "epoch": 3.4, "learning_rate": 7.082635093459306e-05, "loss": 0.0002, "step": 16703 }, { "epoch": 3.4, "learning_rate": 7.080988656482152e-05, "loss": 0.0097, "step": 16704 }, { "epoch": 3.4, "learning_rate": 7.07934235176743e-05, "loss": 0.0156, "step": 16705 }, { "epoch": 3.4, "learning_rate": 7.077696179342642e-05, "loss": 0.0027, "step": 16706 }, { "epoch": 3.4, "learning_rate": 7.076050139235281e-05, "loss": 0.0047, "step": 16707 }, { "epoch": 3.4, "learning_rate": 7.074404231472842e-05, "loss": 0.0026, "step": 16708 }, { "epoch": 3.4, "learning_rate": 7.072758456082812e-05, "loss": 0.001, "step": 16709 }, { "epoch": 3.4, "learning_rate": 7.071112813092686e-05, "loss": 0.0072, "step": 16710 }, { "epoch": 3.4, "learning_rate": 7.069467302529931e-05, "loss": 0.0018, "step": 16711 }, { "epoch": 3.4, "learning_rate": 7.067821924422048e-05, "loss": 0.0057, "step": 16712 }, { "epoch": 3.4, "learning_rate": 7.066176678796512e-05, "loss": 0.0016, "step": 16713 }, { "epoch": 3.4, "learning_rate": 7.0645315656808e-05, "loss": 0.0042, "step": 16714 }, { "epoch": 3.4, "learning_rate": 7.062886585102398e-05, "loss": 0.0173, "step": 16715 }, { "epoch": 3.4, "learning_rate": 7.061241737088759e-05, "loss": 0.0013, "step": 16716 }, { "epoch": 3.4, "learning_rate": 7.059597021667382e-05, "loss": 0.003, "step": 16717 }, { "epoch": 3.4, "learning_rate": 7.057952438865711e-05, "loss": 0.0073, "step": 16718 }, { "epoch": 3.4, "learning_rate": 7.056307988711236e-05, "loss": 0.0055, "step": 16719 }, { "epoch": 3.4, "learning_rate": 7.054663671231408e-05, "loss": 0.0036, "step": 16720 }, { "epoch": 3.4, "learning_rate": 7.053019486453695e-05, "loss": 0.0023, "step": 16721 }, { "epoch": 3.4, "learning_rate": 7.051375434405556e-05, "loss": 0.0021, "step": 16722 }, { "epoch": 3.41, "learning_rate": 7.049731515114453e-05, "loss": 0.0014, "step": 16723 }, { "epoch": 3.41, "learning_rate": 7.048087728607841e-05, "loss": 0.0007, "step": 16724 }, { "epoch": 3.41, "learning_rate": 7.046444074913173e-05, "loss": 0.002, "step": 16725 }, { "epoch": 3.41, "learning_rate": 7.044800554057902e-05, "loss": 0.0034, "step": 16726 }, { "epoch": 3.41, "learning_rate": 7.04315716606948e-05, "loss": 0.0014, "step": 16727 }, { "epoch": 3.41, "learning_rate": 7.041513910975351e-05, "loss": 0.0152, "step": 16728 }, { "epoch": 3.41, "learning_rate": 7.039870788802963e-05, "loss": 0.0002, "step": 16729 }, { "epoch": 3.41, "learning_rate": 7.038227799579765e-05, "loss": 0.0027, "step": 16730 }, { "epoch": 3.41, "learning_rate": 7.036584943333181e-05, "loss": 0.0029, "step": 16731 }, { "epoch": 3.41, "learning_rate": 7.03494222009067e-05, "loss": 0.004, "step": 16732 }, { "epoch": 3.41, "learning_rate": 7.033299629879655e-05, "loss": 0.0119, "step": 16733 }, { "epoch": 3.41, "learning_rate": 7.031657172727567e-05, "loss": 0.0012, "step": 16734 }, { "epoch": 3.41, "learning_rate": 7.030014848661858e-05, "loss": 0.0029, "step": 16735 }, { "epoch": 3.41, "learning_rate": 7.028372657709934e-05, "loss": 0.0048, "step": 16736 }, { "epoch": 3.41, "learning_rate": 7.026730599899246e-05, "loss": 0.0055, "step": 16737 }, { "epoch": 3.41, "learning_rate": 7.0250886752572e-05, "loss": 0.0056, "step": 16738 }, { "epoch": 3.41, "learning_rate": 7.023446883811227e-05, "loss": 0.0032, "step": 16739 }, { "epoch": 3.41, "learning_rate": 7.021805225588751e-05, "loss": 0.0027, "step": 16740 }, { "epoch": 3.41, "learning_rate": 7.020163700617184e-05, "loss": 0.0077, "step": 16741 }, { "epoch": 3.41, "learning_rate": 7.018522308923948e-05, "loss": 0.0087, "step": 16742 }, { "epoch": 3.41, "learning_rate": 7.016881050536455e-05, "loss": 0.0017, "step": 16743 }, { "epoch": 3.41, "learning_rate": 7.01523992548212e-05, "loss": 0.0077, "step": 16744 }, { "epoch": 3.41, "learning_rate": 7.013598933788349e-05, "loss": 0.0083, "step": 16745 }, { "epoch": 3.41, "learning_rate": 7.01195807548255e-05, "loss": 0.0033, "step": 16746 }, { "epoch": 3.41, "learning_rate": 7.01031735059213e-05, "loss": 0.0073, "step": 16747 }, { "epoch": 3.41, "learning_rate": 7.008676759144496e-05, "loss": 0.001, "step": 16748 }, { "epoch": 3.41, "learning_rate": 7.007036301167036e-05, "loss": 0.0057, "step": 16749 }, { "epoch": 3.41, "learning_rate": 7.005395976687169e-05, "loss": 0.0017, "step": 16750 }, { "epoch": 3.41, "learning_rate": 7.003755785732267e-05, "loss": 0.0007, "step": 16751 }, { "epoch": 3.41, "learning_rate": 7.00211572832975e-05, "loss": 0.0071, "step": 16752 }, { "epoch": 3.41, "learning_rate": 7.000475804506991e-05, "loss": 0.0008, "step": 16753 }, { "epoch": 3.41, "learning_rate": 6.998836014291387e-05, "loss": 0.0012, "step": 16754 }, { "epoch": 3.41, "learning_rate": 6.997196357710325e-05, "loss": 0.0041, "step": 16755 }, { "epoch": 3.41, "learning_rate": 6.99555683479119e-05, "loss": 0.0061, "step": 16756 }, { "epoch": 3.41, "learning_rate": 6.993917445561365e-05, "loss": 0.0057, "step": 16757 }, { "epoch": 3.41, "learning_rate": 6.992278190048231e-05, "loss": 0.0066, "step": 16758 }, { "epoch": 3.41, "learning_rate": 6.990639068279166e-05, "loss": 0.0034, "step": 16759 }, { "epoch": 3.41, "learning_rate": 6.989000080281549e-05, "loss": 0.0093, "step": 16760 }, { "epoch": 3.41, "learning_rate": 6.987361226082758e-05, "loss": 0.004, "step": 16761 }, { "epoch": 3.41, "learning_rate": 6.985722505710147e-05, "loss": 0.004, "step": 16762 }, { "epoch": 3.41, "learning_rate": 6.984083919191111e-05, "loss": 0.001, "step": 16763 }, { "epoch": 3.41, "learning_rate": 6.982445466552992e-05, "loss": 0.0046, "step": 16764 }, { "epoch": 3.41, "learning_rate": 6.980807147823173e-05, "loss": 0.0033, "step": 16765 }, { "epoch": 3.41, "learning_rate": 6.97916896302902e-05, "loss": 0.0117, "step": 16766 }, { "epoch": 3.41, "learning_rate": 6.977530912197874e-05, "loss": 0.0044, "step": 16767 }, { "epoch": 3.41, "learning_rate": 6.975892995357115e-05, "loss": 0.0173, "step": 16768 }, { "epoch": 3.41, "learning_rate": 6.974255212534078e-05, "loss": 0.0069, "step": 16769 }, { "epoch": 3.41, "learning_rate": 6.972617563756141e-05, "loss": 0.008, "step": 16770 }, { "epoch": 3.41, "learning_rate": 6.970980049050637e-05, "loss": 0.0033, "step": 16771 }, { "epoch": 3.42, "learning_rate": 6.969342668444923e-05, "loss": 0.0008, "step": 16772 }, { "epoch": 3.42, "learning_rate": 6.967705421966346e-05, "loss": 0.0004, "step": 16773 }, { "epoch": 3.42, "learning_rate": 6.966068309642249e-05, "loss": 0.0033, "step": 16774 }, { "epoch": 3.42, "learning_rate": 6.964431331499977e-05, "loss": 0.0072, "step": 16775 }, { "epoch": 3.42, "learning_rate": 6.962794487566869e-05, "loss": 0.0011, "step": 16776 }, { "epoch": 3.42, "learning_rate": 6.961157777870266e-05, "loss": 0.0058, "step": 16777 }, { "epoch": 3.42, "learning_rate": 6.959521202437501e-05, "loss": 0.0061, "step": 16778 }, { "epoch": 3.42, "learning_rate": 6.957884761295915e-05, "loss": 0.0037, "step": 16779 }, { "epoch": 3.42, "learning_rate": 6.956248454472824e-05, "loss": 0.0053, "step": 16780 }, { "epoch": 3.42, "learning_rate": 6.954612281995579e-05, "loss": 0.0023, "step": 16781 }, { "epoch": 3.42, "learning_rate": 6.952976243891482e-05, "loss": 0.0038, "step": 16782 }, { "epoch": 3.42, "learning_rate": 6.951340340187885e-05, "loss": 0.0052, "step": 16783 }, { "epoch": 3.42, "learning_rate": 6.949704570912093e-05, "loss": 0.0108, "step": 16784 }, { "epoch": 3.42, "learning_rate": 6.948068936091428e-05, "loss": 0.0109, "step": 16785 }, { "epoch": 3.42, "learning_rate": 6.946433435753211e-05, "loss": 0.0031, "step": 16786 }, { "epoch": 3.42, "learning_rate": 6.944798069924753e-05, "loss": 0.0044, "step": 16787 }, { "epoch": 3.42, "learning_rate": 6.943162838633383e-05, "loss": 0.0005, "step": 16788 }, { "epoch": 3.42, "learning_rate": 6.941527741906397e-05, "loss": 0.0152, "step": 16789 }, { "epoch": 3.42, "learning_rate": 6.939892779771108e-05, "loss": 0.0119, "step": 16790 }, { "epoch": 3.42, "learning_rate": 6.938257952254826e-05, "loss": 0.0029, "step": 16791 }, { "epoch": 3.42, "learning_rate": 6.936623259384852e-05, "loss": 0.0063, "step": 16792 }, { "epoch": 3.42, "learning_rate": 6.934988701188493e-05, "loss": 0.0099, "step": 16793 }, { "epoch": 3.42, "learning_rate": 6.933354277693042e-05, "loss": 0.0089, "step": 16794 }, { "epoch": 3.42, "learning_rate": 6.931719988925805e-05, "loss": 0.0028, "step": 16795 }, { "epoch": 3.42, "learning_rate": 6.930085834914074e-05, "loss": 0.0037, "step": 16796 }, { "epoch": 3.42, "learning_rate": 6.92845181568514e-05, "loss": 0.0015, "step": 16797 }, { "epoch": 3.42, "learning_rate": 6.9268179312663e-05, "loss": 0.0027, "step": 16798 }, { "epoch": 3.42, "learning_rate": 6.925184181684843e-05, "loss": 0.0041, "step": 16799 }, { "epoch": 3.42, "learning_rate": 6.923550566968043e-05, "loss": 0.0015, "step": 16800 }, { "epoch": 3.42, "learning_rate": 6.921917087143205e-05, "loss": 0.0081, "step": 16801 }, { "epoch": 3.42, "learning_rate": 6.920283742237587e-05, "loss": 0.0043, "step": 16802 }, { "epoch": 3.42, "learning_rate": 6.918650532278496e-05, "loss": 0.0022, "step": 16803 }, { "epoch": 3.42, "learning_rate": 6.917017457293188e-05, "loss": 0.0032, "step": 16804 }, { "epoch": 3.42, "learning_rate": 6.915384517308945e-05, "loss": 0.0004, "step": 16805 }, { "epoch": 3.42, "learning_rate": 6.913751712353045e-05, "loss": 0.0013, "step": 16806 }, { "epoch": 3.42, "learning_rate": 6.912119042452752e-05, "loss": 0.0026, "step": 16807 }, { "epoch": 3.42, "learning_rate": 6.91048650763534e-05, "loss": 0.0015, "step": 16808 }, { "epoch": 3.42, "learning_rate": 6.908854107928073e-05, "loss": 0.0106, "step": 16809 }, { "epoch": 3.42, "learning_rate": 6.907221843358215e-05, "loss": 0.0014, "step": 16810 }, { "epoch": 3.42, "learning_rate": 6.90558971395303e-05, "loss": 0.0118, "step": 16811 }, { "epoch": 3.42, "learning_rate": 6.903957719739779e-05, "loss": 0.0041, "step": 16812 }, { "epoch": 3.42, "learning_rate": 6.902325860745707e-05, "loss": 0.0101, "step": 16813 }, { "epoch": 3.42, "learning_rate": 6.900694136998089e-05, "loss": 0.0079, "step": 16814 }, { "epoch": 3.42, "learning_rate": 6.899062548524158e-05, "loss": 0.0042, "step": 16815 }, { "epoch": 3.42, "learning_rate": 6.897431095351182e-05, "loss": 0.0119, "step": 16816 }, { "epoch": 3.42, "learning_rate": 6.895799777506398e-05, "loss": 0.0167, "step": 16817 }, { "epoch": 3.42, "learning_rate": 6.89416859501705e-05, "loss": 0.0023, "step": 16818 }, { "epoch": 3.42, "learning_rate": 6.892537547910397e-05, "loss": 0.0101, "step": 16819 }, { "epoch": 3.42, "learning_rate": 6.890906636213661e-05, "loss": 0.0023, "step": 16820 }, { "epoch": 3.43, "learning_rate": 6.889275859954103e-05, "loss": 0.0147, "step": 16821 }, { "epoch": 3.43, "learning_rate": 6.887645219158941e-05, "loss": 0.0032, "step": 16822 }, { "epoch": 3.43, "learning_rate": 6.886014713855418e-05, "loss": 0.0091, "step": 16823 }, { "epoch": 3.43, "learning_rate": 6.884384344070765e-05, "loss": 0.0094, "step": 16824 }, { "epoch": 3.43, "learning_rate": 6.882754109832214e-05, "loss": 0.0073, "step": 16825 }, { "epoch": 3.43, "learning_rate": 6.88112401116699e-05, "loss": 0.0011, "step": 16826 }, { "epoch": 3.43, "learning_rate": 6.879494048102321e-05, "loss": 0.0031, "step": 16827 }, { "epoch": 3.43, "learning_rate": 6.877864220665431e-05, "loss": 0.0036, "step": 16828 }, { "epoch": 3.43, "learning_rate": 6.876234528883538e-05, "loss": 0.0015, "step": 16829 }, { "epoch": 3.43, "learning_rate": 6.87460497278387e-05, "loss": 0.005, "step": 16830 }, { "epoch": 3.43, "learning_rate": 6.872975552393626e-05, "loss": 0.0044, "step": 16831 }, { "epoch": 3.43, "learning_rate": 6.871346267740041e-05, "loss": 0.0035, "step": 16832 }, { "epoch": 3.43, "learning_rate": 6.869717118850308e-05, "loss": 0.0112, "step": 16833 }, { "epoch": 3.43, "learning_rate": 6.868088105751655e-05, "loss": 0.0052, "step": 16834 }, { "epoch": 3.43, "learning_rate": 6.866459228471276e-05, "loss": 0.0046, "step": 16835 }, { "epoch": 3.43, "learning_rate": 6.864830487036381e-05, "loss": 0.0014, "step": 16836 }, { "epoch": 3.43, "learning_rate": 6.863201881474175e-05, "loss": 0.0039, "step": 16837 }, { "epoch": 3.43, "learning_rate": 6.861573411811854e-05, "loss": 0.0016, "step": 16838 }, { "epoch": 3.43, "learning_rate": 6.85994507807662e-05, "loss": 0.0013, "step": 16839 }, { "epoch": 3.43, "learning_rate": 6.85831688029567e-05, "loss": 0.004, "step": 16840 }, { "epoch": 3.43, "learning_rate": 6.856688818496196e-05, "loss": 0.0029, "step": 16841 }, { "epoch": 3.43, "learning_rate": 6.855060892705391e-05, "loss": 0.0069, "step": 16842 }, { "epoch": 3.43, "learning_rate": 6.853433102950443e-05, "loss": 0.0118, "step": 16843 }, { "epoch": 3.43, "learning_rate": 6.85180544925854e-05, "loss": 0.0168, "step": 16844 }, { "epoch": 3.43, "learning_rate": 6.850177931656872e-05, "loss": 0.0087, "step": 16845 }, { "epoch": 3.43, "learning_rate": 6.848550550172604e-05, "loss": 0.0014, "step": 16846 }, { "epoch": 3.43, "learning_rate": 6.846923304832936e-05, "loss": 0.0043, "step": 16847 }, { "epoch": 3.43, "learning_rate": 6.845296195665038e-05, "loss": 0.0027, "step": 16848 }, { "epoch": 3.43, "learning_rate": 6.843669222696087e-05, "loss": 0.0048, "step": 16849 }, { "epoch": 3.43, "learning_rate": 6.842042385953262e-05, "loss": 0.0041, "step": 16850 }, { "epoch": 3.43, "learning_rate": 6.840415685463718e-05, "loss": 0.0038, "step": 16851 }, { "epoch": 3.43, "learning_rate": 6.838789121254645e-05, "loss": 0.0079, "step": 16852 }, { "epoch": 3.43, "learning_rate": 6.837162693353193e-05, "loss": 0.0039, "step": 16853 }, { "epoch": 3.43, "learning_rate": 6.835536401786532e-05, "loss": 0.0135, "step": 16854 }, { "epoch": 3.43, "learning_rate": 6.833910246581827e-05, "loss": 0.0048, "step": 16855 }, { "epoch": 3.43, "learning_rate": 6.832284227766233e-05, "loss": 0.0038, "step": 16856 }, { "epoch": 3.43, "learning_rate": 6.83065834536691e-05, "loss": 0.0022, "step": 16857 }, { "epoch": 3.43, "learning_rate": 6.829032599411016e-05, "loss": 0.0009, "step": 16858 }, { "epoch": 3.43, "learning_rate": 6.827406989925697e-05, "loss": 0.007, "step": 16859 }, { "epoch": 3.43, "learning_rate": 6.825781516938111e-05, "loss": 0.0134, "step": 16860 }, { "epoch": 3.43, "learning_rate": 6.824156180475404e-05, "loss": 0.0015, "step": 16861 }, { "epoch": 3.43, "learning_rate": 6.82253098056472e-05, "loss": 0.012, "step": 16862 }, { "epoch": 3.43, "learning_rate": 6.820905917233212e-05, "loss": 0.0013, "step": 16863 }, { "epoch": 3.43, "learning_rate": 6.819280990508003e-05, "loss": 0.0069, "step": 16864 }, { "epoch": 3.43, "learning_rate": 6.817656200416255e-05, "loss": 0.0007, "step": 16865 }, { "epoch": 3.43, "learning_rate": 6.81603154698508e-05, "loss": 0.001, "step": 16866 }, { "epoch": 3.43, "learning_rate": 6.814407030241641e-05, "loss": 0.0036, "step": 16867 }, { "epoch": 3.43, "learning_rate": 6.812782650213048e-05, "loss": 0.0173, "step": 16868 }, { "epoch": 3.43, "learning_rate": 6.811158406926441e-05, "loss": 0.0019, "step": 16869 }, { "epoch": 3.44, "learning_rate": 6.809534300408945e-05, "loss": 0.0052, "step": 16870 }, { "epoch": 3.44, "learning_rate": 6.807910330687682e-05, "loss": 0.0024, "step": 16871 }, { "epoch": 3.44, "learning_rate": 6.806286497789791e-05, "loss": 0.0057, "step": 16872 }, { "epoch": 3.44, "learning_rate": 6.804662801742377e-05, "loss": 0.0038, "step": 16873 }, { "epoch": 3.44, "learning_rate": 6.803039242572563e-05, "loss": 0.0027, "step": 16874 }, { "epoch": 3.44, "learning_rate": 6.801415820307467e-05, "loss": 0.0048, "step": 16875 }, { "epoch": 3.44, "learning_rate": 6.799792534974203e-05, "loss": 0.0015, "step": 16876 }, { "epoch": 3.44, "learning_rate": 6.798169386599881e-05, "loss": 0.004, "step": 16877 }, { "epoch": 3.44, "learning_rate": 6.796546375211614e-05, "loss": 0.0056, "step": 16878 }, { "epoch": 3.44, "learning_rate": 6.794923500836509e-05, "loss": 0.0081, "step": 16879 }, { "epoch": 3.44, "learning_rate": 6.793300763501666e-05, "loss": 0.0038, "step": 16880 }, { "epoch": 3.44, "learning_rate": 6.7916781632342e-05, "loss": 0.0037, "step": 16881 }, { "epoch": 3.44, "learning_rate": 6.79005570006119e-05, "loss": 0.0052, "step": 16882 }, { "epoch": 3.44, "learning_rate": 6.78843337400976e-05, "loss": 0.0264, "step": 16883 }, { "epoch": 3.44, "learning_rate": 6.786811185106981e-05, "loss": 0.0091, "step": 16884 }, { "epoch": 3.44, "learning_rate": 6.785189133379971e-05, "loss": 0.0135, "step": 16885 }, { "epoch": 3.44, "learning_rate": 6.783567218855802e-05, "loss": 0.009, "step": 16886 }, { "epoch": 3.44, "learning_rate": 6.78194544156157e-05, "loss": 0.0057, "step": 16887 }, { "epoch": 3.44, "learning_rate": 6.780323801524362e-05, "loss": 0.0033, "step": 16888 }, { "epoch": 3.44, "learning_rate": 6.778702298771264e-05, "loss": 0.0031, "step": 16889 }, { "epoch": 3.44, "learning_rate": 6.777080933329354e-05, "loss": 0.0017, "step": 16890 }, { "epoch": 3.44, "learning_rate": 6.775459705225715e-05, "loss": 0.0004, "step": 16891 }, { "epoch": 3.44, "learning_rate": 6.773838614487424e-05, "loss": 0.0073, "step": 16892 }, { "epoch": 3.44, "learning_rate": 6.772217661141557e-05, "loss": 0.0004, "step": 16893 }, { "epoch": 3.44, "learning_rate": 6.770596845215185e-05, "loss": 0.0072, "step": 16894 }, { "epoch": 3.44, "learning_rate": 6.76897616673538e-05, "loss": 0.0078, "step": 16895 }, { "epoch": 3.44, "learning_rate": 6.767355625729215e-05, "loss": 0.0026, "step": 16896 }, { "epoch": 3.44, "learning_rate": 6.765735222223741e-05, "loss": 0.001, "step": 16897 }, { "epoch": 3.44, "learning_rate": 6.764114956246045e-05, "loss": 0.0044, "step": 16898 }, { "epoch": 3.44, "learning_rate": 6.762494827823162e-05, "loss": 0.0081, "step": 16899 }, { "epoch": 3.44, "learning_rate": 6.760874836982171e-05, "loss": 0.004, "step": 16900 }, { "epoch": 3.44, "learning_rate": 6.759254983750127e-05, "loss": 0.0126, "step": 16901 }, { "epoch": 3.44, "learning_rate": 6.75763526815407e-05, "loss": 0.0039, "step": 16902 }, { "epoch": 3.44, "learning_rate": 6.756015690221076e-05, "loss": 0.0063, "step": 16903 }, { "epoch": 3.44, "learning_rate": 6.754396249978173e-05, "loss": 0.0012, "step": 16904 }, { "epoch": 3.44, "learning_rate": 6.752776947452418e-05, "loss": 0.0115, "step": 16905 }, { "epoch": 3.44, "learning_rate": 6.751157782670856e-05, "loss": 0.0049, "step": 16906 }, { "epoch": 3.44, "learning_rate": 6.749538755660531e-05, "loss": 0.0085, "step": 16907 }, { "epoch": 3.44, "learning_rate": 6.747919866448481e-05, "loss": 0.0046, "step": 16908 }, { "epoch": 3.44, "learning_rate": 6.746301115061747e-05, "loss": 0.0022, "step": 16909 }, { "epoch": 3.44, "learning_rate": 6.744682501527363e-05, "loss": 0.0066, "step": 16910 }, { "epoch": 3.44, "learning_rate": 6.743064025872367e-05, "loss": 0.0086, "step": 16911 }, { "epoch": 3.44, "learning_rate": 6.741445688123785e-05, "loss": 0.0009, "step": 16912 }, { "epoch": 3.44, "learning_rate": 6.739827488308652e-05, "loss": 0.0093, "step": 16913 }, { "epoch": 3.44, "learning_rate": 6.738209426453994e-05, "loss": 0.001, "step": 16914 }, { "epoch": 3.44, "learning_rate": 6.736591502586824e-05, "loss": 0.0059, "step": 16915 }, { "epoch": 3.44, "learning_rate": 6.734973716734187e-05, "loss": 0.0187, "step": 16916 }, { "epoch": 3.44, "learning_rate": 6.733356068923079e-05, "loss": 0.0064, "step": 16917 }, { "epoch": 3.44, "learning_rate": 6.731738559180539e-05, "loss": 0.0037, "step": 16918 }, { "epoch": 3.45, "learning_rate": 6.730121187533566e-05, "loss": 0.0125, "step": 16919 }, { "epoch": 3.45, "learning_rate": 6.728503954009181e-05, "loss": 0.0014, "step": 16920 }, { "epoch": 3.45, "learning_rate": 6.726886858634393e-05, "loss": 0.0008, "step": 16921 }, { "epoch": 3.45, "learning_rate": 6.725269901436213e-05, "loss": 0.0094, "step": 16922 }, { "epoch": 3.45, "learning_rate": 6.723653082441642e-05, "loss": 0.0007, "step": 16923 }, { "epoch": 3.45, "learning_rate": 6.722036401677691e-05, "loss": 0.0128, "step": 16924 }, { "epoch": 3.45, "learning_rate": 6.720419859171355e-05, "loss": 0.0016, "step": 16925 }, { "epoch": 3.45, "learning_rate": 6.718803454949637e-05, "loss": 0.006, "step": 16926 }, { "epoch": 3.45, "learning_rate": 6.717187189039538e-05, "loss": 0.0029, "step": 16927 }, { "epoch": 3.45, "learning_rate": 6.715571061468037e-05, "loss": 0.0047, "step": 16928 }, { "epoch": 3.45, "learning_rate": 6.71395507226215e-05, "loss": 0.0018, "step": 16929 }, { "epoch": 3.45, "learning_rate": 6.712339221448841e-05, "loss": 0.0041, "step": 16930 }, { "epoch": 3.45, "learning_rate": 6.710723509055119e-05, "loss": 0.0018, "step": 16931 }, { "epoch": 3.45, "learning_rate": 6.709107935107965e-05, "loss": 0.0009, "step": 16932 }, { "epoch": 3.45, "learning_rate": 6.707492499634348e-05, "loss": 0.0035, "step": 16933 }, { "epoch": 3.45, "learning_rate": 6.705877202661272e-05, "loss": 0.0026, "step": 16934 }, { "epoch": 3.45, "learning_rate": 6.70426204421569e-05, "loss": 0.0072, "step": 16935 }, { "epoch": 3.45, "learning_rate": 6.702647024324604e-05, "loss": 0.0034, "step": 16936 }, { "epoch": 3.45, "learning_rate": 6.701032143014967e-05, "loss": 0.0031, "step": 16937 }, { "epoch": 3.45, "learning_rate": 6.69941740031376e-05, "loss": 0.0108, "step": 16938 }, { "epoch": 3.45, "learning_rate": 6.697802796247951e-05, "loss": 0.0027, "step": 16939 }, { "epoch": 3.45, "learning_rate": 6.696188330844508e-05, "loss": 0.0008, "step": 16940 }, { "epoch": 3.45, "learning_rate": 6.694574004130393e-05, "loss": 0.0063, "step": 16941 }, { "epoch": 3.45, "learning_rate": 6.69295981613257e-05, "loss": 0.0106, "step": 16942 }, { "epoch": 3.45, "learning_rate": 6.691345766877999e-05, "loss": 0.0051, "step": 16943 }, { "epoch": 3.45, "learning_rate": 6.689731856393636e-05, "loss": 0.0019, "step": 16944 }, { "epoch": 3.45, "learning_rate": 6.68811808470644e-05, "loss": 0.0057, "step": 16945 }, { "epoch": 3.45, "learning_rate": 6.68650445184336e-05, "loss": 0.0018, "step": 16946 }, { "epoch": 3.45, "learning_rate": 6.684890957831354e-05, "loss": 0.0047, "step": 16947 }, { "epoch": 3.45, "learning_rate": 6.683277602697356e-05, "loss": 0.0014, "step": 16948 }, { "epoch": 3.45, "learning_rate": 6.681664386468331e-05, "loss": 0.0032, "step": 16949 }, { "epoch": 3.45, "learning_rate": 6.6800513091712e-05, "loss": 0.0056, "step": 16950 }, { "epoch": 3.45, "learning_rate": 6.67843837083293e-05, "loss": 0.0067, "step": 16951 }, { "epoch": 3.45, "learning_rate": 6.67682557148044e-05, "loss": 0.0019, "step": 16952 }, { "epoch": 3.45, "learning_rate": 6.675212911140669e-05, "loss": 0.0097, "step": 16953 }, { "epoch": 3.45, "learning_rate": 6.673600389840569e-05, "loss": 0.0094, "step": 16954 }, { "epoch": 3.45, "learning_rate": 6.671988007607054e-05, "loss": 0.0061, "step": 16955 }, { "epoch": 3.45, "learning_rate": 6.670375764467058e-05, "loss": 0.0024, "step": 16956 }, { "epoch": 3.45, "learning_rate": 6.668763660447513e-05, "loss": 0.0023, "step": 16957 }, { "epoch": 3.45, "learning_rate": 6.667151695575338e-05, "loss": 0.0005, "step": 16958 }, { "epoch": 3.45, "learning_rate": 6.665539869877459e-05, "loss": 0.0048, "step": 16959 }, { "epoch": 3.45, "learning_rate": 6.663928183380798e-05, "loss": 0.0053, "step": 16960 }, { "epoch": 3.45, "learning_rate": 6.662316636112272e-05, "loss": 0.0035, "step": 16961 }, { "epoch": 3.45, "learning_rate": 6.660705228098798e-05, "loss": 0.0054, "step": 16962 }, { "epoch": 3.45, "learning_rate": 6.659093959367286e-05, "loss": 0.0022, "step": 16963 }, { "epoch": 3.45, "learning_rate": 6.657482829944648e-05, "loss": 0.0063, "step": 16964 }, { "epoch": 3.45, "learning_rate": 6.655871839857802e-05, "loss": 0.0152, "step": 16965 }, { "epoch": 3.45, "learning_rate": 6.654260989133636e-05, "loss": 0.0059, "step": 16966 }, { "epoch": 3.45, "learning_rate": 6.652650277799076e-05, "loss": 0.0003, "step": 16967 }, { "epoch": 3.46, "learning_rate": 6.651039705881001e-05, "loss": 0.0044, "step": 16968 }, { "epoch": 3.46, "learning_rate": 6.649429273406335e-05, "loss": 0.0011, "step": 16969 }, { "epoch": 3.46, "learning_rate": 6.647818980401957e-05, "loss": 0.0127, "step": 16970 }, { "epoch": 3.46, "learning_rate": 6.646208826894768e-05, "loss": 0.0076, "step": 16971 }, { "epoch": 3.46, "learning_rate": 6.644598812911662e-05, "loss": 0.006, "step": 16972 }, { "epoch": 3.46, "learning_rate": 6.642988938479526e-05, "loss": 0.0061, "step": 16973 }, { "epoch": 3.46, "learning_rate": 6.641379203625249e-05, "loss": 0.0041, "step": 16974 }, { "epoch": 3.46, "learning_rate": 6.639769608375718e-05, "loss": 0.0029, "step": 16975 }, { "epoch": 3.46, "learning_rate": 6.638160152757817e-05, "loss": 0.0014, "step": 16976 }, { "epoch": 3.46, "learning_rate": 6.636550836798424e-05, "loss": 0.0054, "step": 16977 }, { "epoch": 3.46, "learning_rate": 6.634941660524424e-05, "loss": 0.0017, "step": 16978 }, { "epoch": 3.46, "learning_rate": 6.633332623962679e-05, "loss": 0.0054, "step": 16979 }, { "epoch": 3.46, "learning_rate": 6.631723727140082e-05, "loss": 0.0055, "step": 16980 }, { "epoch": 3.46, "learning_rate": 6.630114970083486e-05, "loss": 0.012, "step": 16981 }, { "epoch": 3.46, "learning_rate": 6.628506352819779e-05, "loss": 0.009, "step": 16982 }, { "epoch": 3.46, "learning_rate": 6.626897875375813e-05, "loss": 0.0045, "step": 16983 }, { "epoch": 3.46, "learning_rate": 6.625289537778452e-05, "loss": 0.0004, "step": 16984 }, { "epoch": 3.46, "learning_rate": 6.623681340054575e-05, "loss": 0.0046, "step": 16985 }, { "epoch": 3.46, "learning_rate": 6.62207328223102e-05, "loss": 0.0051, "step": 16986 }, { "epoch": 3.46, "learning_rate": 6.620465364334667e-05, "loss": 0.0006, "step": 16987 }, { "epoch": 3.46, "learning_rate": 6.618857586392355e-05, "loss": 0.0069, "step": 16988 }, { "epoch": 3.46, "learning_rate": 6.617249948430941e-05, "loss": 0.0025, "step": 16989 }, { "epoch": 3.46, "learning_rate": 6.615642450477276e-05, "loss": 0.0061, "step": 16990 }, { "epoch": 3.46, "learning_rate": 6.614035092558209e-05, "loss": 0.0016, "step": 16991 }, { "epoch": 3.46, "learning_rate": 6.612427874700586e-05, "loss": 0.0007, "step": 16992 }, { "epoch": 3.46, "learning_rate": 6.61082079693125e-05, "loss": 0.0235, "step": 16993 }, { "epoch": 3.46, "learning_rate": 6.609213859277043e-05, "loss": 0.0019, "step": 16994 }, { "epoch": 3.46, "learning_rate": 6.607607061764804e-05, "loss": 0.004, "step": 16995 }, { "epoch": 3.46, "learning_rate": 6.606000404421365e-05, "loss": 0.0043, "step": 16996 }, { "epoch": 3.46, "learning_rate": 6.604393887273568e-05, "loss": 0.005, "step": 16997 }, { "epoch": 3.46, "learning_rate": 6.602787510348245e-05, "loss": 0.0082, "step": 16998 }, { "epoch": 3.46, "learning_rate": 6.60118127367221e-05, "loss": 0.0076, "step": 16999 }, { "epoch": 3.46, "learning_rate": 6.599575177272313e-05, "loss": 0.0004, "step": 17000 }, { "epoch": 3.46, "learning_rate": 6.597969221175363e-05, "loss": 0.0113, "step": 17001 }, { "epoch": 3.46, "learning_rate": 6.596363405408185e-05, "loss": 0.002, "step": 17002 }, { "epoch": 3.46, "learning_rate": 6.594757729997602e-05, "loss": 0.0012, "step": 17003 }, { "epoch": 3.46, "learning_rate": 6.593152194970431e-05, "loss": 0.0014, "step": 17004 }, { "epoch": 3.46, "learning_rate": 6.591546800353489e-05, "loss": 0.0055, "step": 17005 }, { "epoch": 3.46, "learning_rate": 6.589941546173586e-05, "loss": 0.0041, "step": 17006 }, { "epoch": 3.46, "learning_rate": 6.588336432457533e-05, "loss": 0.0031, "step": 17007 }, { "epoch": 3.46, "learning_rate": 6.58673145923214e-05, "loss": 0.0025, "step": 17008 }, { "epoch": 3.46, "learning_rate": 6.585126626524214e-05, "loss": 0.0045, "step": 17009 }, { "epoch": 3.46, "learning_rate": 6.583521934360558e-05, "loss": 0.0028, "step": 17010 }, { "epoch": 3.46, "learning_rate": 6.581917382767978e-05, "loss": 0.007, "step": 17011 }, { "epoch": 3.46, "learning_rate": 6.580312971773256e-05, "loss": 0.0027, "step": 17012 }, { "epoch": 3.46, "learning_rate": 6.578708701403207e-05, "loss": 0.006, "step": 17013 }, { "epoch": 3.46, "learning_rate": 6.577104571684619e-05, "loss": 0.013, "step": 17014 }, { "epoch": 3.46, "learning_rate": 6.575500582644284e-05, "loss": 0.0014, "step": 17015 }, { "epoch": 3.46, "learning_rate": 6.573896734308996e-05, "loss": 0.0024, "step": 17016 }, { "epoch": 3.46, "learning_rate": 6.572293026705529e-05, "loss": 0.003, "step": 17017 }, { "epoch": 3.47, "learning_rate": 6.570689459860687e-05, "loss": 0.003, "step": 17018 }, { "epoch": 3.47, "learning_rate": 6.56908603380123e-05, "loss": 0.0017, "step": 17019 }, { "epoch": 3.47, "learning_rate": 6.567482748553964e-05, "loss": 0.0013, "step": 17020 }, { "epoch": 3.47, "learning_rate": 6.565879604145647e-05, "loss": 0.0078, "step": 17021 }, { "epoch": 3.47, "learning_rate": 6.564276600603061e-05, "loss": 0.0027, "step": 17022 }, { "epoch": 3.47, "learning_rate": 6.56267373795298e-05, "loss": 0.0036, "step": 17023 }, { "epoch": 3.47, "learning_rate": 6.561071016222174e-05, "loss": 0.0023, "step": 17024 }, { "epoch": 3.47, "learning_rate": 6.559468435437411e-05, "loss": 0.0004, "step": 17025 }, { "epoch": 3.47, "learning_rate": 6.557865995625458e-05, "loss": 0.0056, "step": 17026 }, { "epoch": 3.47, "learning_rate": 6.55626369681308e-05, "loss": 0.0008, "step": 17027 }, { "epoch": 3.47, "learning_rate": 6.554661539027033e-05, "loss": 0.0079, "step": 17028 }, { "epoch": 3.47, "learning_rate": 6.553059522294089e-05, "loss": 0.0045, "step": 17029 }, { "epoch": 3.47, "learning_rate": 6.551457646640984e-05, "loss": 0.0047, "step": 17030 }, { "epoch": 3.47, "learning_rate": 6.549855912094494e-05, "loss": 0.0055, "step": 17031 }, { "epoch": 3.47, "learning_rate": 6.548254318681352e-05, "loss": 0.0031, "step": 17032 }, { "epoch": 3.47, "learning_rate": 6.546652866428325e-05, "loss": 0.0058, "step": 17033 }, { "epoch": 3.47, "learning_rate": 6.545051555362149e-05, "loss": 0.0036, "step": 17034 }, { "epoch": 3.47, "learning_rate": 6.54345038550957e-05, "loss": 0.0035, "step": 17035 }, { "epoch": 3.47, "learning_rate": 6.541849356897335e-05, "loss": 0.0056, "step": 17036 }, { "epoch": 3.47, "learning_rate": 6.540248469552174e-05, "loss": 0.0041, "step": 17037 }, { "epoch": 3.47, "learning_rate": 6.538647723500844e-05, "loss": 0.004, "step": 17038 }, { "epoch": 3.47, "learning_rate": 6.537047118770063e-05, "loss": 0.0014, "step": 17039 }, { "epoch": 3.47, "learning_rate": 6.53544665538657e-05, "loss": 0.0036, "step": 17040 }, { "epoch": 3.47, "learning_rate": 6.533846333377096e-05, "loss": 0.0056, "step": 17041 }, { "epoch": 3.47, "learning_rate": 6.53224615276837e-05, "loss": 0.0079, "step": 17042 }, { "epoch": 3.47, "learning_rate": 6.530646113587117e-05, "loss": 0.0145, "step": 17043 }, { "epoch": 3.47, "learning_rate": 6.529046215860061e-05, "loss": 0.0104, "step": 17044 }, { "epoch": 3.47, "learning_rate": 6.527446459613921e-05, "loss": 0.0006, "step": 17045 }, { "epoch": 3.47, "learning_rate": 6.525846844875421e-05, "loss": 0.0096, "step": 17046 }, { "epoch": 3.47, "learning_rate": 6.524247371671274e-05, "loss": 0.0019, "step": 17047 }, { "epoch": 3.47, "learning_rate": 6.522648040028195e-05, "loss": 0.0019, "step": 17048 }, { "epoch": 3.47, "learning_rate": 6.521048849972902e-05, "loss": 0.0041, "step": 17049 }, { "epoch": 3.47, "learning_rate": 6.519449801532086e-05, "loss": 0.0149, "step": 17050 }, { "epoch": 3.47, "learning_rate": 6.517850894732479e-05, "loss": 0.0036, "step": 17051 }, { "epoch": 3.47, "learning_rate": 6.516252129600767e-05, "loss": 0.0034, "step": 17052 }, { "epoch": 3.47, "learning_rate": 6.514653506163659e-05, "loss": 0.0028, "step": 17053 }, { "epoch": 3.47, "learning_rate": 6.513055024447853e-05, "loss": 0.0017, "step": 17054 }, { "epoch": 3.47, "learning_rate": 6.51145668448005e-05, "loss": 0.0029, "step": 17055 }, { "epoch": 3.47, "learning_rate": 6.509858486286942e-05, "loss": 0.0037, "step": 17056 }, { "epoch": 3.47, "learning_rate": 6.508260429895227e-05, "loss": 0.0031, "step": 17057 }, { "epoch": 3.47, "learning_rate": 6.506662515331589e-05, "loss": 0.004, "step": 17058 }, { "epoch": 3.47, "learning_rate": 6.505064742622721e-05, "loss": 0.0009, "step": 17059 }, { "epoch": 3.47, "learning_rate": 6.503467111795304e-05, "loss": 0.0017, "step": 17060 }, { "epoch": 3.47, "learning_rate": 6.501869622876028e-05, "loss": 0.0021, "step": 17061 }, { "epoch": 3.47, "learning_rate": 6.500272275891574e-05, "loss": 0.0014, "step": 17062 }, { "epoch": 3.47, "learning_rate": 6.498675070868608e-05, "loss": 0.0047, "step": 17063 }, { "epoch": 3.47, "learning_rate": 6.497078007833825e-05, "loss": 0.0033, "step": 17064 }, { "epoch": 3.47, "learning_rate": 6.495481086813882e-05, "loss": 0.0028, "step": 17065 }, { "epoch": 3.47, "learning_rate": 6.49388430783546e-05, "loss": 0.002, "step": 17066 }, { "epoch": 3.48, "learning_rate": 6.492287670925234e-05, "loss": 0.0063, "step": 17067 }, { "epoch": 3.48, "learning_rate": 6.490691176109852e-05, "loss": 0.0056, "step": 17068 }, { "epoch": 3.48, "learning_rate": 6.489094823416001e-05, "loss": 0.0073, "step": 17069 }, { "epoch": 3.48, "learning_rate": 6.48749861287032e-05, "loss": 0.0119, "step": 17070 }, { "epoch": 3.48, "learning_rate": 6.485902544499493e-05, "loss": 0.0002, "step": 17071 }, { "epoch": 3.48, "learning_rate": 6.484306618330159e-05, "loss": 0.0116, "step": 17072 }, { "epoch": 3.48, "learning_rate": 6.482710834388979e-05, "loss": 0.0008, "step": 17073 }, { "epoch": 3.48, "learning_rate": 6.481115192702605e-05, "loss": 0.0011, "step": 17074 }, { "epoch": 3.48, "learning_rate": 6.479519693297688e-05, "loss": 0.0055, "step": 17075 }, { "epoch": 3.48, "learning_rate": 6.477924336200877e-05, "loss": 0.0059, "step": 17076 }, { "epoch": 3.48, "learning_rate": 6.476329121438812e-05, "loss": 0.003, "step": 17077 }, { "epoch": 3.48, "learning_rate": 6.474734049038145e-05, "loss": 0.0001, "step": 17078 }, { "epoch": 3.48, "learning_rate": 6.47313911902551e-05, "loss": 0.0082, "step": 17079 }, { "epoch": 3.48, "learning_rate": 6.471544331427553e-05, "loss": 0.0053, "step": 17080 }, { "epoch": 3.48, "learning_rate": 6.469949686270893e-05, "loss": 0.0013, "step": 17081 }, { "epoch": 3.48, "learning_rate": 6.468355183582186e-05, "loss": 0.0004, "step": 17082 }, { "epoch": 3.48, "learning_rate": 6.466760823388041e-05, "loss": 0.0086, "step": 17083 }, { "epoch": 3.48, "learning_rate": 6.465166605715108e-05, "loss": 0.009, "step": 17084 }, { "epoch": 3.48, "learning_rate": 6.463572530590001e-05, "loss": 0.004, "step": 17085 }, { "epoch": 3.48, "learning_rate": 6.461978598039344e-05, "loss": 0.0021, "step": 17086 }, { "epoch": 3.48, "learning_rate": 6.46038480808976e-05, "loss": 0.0026, "step": 17087 }, { "epoch": 3.48, "learning_rate": 6.458791160767872e-05, "loss": 0.0072, "step": 17088 }, { "epoch": 3.48, "learning_rate": 6.457197656100294e-05, "loss": 0.0065, "step": 17089 }, { "epoch": 3.48, "learning_rate": 6.455604294113639e-05, "loss": 0.0013, "step": 17090 }, { "epoch": 3.48, "learning_rate": 6.45401107483452e-05, "loss": 0.0008, "step": 17091 }, { "epoch": 3.48, "learning_rate": 6.45241799828955e-05, "loss": 0.0079, "step": 17092 }, { "epoch": 3.48, "learning_rate": 6.450825064505334e-05, "loss": 0.0111, "step": 17093 }, { "epoch": 3.48, "learning_rate": 6.449232273508477e-05, "loss": 0.0086, "step": 17094 }, { "epoch": 3.48, "learning_rate": 6.447639625325587e-05, "loss": 0.0018, "step": 17095 }, { "epoch": 3.48, "learning_rate": 6.446047119983248e-05, "loss": 0.0041, "step": 17096 }, { "epoch": 3.48, "learning_rate": 6.444454757508075e-05, "loss": 0.016, "step": 17097 }, { "epoch": 3.48, "learning_rate": 6.442862537926655e-05, "loss": 0.0006, "step": 17098 }, { "epoch": 3.48, "learning_rate": 6.441270461265587e-05, "loss": 0.0047, "step": 17099 }, { "epoch": 3.48, "learning_rate": 6.43967852755146e-05, "loss": 0.0103, "step": 17100 }, { "epoch": 3.48, "learning_rate": 6.438086736810852e-05, "loss": 0.0039, "step": 17101 }, { "epoch": 3.48, "learning_rate": 6.436495089070367e-05, "loss": 0.0072, "step": 17102 }, { "epoch": 3.48, "learning_rate": 6.434903584356572e-05, "loss": 0.0056, "step": 17103 }, { "epoch": 3.48, "learning_rate": 6.433312222696058e-05, "loss": 0.0047, "step": 17104 }, { "epoch": 3.48, "learning_rate": 6.431721004115397e-05, "loss": 0.0037, "step": 17105 }, { "epoch": 3.48, "learning_rate": 6.430129928641171e-05, "loss": 0.0024, "step": 17106 }, { "epoch": 3.48, "learning_rate": 6.428538996299954e-05, "loss": 0.0127, "step": 17107 }, { "epoch": 3.48, "learning_rate": 6.426948207118312e-05, "loss": 0.001, "step": 17108 }, { "epoch": 3.48, "learning_rate": 6.425357561122819e-05, "loss": 0.0082, "step": 17109 }, { "epoch": 3.48, "learning_rate": 6.42376705834004e-05, "loss": 0.0023, "step": 17110 }, { "epoch": 3.48, "learning_rate": 6.422176698796542e-05, "loss": 0.0022, "step": 17111 }, { "epoch": 3.48, "learning_rate": 6.420586482518882e-05, "loss": 0.0068, "step": 17112 }, { "epoch": 3.48, "learning_rate": 6.418996409533631e-05, "loss": 0.0019, "step": 17113 }, { "epoch": 3.48, "learning_rate": 6.417406479867326e-05, "loss": 0.0023, "step": 17114 }, { "epoch": 3.48, "learning_rate": 6.415816693546543e-05, "loss": 0.0067, "step": 17115 }, { "epoch": 3.49, "learning_rate": 6.414227050597816e-05, "loss": 0.0105, "step": 17116 }, { "epoch": 3.49, "learning_rate": 6.412637551047713e-05, "loss": 0.0105, "step": 17117 }, { "epoch": 3.49, "learning_rate": 6.411048194922767e-05, "loss": 0.0066, "step": 17118 }, { "epoch": 3.49, "learning_rate": 6.409458982249525e-05, "loss": 0.0001, "step": 17119 }, { "epoch": 3.49, "learning_rate": 6.407869913054544e-05, "loss": 0.0048, "step": 17120 }, { "epoch": 3.49, "learning_rate": 6.406280987364345e-05, "loss": 0.0073, "step": 17121 }, { "epoch": 3.49, "learning_rate": 6.404692205205486e-05, "loss": 0.0007, "step": 17122 }, { "epoch": 3.49, "learning_rate": 6.403103566604485e-05, "loss": 0.0031, "step": 17123 }, { "epoch": 3.49, "learning_rate": 6.401515071587881e-05, "loss": 0.0064, "step": 17124 }, { "epoch": 3.49, "learning_rate": 6.399926720182209e-05, "loss": 0.0059, "step": 17125 }, { "epoch": 3.49, "learning_rate": 6.398338512413992e-05, "loss": 0.0006, "step": 17126 }, { "epoch": 3.49, "learning_rate": 6.396750448309761e-05, "loss": 0.0032, "step": 17127 }, { "epoch": 3.49, "learning_rate": 6.395162527896036e-05, "loss": 0.0121, "step": 17128 }, { "epoch": 3.49, "learning_rate": 6.393574751199339e-05, "loss": 0.0062, "step": 17129 }, { "epoch": 3.49, "learning_rate": 6.391987118246191e-05, "loss": 0.0003, "step": 17130 }, { "epoch": 3.49, "learning_rate": 6.390399629063112e-05, "loss": 0.0026, "step": 17131 }, { "epoch": 3.49, "learning_rate": 6.388812283676598e-05, "loss": 0.0019, "step": 17132 }, { "epoch": 3.49, "learning_rate": 6.387225082113186e-05, "loss": 0.0062, "step": 17133 }, { "epoch": 3.49, "learning_rate": 6.385638024399362e-05, "loss": 0.0035, "step": 17134 }, { "epoch": 3.49, "learning_rate": 6.384051110561655e-05, "loss": 0.0039, "step": 17135 }, { "epoch": 3.49, "learning_rate": 6.382464340626554e-05, "loss": 0.0046, "step": 17136 }, { "epoch": 3.49, "learning_rate": 6.380877714620563e-05, "loss": 0.0006, "step": 17137 }, { "epoch": 3.49, "learning_rate": 6.379291232570184e-05, "loss": 0.0046, "step": 17138 }, { "epoch": 3.49, "learning_rate": 6.377704894501915e-05, "loss": 0.0013, "step": 17139 }, { "epoch": 3.49, "learning_rate": 6.37611870044225e-05, "loss": 0.0022, "step": 17140 }, { "epoch": 3.49, "learning_rate": 6.374532650417681e-05, "loss": 0.0004, "step": 17141 }, { "epoch": 3.49, "learning_rate": 6.3729467444547e-05, "loss": 0.0032, "step": 17142 }, { "epoch": 3.49, "learning_rate": 6.371360982579792e-05, "loss": 0.0095, "step": 17143 }, { "epoch": 3.49, "learning_rate": 6.369775364819443e-05, "loss": 0.0008, "step": 17144 }, { "epoch": 3.49, "learning_rate": 6.368189891200137e-05, "loss": 0.0042, "step": 17145 }, { "epoch": 3.49, "learning_rate": 6.366604561748357e-05, "loss": 0.0021, "step": 17146 }, { "epoch": 3.49, "learning_rate": 6.365019376490568e-05, "loss": 0.0021, "step": 17147 }, { "epoch": 3.49, "learning_rate": 6.363434335453267e-05, "loss": 0.0012, "step": 17148 }, { "epoch": 3.49, "learning_rate": 6.361849438662907e-05, "loss": 0.0063, "step": 17149 }, { "epoch": 3.49, "learning_rate": 6.360264686145964e-05, "loss": 0.0051, "step": 17150 }, { "epoch": 3.49, "learning_rate": 6.358680077928919e-05, "loss": 0.0073, "step": 17151 }, { "epoch": 3.49, "learning_rate": 6.357095614038219e-05, "loss": 0.0041, "step": 17152 }, { "epoch": 3.49, "learning_rate": 6.355511294500346e-05, "loss": 0.0091, "step": 17153 }, { "epoch": 3.49, "learning_rate": 6.353927119341747e-05, "loss": 0.0125, "step": 17154 }, { "epoch": 3.49, "learning_rate": 6.352343088588887e-05, "loss": 0.0026, "step": 17155 }, { "epoch": 3.49, "learning_rate": 6.350759202268221e-05, "loss": 0.0009, "step": 17156 }, { "epoch": 3.49, "learning_rate": 6.349175460406201e-05, "loss": 0.0086, "step": 17157 }, { "epoch": 3.49, "learning_rate": 6.347591863029282e-05, "loss": 0.0007, "step": 17158 }, { "epoch": 3.49, "learning_rate": 6.34600841016391e-05, "loss": 0.0051, "step": 17159 }, { "epoch": 3.49, "learning_rate": 6.344425101836534e-05, "loss": 0.0011, "step": 17160 }, { "epoch": 3.49, "learning_rate": 6.342841938073598e-05, "loss": 0.0006, "step": 17161 }, { "epoch": 3.49, "learning_rate": 6.341258918901542e-05, "loss": 0.0067, "step": 17162 }, { "epoch": 3.49, "learning_rate": 6.339676044346807e-05, "loss": 0.0045, "step": 17163 }, { "epoch": 3.49, "learning_rate": 6.338093314435834e-05, "loss": 0.0036, "step": 17164 }, { "epoch": 3.5, "learning_rate": 6.336510729195046e-05, "loss": 0.0066, "step": 17165 }, { "epoch": 3.5, "learning_rate": 6.334928288650889e-05, "loss": 0.0071, "step": 17166 }, { "epoch": 3.5, "learning_rate": 6.333345992829777e-05, "loss": 0.0042, "step": 17167 }, { "epoch": 3.5, "learning_rate": 6.331763841758157e-05, "loss": 0.0083, "step": 17168 }, { "epoch": 3.5, "learning_rate": 6.330181835462438e-05, "loss": 0.0012, "step": 17169 }, { "epoch": 3.5, "learning_rate": 6.328599973969046e-05, "loss": 0.0053, "step": 17170 }, { "epoch": 3.5, "learning_rate": 6.327018257304405e-05, "loss": 0.0011, "step": 17171 }, { "epoch": 3.5, "learning_rate": 6.325436685494925e-05, "loss": 0.0038, "step": 17172 }, { "epoch": 3.5, "learning_rate": 6.323855258567038e-05, "loss": 0.0002, "step": 17173 }, { "epoch": 3.5, "learning_rate": 6.322273976547139e-05, "loss": 0.0127, "step": 17174 }, { "epoch": 3.5, "learning_rate": 6.320692839461645e-05, "loss": 0.002, "step": 17175 }, { "epoch": 3.5, "learning_rate": 6.319111847336965e-05, "loss": 0.0006, "step": 17176 }, { "epoch": 3.5, "learning_rate": 6.31753100019951e-05, "loss": 0.0017, "step": 17177 }, { "epoch": 3.5, "learning_rate": 6.315950298075662e-05, "loss": 0.0027, "step": 17178 }, { "epoch": 3.5, "learning_rate": 6.314369740991843e-05, "loss": 0.0075, "step": 17179 }, { "epoch": 3.5, "learning_rate": 6.312789328974446e-05, "loss": 0.0007, "step": 17180 }, { "epoch": 3.5, "learning_rate": 6.311209062049866e-05, "loss": 0.0016, "step": 17181 }, { "epoch": 3.5, "learning_rate": 6.309628940244498e-05, "loss": 0.0086, "step": 17182 }, { "epoch": 3.5, "learning_rate": 6.308048963584725e-05, "loss": 0.0005, "step": 17183 }, { "epoch": 3.5, "learning_rate": 6.306469132096947e-05, "loss": 0.0086, "step": 17184 }, { "epoch": 3.5, "learning_rate": 6.304889445807537e-05, "loss": 0.0012, "step": 17185 }, { "epoch": 3.5, "learning_rate": 6.303309904742898e-05, "loss": 0.0107, "step": 17186 }, { "epoch": 3.5, "learning_rate": 6.301730508929393e-05, "loss": 0.009, "step": 17187 }, { "epoch": 3.5, "learning_rate": 6.300151258393407e-05, "loss": 0.0058, "step": 17188 }, { "epoch": 3.5, "learning_rate": 6.298572153161318e-05, "loss": 0.0084, "step": 17189 }, { "epoch": 3.5, "learning_rate": 6.296993193259499e-05, "loss": 0.0005, "step": 17190 }, { "epoch": 3.5, "learning_rate": 6.295414378714322e-05, "loss": 0.0066, "step": 17191 }, { "epoch": 3.5, "learning_rate": 6.293835709552154e-05, "loss": 0.0024, "step": 17192 }, { "epoch": 3.5, "learning_rate": 6.292257185799366e-05, "loss": 0.0009, "step": 17193 }, { "epoch": 3.5, "learning_rate": 6.29067880748232e-05, "loss": 0.0126, "step": 17194 }, { "epoch": 3.5, "learning_rate": 6.289100574627378e-05, "loss": 0.0072, "step": 17195 }, { "epoch": 3.5, "learning_rate": 6.287522487260897e-05, "loss": 0.0222, "step": 17196 }, { "epoch": 3.5, "learning_rate": 6.285944545409245e-05, "loss": 0.0063, "step": 17197 }, { "epoch": 3.5, "learning_rate": 6.284366749098755e-05, "loss": 0.0102, "step": 17198 }, { "epoch": 3.5, "learning_rate": 6.282789098355805e-05, "loss": 0.0011, "step": 17199 }, { "epoch": 3.5, "learning_rate": 6.281211593206724e-05, "loss": 0.0109, "step": 17200 }, { "epoch": 3.5, "learning_rate": 6.27963423367787e-05, "loss": 0.0052, "step": 17201 }, { "epoch": 3.5, "learning_rate": 6.278057019795585e-05, "loss": 0.0163, "step": 17202 }, { "epoch": 3.5, "learning_rate": 6.276479951586204e-05, "loss": 0.0029, "step": 17203 }, { "epoch": 3.5, "learning_rate": 6.274903029076086e-05, "loss": 0.0029, "step": 17204 }, { "epoch": 3.5, "learning_rate": 6.273326252291553e-05, "loss": 0.0021, "step": 17205 }, { "epoch": 3.5, "learning_rate": 6.271749621258943e-05, "loss": 0.0042, "step": 17206 }, { "epoch": 3.5, "learning_rate": 6.27017313600459e-05, "loss": 0.0037, "step": 17207 }, { "epoch": 3.5, "learning_rate": 6.268596796554825e-05, "loss": 0.0028, "step": 17208 }, { "epoch": 3.5, "learning_rate": 6.267020602935976e-05, "loss": 0.0098, "step": 17209 }, { "epoch": 3.5, "learning_rate": 6.265444555174367e-05, "loss": 0.0012, "step": 17210 }, { "epoch": 3.5, "learning_rate": 6.26386865329632e-05, "loss": 0.0011, "step": 17211 }, { "epoch": 3.5, "learning_rate": 6.262292897328158e-05, "loss": 0.0072, "step": 17212 }, { "epoch": 3.5, "learning_rate": 6.2607172872962e-05, "loss": 0.0029, "step": 17213 }, { "epoch": 3.51, "learning_rate": 6.259141823226758e-05, "loss": 0.0021, "step": 17214 }, { "epoch": 3.51, "learning_rate": 6.257566505146154e-05, "loss": 0.0021, "step": 17215 }, { "epoch": 3.51, "learning_rate": 6.25599133308068e-05, "loss": 0.0015, "step": 17216 }, { "epoch": 3.51, "learning_rate": 6.254416307056666e-05, "loss": 0.0016, "step": 17217 }, { "epoch": 3.51, "learning_rate": 6.252841427100398e-05, "loss": 0.0025, "step": 17218 }, { "epoch": 3.51, "learning_rate": 6.251266693238202e-05, "loss": 0.0032, "step": 17219 }, { "epoch": 3.51, "learning_rate": 6.24969210549636e-05, "loss": 0.0009, "step": 17220 }, { "epoch": 3.51, "learning_rate": 6.248117663901178e-05, "loss": 0.0051, "step": 17221 }, { "epoch": 3.51, "learning_rate": 6.24654336847895e-05, "loss": 0.0065, "step": 17222 }, { "epoch": 3.51, "learning_rate": 6.244969219255972e-05, "loss": 0.0019, "step": 17223 }, { "epoch": 3.51, "learning_rate": 6.243395216258534e-05, "loss": 0.0008, "step": 17224 }, { "epoch": 3.51, "learning_rate": 6.241821359512925e-05, "loss": 0.0033, "step": 17225 }, { "epoch": 3.51, "learning_rate": 6.240247649045433e-05, "loss": 0.0093, "step": 17226 }, { "epoch": 3.51, "learning_rate": 6.238674084882338e-05, "loss": 0.0057, "step": 17227 }, { "epoch": 3.51, "learning_rate": 6.237100667049931e-05, "loss": 0.0073, "step": 17228 }, { "epoch": 3.51, "learning_rate": 6.235527395574472e-05, "loss": 0.0012, "step": 17229 }, { "epoch": 3.51, "learning_rate": 6.233954270482261e-05, "loss": 0.007, "step": 17230 }, { "epoch": 3.51, "learning_rate": 6.232381291799551e-05, "loss": 0.0032, "step": 17231 }, { "epoch": 3.51, "learning_rate": 6.230808459552633e-05, "loss": 0.0015, "step": 17232 }, { "epoch": 3.51, "learning_rate": 6.229235773767762e-05, "loss": 0.0029, "step": 17233 }, { "epoch": 3.51, "learning_rate": 6.227663234471203e-05, "loss": 0.001, "step": 17234 }, { "epoch": 3.51, "learning_rate": 6.226090841689239e-05, "loss": 0.0067, "step": 17235 }, { "epoch": 3.51, "learning_rate": 6.22451859544811e-05, "loss": 0.0006, "step": 17236 }, { "epoch": 3.51, "learning_rate": 6.222946495774093e-05, "loss": 0.0004, "step": 17237 }, { "epoch": 3.51, "learning_rate": 6.221374542693435e-05, "loss": 0.0013, "step": 17238 }, { "epoch": 3.51, "learning_rate": 6.219802736232392e-05, "loss": 0.0033, "step": 17239 }, { "epoch": 3.51, "learning_rate": 6.218231076417216e-05, "loss": 0.001, "step": 17240 }, { "epoch": 3.51, "learning_rate": 6.216659563274159e-05, "loss": 0.0023, "step": 17241 }, { "epoch": 3.51, "learning_rate": 6.215088196829467e-05, "loss": 0.0059, "step": 17242 }, { "epoch": 3.51, "learning_rate": 6.213516977109384e-05, "loss": 0.0059, "step": 17243 }, { "epoch": 3.51, "learning_rate": 6.211945904140155e-05, "loss": 0.0093, "step": 17244 }, { "epoch": 3.51, "learning_rate": 6.210374977948016e-05, "loss": 0.0005, "step": 17245 }, { "epoch": 3.51, "learning_rate": 6.208804198559208e-05, "loss": 0.0038, "step": 17246 }, { "epoch": 3.51, "learning_rate": 6.207233565999963e-05, "loss": 0.0006, "step": 17247 }, { "epoch": 3.51, "learning_rate": 6.20566308029652e-05, "loss": 0.0008, "step": 17248 }, { "epoch": 3.51, "learning_rate": 6.204092741475095e-05, "loss": 0.0064, "step": 17249 }, { "epoch": 3.51, "learning_rate": 6.202522549561935e-05, "loss": 0.0096, "step": 17250 }, { "epoch": 3.51, "learning_rate": 6.20095250458325e-05, "loss": 0.009, "step": 17251 }, { "epoch": 3.51, "learning_rate": 6.199382606565266e-05, "loss": 0.0065, "step": 17252 }, { "epoch": 3.51, "learning_rate": 6.197812855534205e-05, "loss": 0.0057, "step": 17253 }, { "epoch": 3.51, "learning_rate": 6.196243251516286e-05, "loss": 0.0004, "step": 17254 }, { "epoch": 3.51, "learning_rate": 6.194673794537722e-05, "loss": 0.0039, "step": 17255 }, { "epoch": 3.51, "learning_rate": 6.193104484624727e-05, "loss": 0.0025, "step": 17256 }, { "epoch": 3.51, "learning_rate": 6.191535321803511e-05, "loss": 0.0074, "step": 17257 }, { "epoch": 3.51, "learning_rate": 6.189966306100282e-05, "loss": 0.0072, "step": 17258 }, { "epoch": 3.51, "learning_rate": 6.188397437541247e-05, "loss": 0.0004, "step": 17259 }, { "epoch": 3.51, "learning_rate": 6.186828716152607e-05, "loss": 0.0076, "step": 17260 }, { "epoch": 3.51, "learning_rate": 6.185260141960569e-05, "loss": 0.0035, "step": 17261 }, { "epoch": 3.51, "learning_rate": 6.183691714991315e-05, "loss": 0.0031, "step": 17262 }, { "epoch": 3.52, "learning_rate": 6.182123435271058e-05, "loss": 0.0083, "step": 17263 }, { "epoch": 3.52, "learning_rate": 6.180555302825982e-05, "loss": 0.0109, "step": 17264 }, { "epoch": 3.52, "learning_rate": 6.178987317682283e-05, "loss": 0.0219, "step": 17265 }, { "epoch": 3.52, "learning_rate": 6.17741947986615e-05, "loss": 0.013, "step": 17266 }, { "epoch": 3.52, "learning_rate": 6.175851789403755e-05, "loss": 0.0101, "step": 17267 }, { "epoch": 3.52, "learning_rate": 6.174284246321302e-05, "loss": 0.0014, "step": 17268 }, { "epoch": 3.52, "learning_rate": 6.172716850644953e-05, "loss": 0.005, "step": 17269 }, { "epoch": 3.52, "learning_rate": 6.171149602400905e-05, "loss": 0.0008, "step": 17270 }, { "epoch": 3.52, "learning_rate": 6.169582501615318e-05, "loss": 0.0003, "step": 17271 }, { "epoch": 3.52, "learning_rate": 6.168015548314373e-05, "loss": 0.0038, "step": 17272 }, { "epoch": 3.52, "learning_rate": 6.166448742524239e-05, "loss": 0.0066, "step": 17273 }, { "epoch": 3.52, "learning_rate": 6.164882084271088e-05, "loss": 0.0018, "step": 17274 }, { "epoch": 3.52, "learning_rate": 6.16331557358108e-05, "loss": 0.0012, "step": 17275 }, { "epoch": 3.52, "learning_rate": 6.161749210480384e-05, "loss": 0.0014, "step": 17276 }, { "epoch": 3.52, "learning_rate": 6.160182994995161e-05, "loss": 0.0012, "step": 17277 }, { "epoch": 3.52, "learning_rate": 6.158616927151567e-05, "loss": 0.0101, "step": 17278 }, { "epoch": 3.52, "learning_rate": 6.157051006975764e-05, "loss": 0.0023, "step": 17279 }, { "epoch": 3.52, "learning_rate": 6.155485234493892e-05, "loss": 0.0037, "step": 17280 }, { "epoch": 3.52, "learning_rate": 6.153919609732122e-05, "loss": 0.0024, "step": 17281 }, { "epoch": 3.52, "learning_rate": 6.152354132716583e-05, "loss": 0.0044, "step": 17282 }, { "epoch": 3.52, "learning_rate": 6.15078880347344e-05, "loss": 0.0009, "step": 17283 }, { "epoch": 3.52, "learning_rate": 6.149223622028824e-05, "loss": 0.0069, "step": 17284 }, { "epoch": 3.52, "learning_rate": 6.147658588408881e-05, "loss": 0.0075, "step": 17285 }, { "epoch": 3.52, "learning_rate": 6.146093702639747e-05, "loss": 0.009, "step": 17286 }, { "epoch": 3.52, "learning_rate": 6.144528964747559e-05, "loss": 0.0223, "step": 17287 }, { "epoch": 3.52, "learning_rate": 6.142964374758463e-05, "loss": 0.003, "step": 17288 }, { "epoch": 3.52, "learning_rate": 6.141399932698574e-05, "loss": 0.0069, "step": 17289 }, { "epoch": 3.52, "learning_rate": 6.139835638594029e-05, "loss": 0.0027, "step": 17290 }, { "epoch": 3.52, "learning_rate": 6.138271492470952e-05, "loss": 0.003, "step": 17291 }, { "epoch": 3.52, "learning_rate": 6.136707494355471e-05, "loss": 0.0078, "step": 17292 }, { "epoch": 3.52, "learning_rate": 6.135143644273704e-05, "loss": 0.0084, "step": 17293 }, { "epoch": 3.52, "learning_rate": 6.133579942251773e-05, "loss": 0.0019, "step": 17294 }, { "epoch": 3.52, "learning_rate": 6.132016388315793e-05, "loss": 0.0025, "step": 17295 }, { "epoch": 3.52, "learning_rate": 6.130452982491878e-05, "loss": 0.0042, "step": 17296 }, { "epoch": 3.52, "learning_rate": 6.128889724806148e-05, "loss": 0.0017, "step": 17297 }, { "epoch": 3.52, "learning_rate": 6.127326615284692e-05, "loss": 0.009, "step": 17298 }, { "epoch": 3.52, "learning_rate": 6.125763653953643e-05, "loss": 0.0028, "step": 17299 }, { "epoch": 3.52, "learning_rate": 6.124200840839079e-05, "loss": 0.0021, "step": 17300 }, { "epoch": 3.52, "learning_rate": 6.122638175967127e-05, "loss": 0.0083, "step": 17301 }, { "epoch": 3.52, "learning_rate": 6.121075659363868e-05, "loss": 0.0003, "step": 17302 }, { "epoch": 3.52, "learning_rate": 6.119513291055408e-05, "loss": 0.0103, "step": 17303 }, { "epoch": 3.52, "learning_rate": 6.117951071067837e-05, "loss": 0.0113, "step": 17304 }, { "epoch": 3.52, "learning_rate": 6.116388999427252e-05, "loss": 0.0111, "step": 17305 }, { "epoch": 3.52, "learning_rate": 6.114827076159737e-05, "loss": 0.0034, "step": 17306 }, { "epoch": 3.52, "learning_rate": 6.113265301291383e-05, "loss": 0.0051, "step": 17307 }, { "epoch": 3.52, "learning_rate": 6.111703674848273e-05, "loss": 0.0032, "step": 17308 }, { "epoch": 3.52, "learning_rate": 6.11014219685649e-05, "loss": 0.0048, "step": 17309 }, { "epoch": 3.52, "learning_rate": 6.108580867342112e-05, "loss": 0.0034, "step": 17310 }, { "epoch": 3.52, "learning_rate": 6.107019686331219e-05, "loss": 0.0014, "step": 17311 }, { "epoch": 3.53, "learning_rate": 6.105458653849888e-05, "loss": 0.0034, "step": 17312 }, { "epoch": 3.53, "learning_rate": 6.103897769924176e-05, "loss": 0.0021, "step": 17313 }, { "epoch": 3.53, "learning_rate": 6.1023370345801764e-05, "loss": 0.0052, "step": 17314 }, { "epoch": 3.53, "learning_rate": 6.100776447843932e-05, "loss": 0.0009, "step": 17315 }, { "epoch": 3.53, "learning_rate": 6.0992160097415246e-05, "loss": 0.003, "step": 17316 }, { "epoch": 3.53, "learning_rate": 6.097655720299016e-05, "loss": 0.0033, "step": 17317 }, { "epoch": 3.53, "learning_rate": 6.0960955795424515e-05, "loss": 0.0018, "step": 17318 }, { "epoch": 3.53, "learning_rate": 6.0945355874979096e-05, "loss": 0.0018, "step": 17319 }, { "epoch": 3.53, "learning_rate": 6.0929757441914215e-05, "loss": 0.0104, "step": 17320 }, { "epoch": 3.53, "learning_rate": 6.091416049649062e-05, "loss": 0.0016, "step": 17321 }, { "epoch": 3.53, "learning_rate": 6.089856503896866e-05, "loss": 0.0078, "step": 17322 }, { "epoch": 3.53, "learning_rate": 6.088297106960887e-05, "loss": 0.0048, "step": 17323 }, { "epoch": 3.53, "learning_rate": 6.086737858867166e-05, "loss": 0.0115, "step": 17324 }, { "epoch": 3.53, "learning_rate": 6.08517875964175e-05, "loss": 0.0059, "step": 17325 }, { "epoch": 3.53, "learning_rate": 6.083619809310675e-05, "loss": 0.005, "step": 17326 }, { "epoch": 3.53, "learning_rate": 6.0820610078999794e-05, "loss": 0.004, "step": 17327 }, { "epoch": 3.53, "learning_rate": 6.080502355435701e-05, "loss": 0.0104, "step": 17328 }, { "epoch": 3.53, "learning_rate": 6.078943851943868e-05, "loss": 0.0045, "step": 17329 }, { "epoch": 3.53, "learning_rate": 6.077385497450518e-05, "loss": 0.0002, "step": 17330 }, { "epoch": 3.53, "learning_rate": 6.075827291981663e-05, "loss": 0.006, "step": 17331 }, { "epoch": 3.53, "learning_rate": 6.074269235563347e-05, "loss": 0.0051, "step": 17332 }, { "epoch": 3.53, "learning_rate": 6.072711328221574e-05, "loss": 0.005, "step": 17333 }, { "epoch": 3.53, "learning_rate": 6.0711535699823844e-05, "loss": 0.0103, "step": 17334 }, { "epoch": 3.53, "learning_rate": 6.069595960871778e-05, "loss": 0.0056, "step": 17335 }, { "epoch": 3.53, "learning_rate": 6.068038500915776e-05, "loss": 0.0047, "step": 17336 }, { "epoch": 3.53, "learning_rate": 6.0664811901403923e-05, "loss": 0.0165, "step": 17337 }, { "epoch": 3.53, "learning_rate": 6.064924028571636e-05, "loss": 0.0011, "step": 17338 }, { "epoch": 3.53, "learning_rate": 6.063367016235514e-05, "loss": 0.0043, "step": 17339 }, { "epoch": 3.53, "learning_rate": 6.0618101531580325e-05, "loss": 0.0082, "step": 17340 }, { "epoch": 3.53, "learning_rate": 6.060253439365194e-05, "loss": 0.0109, "step": 17341 }, { "epoch": 3.53, "learning_rate": 6.058696874882996e-05, "loss": 0.0021, "step": 17342 }, { "epoch": 3.53, "learning_rate": 6.0571404597374396e-05, "loss": 0.007, "step": 17343 }, { "epoch": 3.53, "learning_rate": 6.055584193954519e-05, "loss": 0.0062, "step": 17344 }, { "epoch": 3.53, "learning_rate": 6.0540280775602305e-05, "loss": 0.0018, "step": 17345 }, { "epoch": 3.53, "learning_rate": 6.0524721105805485e-05, "loss": 0.0066, "step": 17346 }, { "epoch": 3.53, "learning_rate": 6.050916293041478e-05, "loss": 0.0007, "step": 17347 }, { "epoch": 3.53, "learning_rate": 6.049360624969003e-05, "loss": 0.0095, "step": 17348 }, { "epoch": 3.53, "learning_rate": 6.0478051063890915e-05, "loss": 0.005, "step": 17349 }, { "epoch": 3.53, "learning_rate": 6.046249737327742e-05, "loss": 0.0114, "step": 17350 }, { "epoch": 3.53, "learning_rate": 6.044694517810915e-05, "loss": 0.0069, "step": 17351 }, { "epoch": 3.53, "learning_rate": 6.043139447864602e-05, "loss": 0.0003, "step": 17352 }, { "epoch": 3.53, "learning_rate": 6.041584527514764e-05, "loss": 0.0068, "step": 17353 }, { "epoch": 3.53, "learning_rate": 6.040029756787375e-05, "loss": 0.0108, "step": 17354 }, { "epoch": 3.53, "learning_rate": 6.0384751357084e-05, "loss": 0.0065, "step": 17355 }, { "epoch": 3.53, "learning_rate": 6.036920664303808e-05, "loss": 0.0059, "step": 17356 }, { "epoch": 3.53, "learning_rate": 6.0353663425995587e-05, "loss": 0.0105, "step": 17357 }, { "epoch": 3.53, "learning_rate": 6.0338121706216154e-05, "loss": 0.0319, "step": 17358 }, { "epoch": 3.53, "learning_rate": 6.032258148395931e-05, "loss": 0.0016, "step": 17359 }, { "epoch": 3.53, "learning_rate": 6.030704275948465e-05, "loss": 0.009, "step": 17360 }, { "epoch": 3.54, "learning_rate": 6.0291505533051695e-05, "loss": 0.0014, "step": 17361 }, { "epoch": 3.54, "learning_rate": 6.027596980491992e-05, "loss": 0.0029, "step": 17362 }, { "epoch": 3.54, "learning_rate": 6.0260435575348856e-05, "loss": 0.015, "step": 17363 }, { "epoch": 3.54, "learning_rate": 6.024490284459783e-05, "loss": 0.0053, "step": 17364 }, { "epoch": 3.54, "learning_rate": 6.022937161292645e-05, "loss": 0.0022, "step": 17365 }, { "epoch": 3.54, "learning_rate": 6.02138418805939e-05, "loss": 0.0014, "step": 17366 }, { "epoch": 3.54, "learning_rate": 6.0198313647859795e-05, "loss": 0.0035, "step": 17367 }, { "epoch": 3.54, "learning_rate": 6.0182786914983297e-05, "loss": 0.0028, "step": 17368 }, { "epoch": 3.54, "learning_rate": 6.0167261682223764e-05, "loss": 0.0007, "step": 17369 }, { "epoch": 3.54, "learning_rate": 6.015173794984064e-05, "loss": 0.0054, "step": 17370 }, { "epoch": 3.54, "learning_rate": 6.013621571809298e-05, "loss": 0.0099, "step": 17371 }, { "epoch": 3.54, "learning_rate": 6.012069498724024e-05, "loss": 0.0017, "step": 17372 }, { "epoch": 3.54, "learning_rate": 6.0105175757541504e-05, "loss": 0.0151, "step": 17373 }, { "epoch": 3.54, "learning_rate": 6.008965802925603e-05, "loss": 0.0068, "step": 17374 }, { "epoch": 3.54, "learning_rate": 6.007414180264299e-05, "loss": 0.0049, "step": 17375 }, { "epoch": 3.54, "learning_rate": 6.005862707796152e-05, "loss": 0.0063, "step": 17376 }, { "epoch": 3.54, "learning_rate": 6.004311385547075e-05, "loss": 0.0032, "step": 17377 }, { "epoch": 3.54, "learning_rate": 6.0027602135429794e-05, "loss": 0.0038, "step": 17378 }, { "epoch": 3.54, "learning_rate": 6.001209191809771e-05, "loss": 0.0006, "step": 17379 }, { "epoch": 3.54, "learning_rate": 5.999658320373356e-05, "loss": 0.0072, "step": 17380 }, { "epoch": 3.54, "learning_rate": 5.9981075992596426e-05, "loss": 0.0004, "step": 17381 }, { "epoch": 3.54, "learning_rate": 5.996557028494512e-05, "loss": 0.0059, "step": 17382 }, { "epoch": 3.54, "learning_rate": 5.995006608103886e-05, "loss": 0.0041, "step": 17383 }, { "epoch": 3.54, "learning_rate": 5.993456338113637e-05, "loss": 0.0031, "step": 17384 }, { "epoch": 3.54, "learning_rate": 5.991906218549678e-05, "loss": 0.0014, "step": 17385 }, { "epoch": 3.54, "learning_rate": 5.990356249437885e-05, "loss": 0.0084, "step": 17386 }, { "epoch": 3.54, "learning_rate": 5.988806430804149e-05, "loss": 0.003, "step": 17387 }, { "epoch": 3.54, "learning_rate": 5.987256762674357e-05, "loss": 0.006, "step": 17388 }, { "epoch": 3.54, "learning_rate": 5.9857072450743884e-05, "loss": 0.0093, "step": 17389 }, { "epoch": 3.54, "learning_rate": 5.984157878030124e-05, "loss": 0.0074, "step": 17390 }, { "epoch": 3.54, "learning_rate": 5.9826086615674424e-05, "loss": 0.0016, "step": 17391 }, { "epoch": 3.54, "learning_rate": 5.981059595712217e-05, "loss": 0.0032, "step": 17392 }, { "epoch": 3.54, "learning_rate": 5.979510680490321e-05, "loss": 0.0056, "step": 17393 }, { "epoch": 3.54, "learning_rate": 5.977961915927623e-05, "loss": 0.0051, "step": 17394 }, { "epoch": 3.54, "learning_rate": 5.9764133020499935e-05, "loss": 0.0026, "step": 17395 }, { "epoch": 3.54, "learning_rate": 5.9748648388832986e-05, "loss": 0.0039, "step": 17396 }, { "epoch": 3.54, "learning_rate": 5.973316526453389e-05, "loss": 0.0032, "step": 17397 }, { "epoch": 3.54, "learning_rate": 5.9717683647861396e-05, "loss": 0.0051, "step": 17398 }, { "epoch": 3.54, "learning_rate": 5.9702203539073974e-05, "loss": 0.0033, "step": 17399 }, { "epoch": 3.54, "learning_rate": 5.9686724938430145e-05, "loss": 0.0034, "step": 17400 }, { "epoch": 3.54, "learning_rate": 5.96712478461886e-05, "loss": 0.022, "step": 17401 }, { "epoch": 3.54, "learning_rate": 5.965577226260761e-05, "loss": 0.0047, "step": 17402 }, { "epoch": 3.54, "learning_rate": 5.964029818794586e-05, "loss": 0.0006, "step": 17403 }, { "epoch": 3.54, "learning_rate": 5.962482562246165e-05, "loss": 0.0032, "step": 17404 }, { "epoch": 3.54, "learning_rate": 5.9609354566413446e-05, "loss": 0.0081, "step": 17405 }, { "epoch": 3.54, "learning_rate": 5.959388502005965e-05, "loss": 0.0013, "step": 17406 }, { "epoch": 3.54, "learning_rate": 5.957841698365863e-05, "loss": 0.0063, "step": 17407 }, { "epoch": 3.54, "learning_rate": 5.956295045746872e-05, "loss": 0.0021, "step": 17408 }, { "epoch": 3.54, "learning_rate": 5.954748544174826e-05, "loss": 0.0112, "step": 17409 }, { "epoch": 3.55, "learning_rate": 5.9532021936755525e-05, "loss": 0.0136, "step": 17410 }, { "epoch": 3.55, "learning_rate": 5.9516559942748795e-05, "loss": 0.0074, "step": 17411 }, { "epoch": 3.55, "learning_rate": 5.9501099459986306e-05, "loss": 0.0023, "step": 17412 }, { "epoch": 3.55, "learning_rate": 5.9485640488726296e-05, "loss": 0.0006, "step": 17413 }, { "epoch": 3.55, "learning_rate": 5.9470183029227e-05, "loss": 0.0047, "step": 17414 }, { "epoch": 3.55, "learning_rate": 5.945472708174643e-05, "loss": 0.0009, "step": 17415 }, { "epoch": 3.55, "learning_rate": 5.943927264654295e-05, "loss": 0.0035, "step": 17416 }, { "epoch": 3.55, "learning_rate": 5.942381972387443e-05, "loss": 0.0051, "step": 17417 }, { "epoch": 3.55, "learning_rate": 5.940836831399922e-05, "loss": 0.0007, "step": 17418 }, { "epoch": 3.55, "learning_rate": 5.9392918417175207e-05, "loss": 0.0005, "step": 17419 }, { "epoch": 3.55, "learning_rate": 5.9377470033660476e-05, "loss": 0.0051, "step": 17420 }, { "epoch": 3.55, "learning_rate": 5.936202316371308e-05, "loss": 0.0109, "step": 17421 }, { "epoch": 3.55, "learning_rate": 5.934657780759097e-05, "loss": 0.0081, "step": 17422 }, { "epoch": 3.55, "learning_rate": 5.9331133965552144e-05, "loss": 0.0005, "step": 17423 }, { "epoch": 3.55, "learning_rate": 5.931569163785451e-05, "loss": 0.003, "step": 17424 }, { "epoch": 3.55, "learning_rate": 5.9300250824756023e-05, "loss": 0.0036, "step": 17425 }, { "epoch": 3.55, "learning_rate": 5.928481152651456e-05, "loss": 0.0107, "step": 17426 }, { "epoch": 3.55, "learning_rate": 5.926937374338803e-05, "loss": 0.0008, "step": 17427 }, { "epoch": 3.55, "learning_rate": 5.9253937475634106e-05, "loss": 0.0047, "step": 17428 }, { "epoch": 3.55, "learning_rate": 5.923850272351079e-05, "loss": 0.0071, "step": 17429 }, { "epoch": 3.55, "learning_rate": 5.922306948727579e-05, "loss": 0.0193, "step": 17430 }, { "epoch": 3.55, "learning_rate": 5.920763776718689e-05, "loss": 0.0044, "step": 17431 }, { "epoch": 3.55, "learning_rate": 5.919220756350187e-05, "loss": 0.0017, "step": 17432 }, { "epoch": 3.55, "learning_rate": 5.917677887647829e-05, "loss": 0.0054, "step": 17433 }, { "epoch": 3.55, "learning_rate": 5.916135170637406e-05, "loss": 0.0071, "step": 17434 }, { "epoch": 3.55, "learning_rate": 5.914592605344662e-05, "loss": 0.0026, "step": 17435 }, { "epoch": 3.55, "learning_rate": 5.913050191795381e-05, "loss": 0.0068, "step": 17436 }, { "epoch": 3.55, "learning_rate": 5.911507930015309e-05, "loss": 0.0009, "step": 17437 }, { "epoch": 3.55, "learning_rate": 5.909965820030212e-05, "loss": 0.0039, "step": 17438 }, { "epoch": 3.55, "learning_rate": 5.908423861865843e-05, "loss": 0.0124, "step": 17439 }, { "epoch": 3.55, "learning_rate": 5.9068820555479586e-05, "loss": 0.0037, "step": 17440 }, { "epoch": 3.55, "learning_rate": 5.905340401102306e-05, "loss": 0.0014, "step": 17441 }, { "epoch": 3.55, "learning_rate": 5.9037988985546375e-05, "loss": 0.0066, "step": 17442 }, { "epoch": 3.55, "learning_rate": 5.9022575479306974e-05, "loss": 0.003, "step": 17443 }, { "epoch": 3.55, "learning_rate": 5.900716349256231e-05, "loss": 0.0032, "step": 17444 }, { "epoch": 3.55, "learning_rate": 5.899175302556975e-05, "loss": 0.0069, "step": 17445 }, { "epoch": 3.55, "learning_rate": 5.897634407858672e-05, "loss": 0.0082, "step": 17446 }, { "epoch": 3.55, "learning_rate": 5.8960936651870625e-05, "loss": 0.0018, "step": 17447 }, { "epoch": 3.55, "learning_rate": 5.894553074567862e-05, "loss": 0.0055, "step": 17448 }, { "epoch": 3.55, "learning_rate": 5.893012636026823e-05, "loss": 0.0164, "step": 17449 }, { "epoch": 3.55, "learning_rate": 5.891472349589659e-05, "loss": 0.0003, "step": 17450 }, { "epoch": 3.55, "learning_rate": 5.8899322152821e-05, "loss": 0.0043, "step": 17451 }, { "epoch": 3.55, "learning_rate": 5.8883922331298696e-05, "loss": 0.0031, "step": 17452 }, { "epoch": 3.55, "learning_rate": 5.8868524031586834e-05, "loss": 0.008, "step": 17453 }, { "epoch": 3.55, "learning_rate": 5.885312725394274e-05, "loss": 0.0024, "step": 17454 }, { "epoch": 3.55, "learning_rate": 5.8837731998623424e-05, "loss": 0.0002, "step": 17455 }, { "epoch": 3.55, "learning_rate": 5.882233826588606e-05, "loss": 0.0082, "step": 17456 }, { "epoch": 3.55, "learning_rate": 5.880694605598777e-05, "loss": 0.0098, "step": 17457 }, { "epoch": 3.55, "learning_rate": 5.879155536918561e-05, "loss": 0.0008, "step": 17458 }, { "epoch": 3.55, "learning_rate": 5.877616620573665e-05, "loss": 0.0071, "step": 17459 }, { "epoch": 3.56, "learning_rate": 5.87607785658979e-05, "loss": 0.0045, "step": 17460 }, { "epoch": 3.56, "learning_rate": 5.874539244992639e-05, "loss": 0.0016, "step": 17461 }, { "epoch": 3.56, "learning_rate": 5.873000785807908e-05, "loss": 0.0038, "step": 17462 }, { "epoch": 3.56, "learning_rate": 5.871462479061291e-05, "loss": 0.007, "step": 17463 }, { "epoch": 3.56, "learning_rate": 5.869924324778483e-05, "loss": 0.003, "step": 17464 }, { "epoch": 3.56, "learning_rate": 5.8683863229851777e-05, "loss": 0.0006, "step": 17465 }, { "epoch": 3.56, "learning_rate": 5.8668484737070465e-05, "loss": 0.0065, "step": 17466 }, { "epoch": 3.56, "learning_rate": 5.865310776969798e-05, "loss": 0.0018, "step": 17467 }, { "epoch": 3.56, "learning_rate": 5.8637732327990914e-05, "loss": 0.0054, "step": 17468 }, { "epoch": 3.56, "learning_rate": 5.8622358412206275e-05, "loss": 0.0028, "step": 17469 }, { "epoch": 3.56, "learning_rate": 5.8606986022600694e-05, "loss": 0.0031, "step": 17470 }, { "epoch": 3.56, "learning_rate": 5.859161515943097e-05, "loss": 0.0047, "step": 17471 }, { "epoch": 3.56, "learning_rate": 5.8576245822953806e-05, "loss": 0.0017, "step": 17472 }, { "epoch": 3.56, "learning_rate": 5.856087801342592e-05, "loss": 0.0069, "step": 17473 }, { "epoch": 3.56, "learning_rate": 5.8545511731103966e-05, "loss": 0.0099, "step": 17474 }, { "epoch": 3.56, "learning_rate": 5.85301469762446e-05, "loss": 0.0022, "step": 17475 }, { "epoch": 3.56, "learning_rate": 5.851478374910446e-05, "loss": 0.0053, "step": 17476 }, { "epoch": 3.56, "learning_rate": 5.8499422049940085e-05, "loss": 0.0014, "step": 17477 }, { "epoch": 3.56, "learning_rate": 5.848406187900816e-05, "loss": 0.0033, "step": 17478 }, { "epoch": 3.56, "learning_rate": 5.846870323656503e-05, "loss": 0.0071, "step": 17479 }, { "epoch": 3.56, "learning_rate": 5.845334612286746e-05, "loss": 0.0067, "step": 17480 }, { "epoch": 3.56, "learning_rate": 5.8437990538171705e-05, "loss": 0.0115, "step": 17481 }, { "epoch": 3.56, "learning_rate": 5.842263648273439e-05, "loss": 0.0024, "step": 17482 }, { "epoch": 3.56, "learning_rate": 5.8407283956811954e-05, "loss": 0.0029, "step": 17483 }, { "epoch": 3.56, "learning_rate": 5.8391932960660676e-05, "loss": 0.002, "step": 17484 }, { "epoch": 3.56, "learning_rate": 5.8376583494537137e-05, "loss": 0.0082, "step": 17485 }, { "epoch": 3.56, "learning_rate": 5.836123555869752e-05, "loss": 0.0009, "step": 17486 }, { "epoch": 3.56, "learning_rate": 5.834588915339832e-05, "loss": 0.0009, "step": 17487 }, { "epoch": 3.56, "learning_rate": 5.833054427889575e-05, "loss": 0.0031, "step": 17488 }, { "epoch": 3.56, "learning_rate": 5.831520093544613e-05, "loss": 0.0024, "step": 17489 }, { "epoch": 3.56, "learning_rate": 5.8299859123305725e-05, "loss": 0.0065, "step": 17490 }, { "epoch": 3.56, "learning_rate": 5.828451884273076e-05, "loss": 0.0097, "step": 17491 }, { "epoch": 3.56, "learning_rate": 5.8269180093977465e-05, "loss": 0.0008, "step": 17492 }, { "epoch": 3.56, "learning_rate": 5.8253842877302e-05, "loss": 0.0016, "step": 17493 }, { "epoch": 3.56, "learning_rate": 5.823850719296056e-05, "loss": 0.0017, "step": 17494 }, { "epoch": 3.56, "learning_rate": 5.822317304120926e-05, "loss": 0.003, "step": 17495 }, { "epoch": 3.56, "learning_rate": 5.820784042230424e-05, "loss": 0.0076, "step": 17496 }, { "epoch": 3.56, "learning_rate": 5.819250933650147e-05, "loss": 0.0004, "step": 17497 }, { "epoch": 3.56, "learning_rate": 5.8177179784057205e-05, "loss": 0.0027, "step": 17498 }, { "epoch": 3.56, "learning_rate": 5.816185176522724e-05, "loss": 0.0011, "step": 17499 }, { "epoch": 3.56, "learning_rate": 5.8146525280267825e-05, "loss": 0.0012, "step": 17500 }, { "epoch": 3.56, "learning_rate": 5.8131200329434786e-05, "loss": 0.0035, "step": 17501 }, { "epoch": 3.56, "learning_rate": 5.811587691298408e-05, "loss": 0.0003, "step": 17502 }, { "epoch": 3.56, "learning_rate": 5.8100555031171694e-05, "loss": 0.0009, "step": 17503 }, { "epoch": 3.56, "learning_rate": 5.808523468425352e-05, "loss": 0.0074, "step": 17504 }, { "epoch": 3.56, "learning_rate": 5.8069915872485426e-05, "loss": 0.0022, "step": 17505 }, { "epoch": 3.56, "learning_rate": 5.805459859612326e-05, "loss": 0.0039, "step": 17506 }, { "epoch": 3.56, "learning_rate": 5.8039282855422845e-05, "loss": 0.0061, "step": 17507 }, { "epoch": 3.56, "learning_rate": 5.802396865064e-05, "loss": 0.0037, "step": 17508 }, { "epoch": 3.57, "learning_rate": 5.800865598203051e-05, "loss": 0.0135, "step": 17509 }, { "epoch": 3.57, "learning_rate": 5.79933448498501e-05, "loss": 0.0082, "step": 17510 }, { "epoch": 3.57, "learning_rate": 5.7978035254354563e-05, "loss": 0.0081, "step": 17511 }, { "epoch": 3.57, "learning_rate": 5.796272719579943e-05, "loss": 0.002, "step": 17512 }, { "epoch": 3.57, "learning_rate": 5.794742067444055e-05, "loss": 0.0023, "step": 17513 }, { "epoch": 3.57, "learning_rate": 5.7932115690533495e-05, "loss": 0.0063, "step": 17514 }, { "epoch": 3.57, "learning_rate": 5.791681224433389e-05, "loss": 0.0016, "step": 17515 }, { "epoch": 3.57, "learning_rate": 5.790151033609742e-05, "loss": 0.0117, "step": 17516 }, { "epoch": 3.57, "learning_rate": 5.788620996607944e-05, "loss": 0.0101, "step": 17517 }, { "epoch": 3.57, "learning_rate": 5.787091113453575e-05, "loss": 0.0064, "step": 17518 }, { "epoch": 3.57, "learning_rate": 5.7855613841721655e-05, "loss": 0.0051, "step": 17519 }, { "epoch": 3.57, "learning_rate": 5.7840318087892846e-05, "loss": 0.0008, "step": 17520 }, { "epoch": 3.57, "learning_rate": 5.782502387330462e-05, "loss": 0.0066, "step": 17521 }, { "epoch": 3.57, "learning_rate": 5.7809731198212494e-05, "loss": 0.0034, "step": 17522 }, { "epoch": 3.57, "learning_rate": 5.7794440062871894e-05, "loss": 0.0021, "step": 17523 }, { "epoch": 3.57, "learning_rate": 5.777915046753818e-05, "loss": 0.0057, "step": 17524 }, { "epoch": 3.57, "learning_rate": 5.776386241246672e-05, "loss": 0.0044, "step": 17525 }, { "epoch": 3.57, "learning_rate": 5.774857589791289e-05, "loss": 0.0133, "step": 17526 }, { "epoch": 3.57, "learning_rate": 5.773329092413197e-05, "loss": 0.0047, "step": 17527 }, { "epoch": 3.57, "learning_rate": 5.7718007491379254e-05, "loss": 0.0007, "step": 17528 }, { "epoch": 3.57, "learning_rate": 5.770272559991007e-05, "loss": 0.004, "step": 17529 }, { "epoch": 3.57, "learning_rate": 5.768744524997948e-05, "loss": 0.0053, "step": 17530 }, { "epoch": 3.57, "learning_rate": 5.767216644184291e-05, "loss": 0.0032, "step": 17531 }, { "epoch": 3.57, "learning_rate": 5.7656889175755335e-05, "loss": 0.0071, "step": 17532 }, { "epoch": 3.57, "learning_rate": 5.7641613451972135e-05, "loss": 0.0035, "step": 17533 }, { "epoch": 3.57, "learning_rate": 5.762633927074826e-05, "loss": 0.0018, "step": 17534 }, { "epoch": 3.57, "learning_rate": 5.761106663233885e-05, "loss": 0.009, "step": 17535 }, { "epoch": 3.57, "learning_rate": 5.7595795536999124e-05, "loss": 0.0028, "step": 17536 }, { "epoch": 3.57, "learning_rate": 5.7580525984983935e-05, "loss": 0.0014, "step": 17537 }, { "epoch": 3.57, "learning_rate": 5.7565257976548525e-05, "loss": 0.0008, "step": 17538 }, { "epoch": 3.57, "learning_rate": 5.754999151194772e-05, "loss": 0.0147, "step": 17539 }, { "epoch": 3.57, "learning_rate": 5.753472659143658e-05, "loss": 0.0086, "step": 17540 }, { "epoch": 3.57, "learning_rate": 5.751946321527006e-05, "loss": 0.0071, "step": 17541 }, { "epoch": 3.57, "learning_rate": 5.7504201383703045e-05, "loss": 0.0118, "step": 17542 }, { "epoch": 3.57, "learning_rate": 5.748894109699048e-05, "loss": 0.0085, "step": 17543 }, { "epoch": 3.57, "learning_rate": 5.747368235538724e-05, "loss": 0.0009, "step": 17544 }, { "epoch": 3.57, "learning_rate": 5.745842515914813e-05, "loss": 0.0064, "step": 17545 }, { "epoch": 3.57, "learning_rate": 5.744316950852803e-05, "loss": 0.0194, "step": 17546 }, { "epoch": 3.57, "learning_rate": 5.742791540378175e-05, "loss": 0.0002, "step": 17547 }, { "epoch": 3.57, "learning_rate": 5.7412662845163935e-05, "loss": 0.002, "step": 17548 }, { "epoch": 3.57, "learning_rate": 5.739741183292951e-05, "loss": 0.0005, "step": 17549 }, { "epoch": 3.57, "learning_rate": 5.738216236733301e-05, "loss": 0.0037, "step": 17550 }, { "epoch": 3.57, "learning_rate": 5.736691444862933e-05, "loss": 0.0023, "step": 17551 }, { "epoch": 3.57, "learning_rate": 5.735166807707299e-05, "loss": 0.006, "step": 17552 }, { "epoch": 3.57, "learning_rate": 5.7336423252918676e-05, "loss": 0.0105, "step": 17553 }, { "epoch": 3.57, "learning_rate": 5.7321179976421e-05, "loss": 0.0004, "step": 17554 }, { "epoch": 3.57, "learning_rate": 5.730593824783457e-05, "loss": 0.0067, "step": 17555 }, { "epoch": 3.57, "learning_rate": 5.7290698067413954e-05, "loss": 0.003, "step": 17556 }, { "epoch": 3.57, "learning_rate": 5.727545943541366e-05, "loss": 0.0074, "step": 17557 }, { "epoch": 3.58, "learning_rate": 5.726022235208824e-05, "loss": 0.0014, "step": 17558 }, { "epoch": 3.58, "learning_rate": 5.724498681769216e-05, "loss": 0.0034, "step": 17559 }, { "epoch": 3.58, "learning_rate": 5.7229752832479885e-05, "loss": 0.0044, "step": 17560 }, { "epoch": 3.58, "learning_rate": 5.721452039670586e-05, "loss": 0.0057, "step": 17561 }, { "epoch": 3.58, "learning_rate": 5.7199289510624525e-05, "loss": 0.006, "step": 17562 }, { "epoch": 3.58, "learning_rate": 5.718406017449014e-05, "loss": 0.0009, "step": 17563 }, { "epoch": 3.58, "learning_rate": 5.7168832388557264e-05, "loss": 0.0034, "step": 17564 }, { "epoch": 3.58, "learning_rate": 5.715360615307999e-05, "loss": 0.0065, "step": 17565 }, { "epoch": 3.58, "learning_rate": 5.7138381468312824e-05, "loss": 0.0031, "step": 17566 }, { "epoch": 3.58, "learning_rate": 5.712315833451002e-05, "loss": 0.0026, "step": 17567 }, { "epoch": 3.58, "learning_rate": 5.710793675192569e-05, "loss": 0.0005, "step": 17568 }, { "epoch": 3.58, "learning_rate": 5.7092716720814264e-05, "loss": 0.0057, "step": 17569 }, { "epoch": 3.58, "learning_rate": 5.70774982414298e-05, "loss": 0.0019, "step": 17570 }, { "epoch": 3.58, "learning_rate": 5.706228131402651e-05, "loss": 0.0021, "step": 17571 }, { "epoch": 3.58, "learning_rate": 5.7047065938858545e-05, "loss": 0.0013, "step": 17572 }, { "epoch": 3.58, "learning_rate": 5.703185211618005e-05, "loss": 0.0037, "step": 17573 }, { "epoch": 3.58, "learning_rate": 5.7016639846245124e-05, "loss": 0.0005, "step": 17574 }, { "epoch": 3.58, "learning_rate": 5.7001429129307825e-05, "loss": 0.0066, "step": 17575 }, { "epoch": 3.58, "learning_rate": 5.698621996562221e-05, "loss": 0.0046, "step": 17576 }, { "epoch": 3.58, "learning_rate": 5.697101235544227e-05, "loss": 0.0041, "step": 17577 }, { "epoch": 3.58, "learning_rate": 5.695580629902207e-05, "loss": 0.0019, "step": 17578 }, { "epoch": 3.58, "learning_rate": 5.694060179661551e-05, "loss": 0.0083, "step": 17579 }, { "epoch": 3.58, "learning_rate": 5.692539884847661e-05, "loss": 0.0097, "step": 17580 }, { "epoch": 3.58, "learning_rate": 5.6910197454859154e-05, "loss": 0.0028, "step": 17581 }, { "epoch": 3.58, "learning_rate": 5.689499761601723e-05, "loss": 0.0035, "step": 17582 }, { "epoch": 3.58, "learning_rate": 5.687979933220448e-05, "loss": 0.0006, "step": 17583 }, { "epoch": 3.58, "learning_rate": 5.686460260367495e-05, "loss": 0.0043, "step": 17584 }, { "epoch": 3.58, "learning_rate": 5.6849407430682315e-05, "loss": 0.0068, "step": 17585 }, { "epoch": 3.58, "learning_rate": 5.683421381348043e-05, "loss": 0.0076, "step": 17586 }, { "epoch": 3.58, "learning_rate": 5.681902175232302e-05, "loss": 0.0033, "step": 17587 }, { "epoch": 3.58, "learning_rate": 5.6803831247463784e-05, "loss": 0.0006, "step": 17588 }, { "epoch": 3.58, "learning_rate": 5.67886422991566e-05, "loss": 0.0114, "step": 17589 }, { "epoch": 3.58, "learning_rate": 5.677345490765497e-05, "loss": 0.0097, "step": 17590 }, { "epoch": 3.58, "learning_rate": 5.675826907321264e-05, "loss": 0.0025, "step": 17591 }, { "epoch": 3.58, "learning_rate": 5.6743084796083216e-05, "loss": 0.0114, "step": 17592 }, { "epoch": 3.58, "learning_rate": 5.67279020765203e-05, "loss": 0.0214, "step": 17593 }, { "epoch": 3.58, "learning_rate": 5.67127209147775e-05, "loss": 0.0036, "step": 17594 }, { "epoch": 3.58, "learning_rate": 5.669754131110835e-05, "loss": 0.0002, "step": 17595 }, { "epoch": 3.58, "learning_rate": 5.6682363265766376e-05, "loss": 0.0112, "step": 17596 }, { "epoch": 3.58, "learning_rate": 5.6667186779005075e-05, "loss": 0.0019, "step": 17597 }, { "epoch": 3.58, "learning_rate": 5.6652011851078e-05, "loss": 0.0112, "step": 17598 }, { "epoch": 3.58, "learning_rate": 5.663683848223843e-05, "loss": 0.009, "step": 17599 }, { "epoch": 3.58, "learning_rate": 5.662166667273999e-05, "loss": 0.0052, "step": 17600 }, { "epoch": 3.58, "learning_rate": 5.660649642283588e-05, "loss": 0.0039, "step": 17601 }, { "epoch": 3.58, "learning_rate": 5.659132773277968e-05, "loss": 0.0089, "step": 17602 }, { "epoch": 3.58, "learning_rate": 5.657616060282457e-05, "loss": 0.0032, "step": 17603 }, { "epoch": 3.58, "learning_rate": 5.656099503322393e-05, "loss": 0.015, "step": 17604 }, { "epoch": 3.58, "learning_rate": 5.654583102423104e-05, "loss": 0.0073, "step": 17605 }, { "epoch": 3.58, "learning_rate": 5.6530668576099196e-05, "loss": 0.0038, "step": 17606 }, { "epoch": 3.59, "learning_rate": 5.651550768908162e-05, "loss": 0.0038, "step": 17607 }, { "epoch": 3.59, "learning_rate": 5.650034836343152e-05, "loss": 0.0095, "step": 17608 }, { "epoch": 3.59, "learning_rate": 5.648519059940211e-05, "loss": 0.0018, "step": 17609 }, { "epoch": 3.59, "learning_rate": 5.647003439724652e-05, "loss": 0.0067, "step": 17610 }, { "epoch": 3.59, "learning_rate": 5.645487975721793e-05, "loss": 0.0124, "step": 17611 }, { "epoch": 3.59, "learning_rate": 5.64397266795694e-05, "loss": 0.0184, "step": 17612 }, { "epoch": 3.59, "learning_rate": 5.642457516455412e-05, "loss": 0.0043, "step": 17613 }, { "epoch": 3.59, "learning_rate": 5.640942521242496e-05, "loss": 0.0128, "step": 17614 }, { "epoch": 3.59, "learning_rate": 5.639427682343515e-05, "loss": 0.0251, "step": 17615 }, { "epoch": 3.59, "learning_rate": 5.637912999783752e-05, "loss": 0.0005, "step": 17616 }, { "epoch": 3.59, "learning_rate": 5.636398473588525e-05, "loss": 0.0026, "step": 17617 }, { "epoch": 3.59, "learning_rate": 5.634884103783113e-05, "loss": 0.0014, "step": 17618 }, { "epoch": 3.59, "learning_rate": 5.633369890392809e-05, "loss": 0.0059, "step": 17619 }, { "epoch": 3.59, "learning_rate": 5.631855833442918e-05, "loss": 0.003, "step": 17620 }, { "epoch": 3.59, "learning_rate": 5.6303419329587146e-05, "loss": 0.0019, "step": 17621 }, { "epoch": 3.59, "learning_rate": 5.628828188965486e-05, "loss": 0.0016, "step": 17622 }, { "epoch": 3.59, "learning_rate": 5.627314601488516e-05, "loss": 0.0007, "step": 17623 }, { "epoch": 3.59, "learning_rate": 5.625801170553086e-05, "loss": 0.005, "step": 17624 }, { "epoch": 3.59, "learning_rate": 5.62428789618447e-05, "loss": 0.0044, "step": 17625 }, { "epoch": 3.59, "learning_rate": 5.622774778407945e-05, "loss": 0.0017, "step": 17626 }, { "epoch": 3.59, "learning_rate": 5.621261817248781e-05, "loss": 0.0121, "step": 17627 }, { "epoch": 3.59, "learning_rate": 5.6197490127322494e-05, "loss": 0.0067, "step": 17628 }, { "epoch": 3.59, "learning_rate": 5.618236364883616e-05, "loss": 0.001, "step": 17629 }, { "epoch": 3.59, "learning_rate": 5.616723873728143e-05, "loss": 0.0026, "step": 17630 }, { "epoch": 3.59, "learning_rate": 5.615211539291099e-05, "loss": 0.0016, "step": 17631 }, { "epoch": 3.59, "learning_rate": 5.6136993615977276e-05, "loss": 0.0015, "step": 17632 }, { "epoch": 3.59, "learning_rate": 5.612187340673305e-05, "loss": 0.0066, "step": 17633 }, { "epoch": 3.59, "learning_rate": 5.610675476543066e-05, "loss": 0.0139, "step": 17634 }, { "epoch": 3.59, "learning_rate": 5.6091637692322784e-05, "loss": 0.0023, "step": 17635 }, { "epoch": 3.59, "learning_rate": 5.607652218766177e-05, "loss": 0.0034, "step": 17636 }, { "epoch": 3.59, "learning_rate": 5.6061408251700137e-05, "loss": 0.0087, "step": 17637 }, { "epoch": 3.59, "learning_rate": 5.604629588469029e-05, "loss": 0.0003, "step": 17638 }, { "epoch": 3.59, "learning_rate": 5.603118508688468e-05, "loss": 0.0015, "step": 17639 }, { "epoch": 3.59, "learning_rate": 5.601607585853563e-05, "loss": 0.0016, "step": 17640 }, { "epoch": 3.59, "learning_rate": 5.600096819989555e-05, "loss": 0.0115, "step": 17641 }, { "epoch": 3.59, "learning_rate": 5.5985862111216705e-05, "loss": 0.0036, "step": 17642 }, { "epoch": 3.59, "learning_rate": 5.597075759275144e-05, "loss": 0.0084, "step": 17643 }, { "epoch": 3.59, "learning_rate": 5.5955654644752085e-05, "loss": 0.0033, "step": 17644 }, { "epoch": 3.59, "learning_rate": 5.59405532674707e-05, "loss": 0.0055, "step": 17645 }, { "epoch": 3.59, "learning_rate": 5.592545346115972e-05, "loss": 0.0003, "step": 17646 }, { "epoch": 3.59, "learning_rate": 5.591035522607116e-05, "loss": 0.0041, "step": 17647 }, { "epoch": 3.59, "learning_rate": 5.589525856245731e-05, "loss": 0.0018, "step": 17648 }, { "epoch": 3.59, "learning_rate": 5.588016347057033e-05, "loss": 0.0007, "step": 17649 }, { "epoch": 3.59, "learning_rate": 5.58650699506622e-05, "loss": 0.0081, "step": 17650 }, { "epoch": 3.59, "learning_rate": 5.5849978002985177e-05, "loss": 0.0018, "step": 17651 }, { "epoch": 3.59, "learning_rate": 5.5834887627791155e-05, "loss": 0.0112, "step": 17652 }, { "epoch": 3.59, "learning_rate": 5.5819798825332354e-05, "loss": 0.0079, "step": 17653 }, { "epoch": 3.59, "learning_rate": 5.580471159586064e-05, "loss": 0.0016, "step": 17654 }, { "epoch": 3.59, "learning_rate": 5.5789625939628035e-05, "loss": 0.0022, "step": 17655 }, { "epoch": 3.6, "learning_rate": 5.5774541856886534e-05, "loss": 0.0106, "step": 17656 }, { "epoch": 3.6, "learning_rate": 5.5759459347888034e-05, "loss": 0.0048, "step": 17657 }, { "epoch": 3.6, "learning_rate": 5.5744378412884456e-05, "loss": 0.0079, "step": 17658 }, { "epoch": 3.6, "learning_rate": 5.5729299052127674e-05, "loss": 0.001, "step": 17659 }, { "epoch": 3.6, "learning_rate": 5.5714221265869554e-05, "loss": 0.0059, "step": 17660 }, { "epoch": 3.6, "learning_rate": 5.5699145054361924e-05, "loss": 0.002, "step": 17661 }, { "epoch": 3.6, "learning_rate": 5.568407041785656e-05, "loss": 0.0011, "step": 17662 }, { "epoch": 3.6, "learning_rate": 5.5668997356605265e-05, "loss": 0.0054, "step": 17663 }, { "epoch": 3.6, "learning_rate": 5.565392587085983e-05, "loss": 0.0051, "step": 17664 }, { "epoch": 3.6, "learning_rate": 5.56388559608718e-05, "loss": 0.007, "step": 17665 }, { "epoch": 3.6, "learning_rate": 5.562378762689312e-05, "loss": 0.0111, "step": 17666 }, { "epoch": 3.6, "learning_rate": 5.5608720869175225e-05, "loss": 0.0007, "step": 17667 }, { "epoch": 3.6, "learning_rate": 5.559365568796997e-05, "loss": 0.0083, "step": 17668 }, { "epoch": 3.6, "learning_rate": 5.5578592083528814e-05, "loss": 0.0199, "step": 17669 }, { "epoch": 3.6, "learning_rate": 5.55635300561034e-05, "loss": 0.0029, "step": 17670 }, { "epoch": 3.6, "learning_rate": 5.554846960594531e-05, "loss": 0.0016, "step": 17671 }, { "epoch": 3.6, "learning_rate": 5.553341073330606e-05, "loss": 0.0097, "step": 17672 }, { "epoch": 3.6, "learning_rate": 5.551835343843716e-05, "loss": 0.0094, "step": 17673 }, { "epoch": 3.6, "learning_rate": 5.550329772159011e-05, "loss": 0.0024, "step": 17674 }, { "epoch": 3.6, "learning_rate": 5.5488243583016375e-05, "loss": 0.0007, "step": 17675 }, { "epoch": 3.6, "learning_rate": 5.5473191022967364e-05, "loss": 0.0007, "step": 17676 }, { "epoch": 3.6, "learning_rate": 5.545814004169456e-05, "loss": 0.0043, "step": 17677 }, { "epoch": 3.6, "learning_rate": 5.544309063944915e-05, "loss": 0.0066, "step": 17678 }, { "epoch": 3.6, "learning_rate": 5.5428042816482685e-05, "loss": 0.0004, "step": 17679 }, { "epoch": 3.6, "learning_rate": 5.541299657304642e-05, "loss": 0.0008, "step": 17680 }, { "epoch": 3.6, "learning_rate": 5.539795190939166e-05, "loss": 0.0005, "step": 17681 }, { "epoch": 3.6, "learning_rate": 5.5382908825769727e-05, "loss": 0.0044, "step": 17682 }, { "epoch": 3.6, "learning_rate": 5.5367867322431716e-05, "loss": 0.0118, "step": 17683 }, { "epoch": 3.6, "learning_rate": 5.535282739962905e-05, "loss": 0.0013, "step": 17684 }, { "epoch": 3.6, "learning_rate": 5.533778905761272e-05, "loss": 0.0065, "step": 17685 }, { "epoch": 3.6, "learning_rate": 5.5322752296634117e-05, "loss": 0.0003, "step": 17686 }, { "epoch": 3.6, "learning_rate": 5.530771711694421e-05, "loss": 0.0016, "step": 17687 }, { "epoch": 3.6, "learning_rate": 5.529268351879416e-05, "loss": 0.0095, "step": 17688 }, { "epoch": 3.6, "learning_rate": 5.527765150243507e-05, "loss": 0.0092, "step": 17689 }, { "epoch": 3.6, "learning_rate": 5.5262621068118e-05, "loss": 0.0003, "step": 17690 }, { "epoch": 3.6, "learning_rate": 5.5247592216094e-05, "loss": 0.0012, "step": 17691 }, { "epoch": 3.6, "learning_rate": 5.523256494661406e-05, "loss": 0.0015, "step": 17692 }, { "epoch": 3.6, "learning_rate": 5.521753925992918e-05, "loss": 0.0104, "step": 17693 }, { "epoch": 3.6, "learning_rate": 5.52025151562903e-05, "loss": 0.0011, "step": 17694 }, { "epoch": 3.6, "learning_rate": 5.518749263594841e-05, "loss": 0.0018, "step": 17695 }, { "epoch": 3.6, "learning_rate": 5.5172471699154264e-05, "loss": 0.0049, "step": 17696 }, { "epoch": 3.6, "learning_rate": 5.5157452346158944e-05, "loss": 0.0092, "step": 17697 }, { "epoch": 3.6, "learning_rate": 5.51424345772131e-05, "loss": 0.0056, "step": 17698 }, { "epoch": 3.6, "learning_rate": 5.512741839256776e-05, "loss": 0.0207, "step": 17699 }, { "epoch": 3.6, "learning_rate": 5.5112403792473555e-05, "loss": 0.0123, "step": 17700 }, { "epoch": 3.6, "learning_rate": 5.509739077718127e-05, "loss": 0.0006, "step": 17701 }, { "epoch": 3.6, "learning_rate": 5.508237934694181e-05, "loss": 0.0024, "step": 17702 }, { "epoch": 3.6, "learning_rate": 5.506736950200568e-05, "loss": 0.001, "step": 17703 }, { "epoch": 3.6, "learning_rate": 5.5052361242623773e-05, "loss": 0.004, "step": 17704 }, { "epoch": 3.61, "learning_rate": 5.503735456904662e-05, "loss": 0.0023, "step": 17705 }, { "epoch": 3.61, "learning_rate": 5.502234948152488e-05, "loss": 0.0101, "step": 17706 }, { "epoch": 3.61, "learning_rate": 5.50073459803092e-05, "loss": 0.0019, "step": 17707 }, { "epoch": 3.61, "learning_rate": 5.499234406565015e-05, "loss": 0.0034, "step": 17708 }, { "epoch": 3.61, "learning_rate": 5.497734373779831e-05, "loss": 0.0047, "step": 17709 }, { "epoch": 3.61, "learning_rate": 5.4962344997004184e-05, "loss": 0.0004, "step": 17710 }, { "epoch": 3.61, "learning_rate": 5.494734784351829e-05, "loss": 0.0013, "step": 17711 }, { "epoch": 3.61, "learning_rate": 5.493235227759112e-05, "loss": 0.0069, "step": 17712 }, { "epoch": 3.61, "learning_rate": 5.4917358299473115e-05, "loss": 0.0021, "step": 17713 }, { "epoch": 3.61, "learning_rate": 5.490236590941471e-05, "loss": 0.0031, "step": 17714 }, { "epoch": 3.61, "learning_rate": 5.4887375107666355e-05, "loss": 0.0005, "step": 17715 }, { "epoch": 3.61, "learning_rate": 5.4872385894478263e-05, "loss": 0.0037, "step": 17716 }, { "epoch": 3.61, "learning_rate": 5.4857398270100994e-05, "loss": 0.006, "step": 17717 }, { "epoch": 3.61, "learning_rate": 5.484241223478472e-05, "loss": 0.0013, "step": 17718 }, { "epoch": 3.61, "learning_rate": 5.48274277887798e-05, "loss": 0.0107, "step": 17719 }, { "epoch": 3.61, "learning_rate": 5.4812444932336474e-05, "loss": 0.0141, "step": 17720 }, { "epoch": 3.61, "learning_rate": 5.4797463665704996e-05, "loss": 0.0003, "step": 17721 }, { "epoch": 3.61, "learning_rate": 5.478248398913559e-05, "loss": 0.0089, "step": 17722 }, { "epoch": 3.61, "learning_rate": 5.4767505902878427e-05, "loss": 0.0056, "step": 17723 }, { "epoch": 3.61, "learning_rate": 5.475252940718368e-05, "loss": 0.0155, "step": 17724 }, { "epoch": 3.61, "learning_rate": 5.4737554502301485e-05, "loss": 0.0045, "step": 17725 }, { "epoch": 3.61, "learning_rate": 5.472258118848195e-05, "loss": 0.0033, "step": 17726 }, { "epoch": 3.61, "learning_rate": 5.470760946597517e-05, "loss": 0.0076, "step": 17727 }, { "epoch": 3.61, "learning_rate": 5.469263933503123e-05, "loss": 0.0031, "step": 17728 }, { "epoch": 3.61, "learning_rate": 5.4677670795900026e-05, "loss": 0.0105, "step": 17729 }, { "epoch": 3.61, "learning_rate": 5.4662703848831736e-05, "loss": 0.0029, "step": 17730 }, { "epoch": 3.61, "learning_rate": 5.4647738494076174e-05, "loss": 0.0015, "step": 17731 }, { "epoch": 3.61, "learning_rate": 5.46327747318834e-05, "loss": 0.0064, "step": 17732 }, { "epoch": 3.61, "learning_rate": 5.461781256250337e-05, "loss": 0.0085, "step": 17733 }, { "epoch": 3.61, "learning_rate": 5.460285198618581e-05, "loss": 0.0056, "step": 17734 }, { "epoch": 3.61, "learning_rate": 5.458789300318081e-05, "loss": 0.0118, "step": 17735 }, { "epoch": 3.61, "learning_rate": 5.457293561373798e-05, "loss": 0.0008, "step": 17736 }, { "epoch": 3.61, "learning_rate": 5.455797981810736e-05, "loss": 0.0041, "step": 17737 }, { "epoch": 3.61, "learning_rate": 5.45430256165386e-05, "loss": 0.0074, "step": 17738 }, { "epoch": 3.61, "learning_rate": 5.452807300928149e-05, "loss": 0.0059, "step": 17739 }, { "epoch": 3.61, "learning_rate": 5.451312199658579e-05, "loss": 0.0051, "step": 17740 }, { "epoch": 3.61, "learning_rate": 5.4498172578701186e-05, "loss": 0.0051, "step": 17741 }, { "epoch": 3.61, "learning_rate": 5.448322475587737e-05, "loss": 0.0012, "step": 17742 }, { "epoch": 3.61, "learning_rate": 5.4468278528364e-05, "loss": 0.0084, "step": 17743 }, { "epoch": 3.61, "learning_rate": 5.445333389641072e-05, "loss": 0.0046, "step": 17744 }, { "epoch": 3.61, "learning_rate": 5.44383908602671e-05, "loss": 0.0058, "step": 17745 }, { "epoch": 3.61, "learning_rate": 5.44234494201828e-05, "loss": 0.0009, "step": 17746 }, { "epoch": 3.61, "learning_rate": 5.4408509576407205e-05, "loss": 0.0025, "step": 17747 }, { "epoch": 3.61, "learning_rate": 5.439357132919006e-05, "loss": 0.0032, "step": 17748 }, { "epoch": 3.61, "learning_rate": 5.437863467878062e-05, "loss": 0.0025, "step": 17749 }, { "epoch": 3.61, "learning_rate": 5.4363699625428596e-05, "loss": 0.0121, "step": 17750 }, { "epoch": 3.61, "learning_rate": 5.434876616938324e-05, "loss": 0.0042, "step": 17751 }, { "epoch": 3.61, "learning_rate": 5.433383431089408e-05, "loss": 0.0043, "step": 17752 }, { "epoch": 3.61, "learning_rate": 5.4318904050210436e-05, "loss": 0.0083, "step": 17753 }, { "epoch": 3.62, "learning_rate": 5.430397538758168e-05, "loss": 0.0047, "step": 17754 }, { "epoch": 3.62, "learning_rate": 5.428904832325727e-05, "loss": 0.001, "step": 17755 }, { "epoch": 3.62, "learning_rate": 5.427412285748636e-05, "loss": 0.0006, "step": 17756 }, { "epoch": 3.62, "learning_rate": 5.425919899051829e-05, "loss": 0.0071, "step": 17757 }, { "epoch": 3.62, "learning_rate": 5.424427672260232e-05, "loss": 0.003, "step": 17758 }, { "epoch": 3.62, "learning_rate": 5.422935605398769e-05, "loss": 0.0066, "step": 17759 }, { "epoch": 3.62, "learning_rate": 5.4214436984923595e-05, "loss": 0.0052, "step": 17760 }, { "epoch": 3.62, "learning_rate": 5.419951951565926e-05, "loss": 0.0021, "step": 17761 }, { "epoch": 3.62, "learning_rate": 5.418460364644368e-05, "loss": 0.0016, "step": 17762 }, { "epoch": 3.62, "learning_rate": 5.416968937752613e-05, "loss": 0.0193, "step": 17763 }, { "epoch": 3.62, "learning_rate": 5.415477670915568e-05, "loss": 0.0142, "step": 17764 }, { "epoch": 3.62, "learning_rate": 5.4139865641581356e-05, "loss": 0.0022, "step": 17765 }, { "epoch": 3.62, "learning_rate": 5.4124956175052295e-05, "loss": 0.0011, "step": 17766 }, { "epoch": 3.62, "learning_rate": 5.411004830981733e-05, "loss": 0.0095, "step": 17767 }, { "epoch": 3.62, "learning_rate": 5.409514204612566e-05, "loss": 0.0074, "step": 17768 }, { "epoch": 3.62, "learning_rate": 5.408023738422611e-05, "loss": 0.0095, "step": 17769 }, { "epoch": 3.62, "learning_rate": 5.406533432436764e-05, "loss": 0.0023, "step": 17770 }, { "epoch": 3.62, "learning_rate": 5.4050432866799194e-05, "loss": 0.0046, "step": 17771 }, { "epoch": 3.62, "learning_rate": 5.403553301176964e-05, "loss": 0.0026, "step": 17772 }, { "epoch": 3.62, "learning_rate": 5.402063475952781e-05, "loss": 0.0065, "step": 17773 }, { "epoch": 3.62, "learning_rate": 5.400573811032257e-05, "loss": 0.0041, "step": 17774 }, { "epoch": 3.62, "learning_rate": 5.3990843064402716e-05, "loss": 0.005, "step": 17775 }, { "epoch": 3.62, "learning_rate": 5.3975949622017e-05, "loss": 0.0022, "step": 17776 }, { "epoch": 3.62, "learning_rate": 5.3961057783414176e-05, "loss": 0.0002, "step": 17777 }, { "epoch": 3.62, "learning_rate": 5.394616754884297e-05, "loss": 0.0117, "step": 17778 }, { "epoch": 3.62, "learning_rate": 5.393127891855214e-05, "loss": 0.0009, "step": 17779 }, { "epoch": 3.62, "learning_rate": 5.391639189279021e-05, "loss": 0.0027, "step": 17780 }, { "epoch": 3.62, "learning_rate": 5.3901506471805987e-05, "loss": 0.0031, "step": 17781 }, { "epoch": 3.62, "learning_rate": 5.388662265584791e-05, "loss": 0.0014, "step": 17782 }, { "epoch": 3.62, "learning_rate": 5.387174044516476e-05, "loss": 0.0014, "step": 17783 }, { "epoch": 3.62, "learning_rate": 5.385685984000494e-05, "loss": 0.0019, "step": 17784 }, { "epoch": 3.62, "learning_rate": 5.384198084061701e-05, "loss": 0.0004, "step": 17785 }, { "epoch": 3.62, "learning_rate": 5.382710344724961e-05, "loss": 0.0034, "step": 17786 }, { "epoch": 3.62, "learning_rate": 5.381222766015101e-05, "loss": 0.0034, "step": 17787 }, { "epoch": 3.62, "learning_rate": 5.3797353479569874e-05, "loss": 0.0016, "step": 17788 }, { "epoch": 3.62, "learning_rate": 5.3782480905754496e-05, "loss": 0.0007, "step": 17789 }, { "epoch": 3.62, "learning_rate": 5.3767609938953296e-05, "loss": 0.0033, "step": 17790 }, { "epoch": 3.62, "learning_rate": 5.375274057941468e-05, "loss": 0.0035, "step": 17791 }, { "epoch": 3.62, "learning_rate": 5.373787282738695e-05, "loss": 0.0009, "step": 17792 }, { "epoch": 3.62, "learning_rate": 5.372300668311847e-05, "loss": 0.005, "step": 17793 }, { "epoch": 3.62, "learning_rate": 5.370814214685751e-05, "loss": 0.0013, "step": 17794 }, { "epoch": 3.62, "learning_rate": 5.369327921885233e-05, "loss": 0.0043, "step": 17795 }, { "epoch": 3.62, "learning_rate": 5.367841789935119e-05, "loss": 0.0038, "step": 17796 }, { "epoch": 3.62, "learning_rate": 5.366355818860234e-05, "loss": 0.0018, "step": 17797 }, { "epoch": 3.62, "learning_rate": 5.3648700086853823e-05, "loss": 0.0125, "step": 17798 }, { "epoch": 3.62, "learning_rate": 5.363384359435398e-05, "loss": 0.006, "step": 17799 }, { "epoch": 3.62, "learning_rate": 5.361898871135075e-05, "loss": 0.0123, "step": 17800 }, { "epoch": 3.62, "learning_rate": 5.3604135438092453e-05, "loss": 0.0053, "step": 17801 }, { "epoch": 3.62, "learning_rate": 5.3589283774827e-05, "loss": 0.0046, "step": 17802 }, { "epoch": 3.63, "learning_rate": 5.357443372180249e-05, "loss": 0.0078, "step": 17803 }, { "epoch": 3.63, "learning_rate": 5.355958527926695e-05, "loss": 0.0058, "step": 17804 }, { "epoch": 3.63, "learning_rate": 5.35447384474684e-05, "loss": 0.0057, "step": 17805 }, { "epoch": 3.63, "learning_rate": 5.3529893226654766e-05, "loss": 0.005, "step": 17806 }, { "epoch": 3.63, "learning_rate": 5.351504961707403e-05, "loss": 0.0031, "step": 17807 }, { "epoch": 3.63, "learning_rate": 5.3500207618974075e-05, "loss": 0.0069, "step": 17808 }, { "epoch": 3.63, "learning_rate": 5.348536723260283e-05, "loss": 0.0019, "step": 17809 }, { "epoch": 3.63, "learning_rate": 5.347052845820813e-05, "loss": 0.0002, "step": 17810 }, { "epoch": 3.63, "learning_rate": 5.345569129603782e-05, "loss": 0.0019, "step": 17811 }, { "epoch": 3.63, "learning_rate": 5.344085574633976e-05, "loss": 0.0133, "step": 17812 }, { "epoch": 3.63, "learning_rate": 5.342602180936156e-05, "loss": 0.0098, "step": 17813 }, { "epoch": 3.63, "learning_rate": 5.3411189485351205e-05, "loss": 0.0047, "step": 17814 }, { "epoch": 3.63, "learning_rate": 5.3396358774556215e-05, "loss": 0.0139, "step": 17815 }, { "epoch": 3.63, "learning_rate": 5.338152967722441e-05, "loss": 0.0014, "step": 17816 }, { "epoch": 3.63, "learning_rate": 5.336670219360352e-05, "loss": 0.0045, "step": 17817 }, { "epoch": 3.63, "learning_rate": 5.3351876323941e-05, "loss": 0.0006, "step": 17818 }, { "epoch": 3.63, "learning_rate": 5.333705206848467e-05, "loss": 0.0011, "step": 17819 }, { "epoch": 3.63, "learning_rate": 5.332222942748199e-05, "loss": 0.0064, "step": 17820 }, { "epoch": 3.63, "learning_rate": 5.330740840118059e-05, "loss": 0.0046, "step": 17821 }, { "epoch": 3.63, "learning_rate": 5.3292588989827976e-05, "loss": 0.0015, "step": 17822 }, { "epoch": 3.63, "learning_rate": 5.327777119367168e-05, "loss": 0.0021, "step": 17823 }, { "epoch": 3.63, "learning_rate": 5.326295501295917e-05, "loss": 0.0062, "step": 17824 }, { "epoch": 3.63, "learning_rate": 5.324814044793792e-05, "loss": 0.0014, "step": 17825 }, { "epoch": 3.63, "learning_rate": 5.323332749885535e-05, "loss": 0.0163, "step": 17826 }, { "epoch": 3.63, "learning_rate": 5.321851616595889e-05, "loss": 0.0002, "step": 17827 }, { "epoch": 3.63, "learning_rate": 5.3203706449495885e-05, "loss": 0.0041, "step": 17828 }, { "epoch": 3.63, "learning_rate": 5.318889834971369e-05, "loss": 0.0003, "step": 17829 }, { "epoch": 3.63, "learning_rate": 5.3174091866859697e-05, "loss": 0.0066, "step": 17830 }, { "epoch": 3.63, "learning_rate": 5.315928700118105e-05, "loss": 0.0132, "step": 17831 }, { "epoch": 3.63, "learning_rate": 5.31444837529252e-05, "loss": 0.0135, "step": 17832 }, { "epoch": 3.63, "learning_rate": 5.3129682122339196e-05, "loss": 0.0035, "step": 17833 }, { "epoch": 3.63, "learning_rate": 5.311488210967046e-05, "loss": 0.0047, "step": 17834 }, { "epoch": 3.63, "learning_rate": 5.310008371516603e-05, "loss": 0.0011, "step": 17835 }, { "epoch": 3.63, "learning_rate": 5.30852869390731e-05, "loss": 0.0022, "step": 17836 }, { "epoch": 3.63, "learning_rate": 5.307049178163883e-05, "loss": 0.0097, "step": 17837 }, { "epoch": 3.63, "learning_rate": 5.305569824311026e-05, "loss": 0.0034, "step": 17838 }, { "epoch": 3.63, "learning_rate": 5.304090632373463e-05, "loss": 0.0014, "step": 17839 }, { "epoch": 3.63, "learning_rate": 5.302611602375883e-05, "loss": 0.0011, "step": 17840 }, { "epoch": 3.63, "learning_rate": 5.3011327343429955e-05, "loss": 0.0041, "step": 17841 }, { "epoch": 3.63, "learning_rate": 5.299654028299497e-05, "loss": 0.0037, "step": 17842 }, { "epoch": 3.63, "learning_rate": 5.298175484270094e-05, "loss": 0.0033, "step": 17843 }, { "epoch": 3.63, "learning_rate": 5.2966971022794636e-05, "loss": 0.0021, "step": 17844 }, { "epoch": 3.63, "learning_rate": 5.2952188823523126e-05, "loss": 0.0062, "step": 17845 }, { "epoch": 3.63, "learning_rate": 5.2937408245133254e-05, "loss": 0.0053, "step": 17846 }, { "epoch": 3.63, "learning_rate": 5.2922629287871885e-05, "loss": 0.0081, "step": 17847 }, { "epoch": 3.63, "learning_rate": 5.29078519519859e-05, "loss": 0.0017, "step": 17848 }, { "epoch": 3.63, "learning_rate": 5.2893076237721956e-05, "loss": 0.0052, "step": 17849 }, { "epoch": 3.63, "learning_rate": 5.2878302145327046e-05, "loss": 0.0067, "step": 17850 }, { "epoch": 3.63, "learning_rate": 5.286352967504773e-05, "loss": 0.0053, "step": 17851 }, { "epoch": 3.64, "learning_rate": 5.284875882713092e-05, "loss": 0.0053, "step": 17852 }, { "epoch": 3.64, "learning_rate": 5.283398960182316e-05, "loss": 0.0032, "step": 17853 }, { "epoch": 3.64, "learning_rate": 5.28192219993712e-05, "loss": 0.0029, "step": 17854 }, { "epoch": 3.64, "learning_rate": 5.280445602002168e-05, "loss": 0.0026, "step": 17855 }, { "epoch": 3.64, "learning_rate": 5.278969166402121e-05, "loss": 0.0013, "step": 17856 }, { "epoch": 3.64, "learning_rate": 5.277492893161638e-05, "loss": 0.0013, "step": 17857 }, { "epoch": 3.64, "learning_rate": 5.276016782305377e-05, "loss": 0.0013, "step": 17858 }, { "epoch": 3.64, "learning_rate": 5.274540833857991e-05, "loss": 0.0085, "step": 17859 }, { "epoch": 3.64, "learning_rate": 5.273065047844131e-05, "loss": 0.005, "step": 17860 }, { "epoch": 3.64, "learning_rate": 5.271589424288446e-05, "loss": 0.004, "step": 17861 }, { "epoch": 3.64, "learning_rate": 5.2701139632155796e-05, "loss": 0.0036, "step": 17862 }, { "epoch": 3.64, "learning_rate": 5.2686386646501827e-05, "loss": 0.0074, "step": 17863 }, { "epoch": 3.64, "learning_rate": 5.26716352861688e-05, "loss": 0.0005, "step": 17864 }, { "epoch": 3.64, "learning_rate": 5.265688555140327e-05, "loss": 0.0072, "step": 17865 }, { "epoch": 3.64, "learning_rate": 5.264213744245146e-05, "loss": 0.0026, "step": 17866 }, { "epoch": 3.64, "learning_rate": 5.262739095955973e-05, "loss": 0.0011, "step": 17867 }, { "epoch": 3.64, "learning_rate": 5.261264610297438e-05, "loss": 0.0094, "step": 17868 }, { "epoch": 3.64, "learning_rate": 5.2597902872941604e-05, "loss": 0.003, "step": 17869 }, { "epoch": 3.64, "learning_rate": 5.258316126970782e-05, "loss": 0.0007, "step": 17870 }, { "epoch": 3.64, "learning_rate": 5.256842129351909e-05, "loss": 0.0026, "step": 17871 }, { "epoch": 3.64, "learning_rate": 5.255368294462163e-05, "loss": 0.0011, "step": 17872 }, { "epoch": 3.64, "learning_rate": 5.25389462232616e-05, "loss": 0.0048, "step": 17873 }, { "epoch": 3.64, "learning_rate": 5.252421112968515e-05, "loss": 0.0057, "step": 17874 }, { "epoch": 3.64, "learning_rate": 5.250947766413836e-05, "loss": 0.0069, "step": 17875 }, { "epoch": 3.64, "learning_rate": 5.2494745826867336e-05, "loss": 0.01, "step": 17876 }, { "epoch": 3.64, "learning_rate": 5.248001561811809e-05, "loss": 0.0008, "step": 17877 }, { "epoch": 3.64, "learning_rate": 5.246528703813669e-05, "loss": 0.0057, "step": 17878 }, { "epoch": 3.64, "learning_rate": 5.245056008716909e-05, "loss": 0.0076, "step": 17879 }, { "epoch": 3.64, "learning_rate": 5.2435834765461286e-05, "loss": 0.0039, "step": 17880 }, { "epoch": 3.64, "learning_rate": 5.2421111073259245e-05, "loss": 0.0018, "step": 17881 }, { "epoch": 3.64, "learning_rate": 5.240638901080874e-05, "loss": 0.0017, "step": 17882 }, { "epoch": 3.64, "learning_rate": 5.239166857835587e-05, "loss": 0.0009, "step": 17883 }, { "epoch": 3.64, "learning_rate": 5.2376949776146275e-05, "loss": 0.0136, "step": 17884 }, { "epoch": 3.64, "learning_rate": 5.236223260442601e-05, "loss": 0.0054, "step": 17885 }, { "epoch": 3.64, "learning_rate": 5.23475170634407e-05, "loss": 0.0114, "step": 17886 }, { "epoch": 3.64, "learning_rate": 5.23328031534362e-05, "loss": 0.0199, "step": 17887 }, { "epoch": 3.64, "learning_rate": 5.231809087465823e-05, "loss": 0.001, "step": 17888 }, { "epoch": 3.64, "learning_rate": 5.230338022735254e-05, "loss": 0.0048, "step": 17889 }, { "epoch": 3.64, "learning_rate": 5.2288671211764824e-05, "loss": 0.0042, "step": 17890 }, { "epoch": 3.64, "learning_rate": 5.227396382814072e-05, "loss": 0.0028, "step": 17891 }, { "epoch": 3.64, "learning_rate": 5.22592580767259e-05, "loss": 0.0019, "step": 17892 }, { "epoch": 3.64, "learning_rate": 5.2244553957765974e-05, "loss": 0.0052, "step": 17893 }, { "epoch": 3.64, "learning_rate": 5.222985147150658e-05, "loss": 0.0019, "step": 17894 }, { "epoch": 3.64, "learning_rate": 5.221515061819311e-05, "loss": 0.0029, "step": 17895 }, { "epoch": 3.64, "learning_rate": 5.2200451398071315e-05, "loss": 0.0093, "step": 17896 }, { "epoch": 3.64, "learning_rate": 5.218575381138649e-05, "loss": 0.0018, "step": 17897 }, { "epoch": 3.64, "learning_rate": 5.2171057858384254e-05, "loss": 0.0005, "step": 17898 }, { "epoch": 3.64, "learning_rate": 5.215636353931008e-05, "loss": 0.0069, "step": 17899 }, { "epoch": 3.64, "learning_rate": 5.214167085440921e-05, "loss": 0.0037, "step": 17900 }, { "epoch": 3.64, "learning_rate": 5.2126979803927264e-05, "loss": 0.0002, "step": 17901 }, { "epoch": 3.65, "learning_rate": 5.2112290388109404e-05, "loss": 0.005, "step": 17902 }, { "epoch": 3.65, "learning_rate": 5.209760260720119e-05, "loss": 0.0016, "step": 17903 }, { "epoch": 3.65, "learning_rate": 5.208291646144775e-05, "loss": 0.0041, "step": 17904 }, { "epoch": 3.65, "learning_rate": 5.206823195109442e-05, "loss": 0.0013, "step": 17905 }, { "epoch": 3.65, "learning_rate": 5.20535490763865e-05, "loss": 0.0019, "step": 17906 }, { "epoch": 3.65, "learning_rate": 5.203886783756919e-05, "loss": 0.0021, "step": 17907 }, { "epoch": 3.65, "learning_rate": 5.20241882348877e-05, "loss": 0.0041, "step": 17908 }, { "epoch": 3.65, "learning_rate": 5.200951026858722e-05, "loss": 0.0051, "step": 17909 }, { "epoch": 3.65, "learning_rate": 5.1994833938912884e-05, "loss": 0.0049, "step": 17910 }, { "epoch": 3.65, "learning_rate": 5.1980159246109816e-05, "loss": 0.0028, "step": 17911 }, { "epoch": 3.65, "learning_rate": 5.196548619042311e-05, "loss": 0.005, "step": 17912 }, { "epoch": 3.65, "learning_rate": 5.195081477209783e-05, "loss": 0.0065, "step": 17913 }, { "epoch": 3.65, "learning_rate": 5.19361449913791e-05, "loss": 0.0079, "step": 17914 }, { "epoch": 3.65, "learning_rate": 5.192147684851174e-05, "loss": 0.0027, "step": 17915 }, { "epoch": 3.65, "learning_rate": 5.190681034374094e-05, "loss": 0.001, "step": 17916 }, { "epoch": 3.65, "learning_rate": 5.189214547731154e-05, "loss": 0.0035, "step": 17917 }, { "epoch": 3.65, "learning_rate": 5.18774822494685e-05, "loss": 0.0037, "step": 17918 }, { "epoch": 3.65, "learning_rate": 5.186282066045673e-05, "loss": 0.0019, "step": 17919 }, { "epoch": 3.65, "learning_rate": 5.184816071052109e-05, "loss": 0.0095, "step": 17920 }, { "epoch": 3.65, "learning_rate": 5.183350239990644e-05, "loss": 0.0001, "step": 17921 }, { "epoch": 3.65, "learning_rate": 5.1818845728857617e-05, "loss": 0.0026, "step": 17922 }, { "epoch": 3.65, "learning_rate": 5.180419069761939e-05, "loss": 0.0135, "step": 17923 }, { "epoch": 3.65, "learning_rate": 5.178953730643654e-05, "loss": 0.0001, "step": 17924 }, { "epoch": 3.65, "learning_rate": 5.17748855555538e-05, "loss": 0.0015, "step": 17925 }, { "epoch": 3.65, "learning_rate": 5.1760235445215894e-05, "loss": 0.0022, "step": 17926 }, { "epoch": 3.65, "learning_rate": 5.174558697566755e-05, "loss": 0.0034, "step": 17927 }, { "epoch": 3.65, "learning_rate": 5.173094014715326e-05, "loss": 0.0024, "step": 17928 }, { "epoch": 3.65, "learning_rate": 5.171629495991781e-05, "loss": 0.0043, "step": 17929 }, { "epoch": 3.65, "learning_rate": 5.1701651414205765e-05, "loss": 0.0075, "step": 17930 }, { "epoch": 3.65, "learning_rate": 5.1687009510261687e-05, "loss": 0.0023, "step": 17931 }, { "epoch": 3.65, "learning_rate": 5.167236924833019e-05, "loss": 0.0056, "step": 17932 }, { "epoch": 3.65, "learning_rate": 5.165773062865562e-05, "loss": 0.0017, "step": 17933 }, { "epoch": 3.65, "learning_rate": 5.1643093651482694e-05, "loss": 0.0041, "step": 17934 }, { "epoch": 3.65, "learning_rate": 5.162845831705567e-05, "loss": 0.0063, "step": 17935 }, { "epoch": 3.65, "learning_rate": 5.161382462561917e-05, "loss": 0.0003, "step": 17936 }, { "epoch": 3.65, "learning_rate": 5.1599192577417465e-05, "loss": 0.0148, "step": 17937 }, { "epoch": 3.65, "learning_rate": 5.1584562172694985e-05, "loss": 0.0005, "step": 17938 }, { "epoch": 3.65, "learning_rate": 5.156993341169611e-05, "loss": 0.0091, "step": 17939 }, { "epoch": 3.65, "learning_rate": 5.1555306294665124e-05, "loss": 0.0016, "step": 17940 }, { "epoch": 3.65, "learning_rate": 5.1540680821846366e-05, "loss": 0.0025, "step": 17941 }, { "epoch": 3.65, "learning_rate": 5.152605699348407e-05, "loss": 0.0026, "step": 17942 }, { "epoch": 3.65, "learning_rate": 5.1511434809822535e-05, "loss": 0.005, "step": 17943 }, { "epoch": 3.65, "learning_rate": 5.1496814271105935e-05, "loss": 0.0038, "step": 17944 }, { "epoch": 3.65, "learning_rate": 5.1482195377578515e-05, "loss": 0.0004, "step": 17945 }, { "epoch": 3.65, "learning_rate": 5.146757812948432e-05, "loss": 0.0009, "step": 17946 }, { "epoch": 3.65, "learning_rate": 5.1452962527067654e-05, "loss": 0.0024, "step": 17947 }, { "epoch": 3.65, "learning_rate": 5.143834857057242e-05, "loss": 0.0039, "step": 17948 }, { "epoch": 3.65, "learning_rate": 5.142373626024294e-05, "loss": 0.0078, "step": 17949 }, { "epoch": 3.65, "learning_rate": 5.1409125596323064e-05, "loss": 0.0004, "step": 17950 }, { "epoch": 3.66, "learning_rate": 5.139451657905686e-05, "loss": 0.004, "step": 17951 }, { "epoch": 3.66, "learning_rate": 5.1379909208688464e-05, "loss": 0.006, "step": 17952 }, { "epoch": 3.66, "learning_rate": 5.136530348546163e-05, "loss": 0.0033, "step": 17953 }, { "epoch": 3.66, "learning_rate": 5.135069940962052e-05, "loss": 0.0006, "step": 17954 }, { "epoch": 3.66, "learning_rate": 5.1336096981408884e-05, "loss": 0.0028, "step": 17955 }, { "epoch": 3.66, "learning_rate": 5.1321496201070675e-05, "loss": 0.0076, "step": 17956 }, { "epoch": 3.66, "learning_rate": 5.130689706884975e-05, "loss": 0.0038, "step": 17957 }, { "epoch": 3.66, "learning_rate": 5.1292299584989957e-05, "loss": 0.0058, "step": 17958 }, { "epoch": 3.66, "learning_rate": 5.127770374973506e-05, "loss": 0.0019, "step": 17959 }, { "epoch": 3.66, "learning_rate": 5.1263109563328876e-05, "loss": 0.0083, "step": 17960 }, { "epoch": 3.66, "learning_rate": 5.1248517026015135e-05, "loss": 0.005, "step": 17961 }, { "epoch": 3.66, "learning_rate": 5.123392613803756e-05, "loss": 0.0045, "step": 17962 }, { "epoch": 3.66, "learning_rate": 5.1219336899639864e-05, "loss": 0.0024, "step": 17963 }, { "epoch": 3.66, "learning_rate": 5.120474931106571e-05, "loss": 0.0054, "step": 17964 }, { "epoch": 3.66, "learning_rate": 5.119016337255877e-05, "loss": 0.0016, "step": 17965 }, { "epoch": 3.66, "learning_rate": 5.117557908436252e-05, "loss": 0.0001, "step": 17966 }, { "epoch": 3.66, "learning_rate": 5.116099644672074e-05, "loss": 0.0043, "step": 17967 }, { "epoch": 3.66, "learning_rate": 5.114641545987685e-05, "loss": 0.003, "step": 17968 }, { "epoch": 3.66, "learning_rate": 5.113183612407441e-05, "loss": 0.0029, "step": 17969 }, { "epoch": 3.66, "learning_rate": 5.1117258439556944e-05, "loss": 0.0033, "step": 17970 }, { "epoch": 3.66, "learning_rate": 5.110268240656791e-05, "loss": 0.0148, "step": 17971 }, { "epoch": 3.66, "learning_rate": 5.1088108025350766e-05, "loss": 0.001, "step": 17972 }, { "epoch": 3.66, "learning_rate": 5.107353529614893e-05, "loss": 0.0071, "step": 17973 }, { "epoch": 3.66, "learning_rate": 5.1058964219205786e-05, "loss": 0.015, "step": 17974 }, { "epoch": 3.66, "learning_rate": 5.104439479476471e-05, "loss": 0.0016, "step": 17975 }, { "epoch": 3.66, "learning_rate": 5.102982702306903e-05, "loss": 0.0029, "step": 17976 }, { "epoch": 3.66, "learning_rate": 5.101526090436205e-05, "loss": 0.0046, "step": 17977 }, { "epoch": 3.66, "learning_rate": 5.1000696438887117e-05, "loss": 0.0052, "step": 17978 }, { "epoch": 3.66, "learning_rate": 5.098613362688732e-05, "loss": 0.0035, "step": 17979 }, { "epoch": 3.66, "learning_rate": 5.0971572468606106e-05, "loss": 0.0033, "step": 17980 }, { "epoch": 3.66, "learning_rate": 5.095701296428645e-05, "loss": 0.0102, "step": 17981 }, { "epoch": 3.66, "learning_rate": 5.094245511417169e-05, "loss": 0.0026, "step": 17982 }, { "epoch": 3.66, "learning_rate": 5.0927898918504976e-05, "loss": 0.0031, "step": 17983 }, { "epoch": 3.66, "learning_rate": 5.0913344377529245e-05, "loss": 0.0044, "step": 17984 }, { "epoch": 3.66, "learning_rate": 5.089879149148781e-05, "loss": 0.0072, "step": 17985 }, { "epoch": 3.66, "learning_rate": 5.088424026062351e-05, "loss": 0.0004, "step": 17986 }, { "epoch": 3.66, "learning_rate": 5.086969068517961e-05, "loss": 0.0045, "step": 17987 }, { "epoch": 3.66, "learning_rate": 5.085514276539894e-05, "loss": 0.0024, "step": 17988 }, { "epoch": 3.66, "learning_rate": 5.0840596501524533e-05, "loss": 0.0004, "step": 17989 }, { "epoch": 3.66, "learning_rate": 5.082605189379934e-05, "loss": 0.008, "step": 17990 }, { "epoch": 3.66, "learning_rate": 5.081150894246629e-05, "loss": 0.0043, "step": 17991 }, { "epoch": 3.66, "learning_rate": 5.079696764776827e-05, "loss": 0.0019, "step": 17992 }, { "epoch": 3.66, "learning_rate": 5.0782428009948145e-05, "loss": 0.0016, "step": 17993 }, { "epoch": 3.66, "learning_rate": 5.0767890029248764e-05, "loss": 0.0011, "step": 17994 }, { "epoch": 3.66, "learning_rate": 5.075335370591293e-05, "loss": 0.0086, "step": 17995 }, { "epoch": 3.66, "learning_rate": 5.073881904018348e-05, "loss": 0.0036, "step": 17996 }, { "epoch": 3.66, "learning_rate": 5.072428603230304e-05, "loss": 0.0006, "step": 17997 }, { "epoch": 3.66, "learning_rate": 5.07097546825145e-05, "loss": 0.0005, "step": 17998 }, { "epoch": 3.66, "learning_rate": 5.069522499106037e-05, "loss": 0.0062, "step": 17999 }, { "epoch": 3.67, "learning_rate": 5.068069695818356e-05, "loss": 0.0033, "step": 18000 }, { "epoch": 3.67, "learning_rate": 5.066617058412653e-05, "loss": 0.0014, "step": 18001 }, { "epoch": 3.67, "learning_rate": 5.0651645869131947e-05, "loss": 0.0018, "step": 18002 }, { "epoch": 3.67, "learning_rate": 5.063712281344241e-05, "loss": 0.0031, "step": 18003 }, { "epoch": 3.67, "learning_rate": 5.062260141730044e-05, "loss": 0.0011, "step": 18004 }, { "epoch": 3.67, "learning_rate": 5.060808168094873e-05, "loss": 0.0053, "step": 18005 }, { "epoch": 3.67, "learning_rate": 5.059356360462959e-05, "loss": 0.0017, "step": 18006 }, { "epoch": 3.67, "learning_rate": 5.0579047188585604e-05, "loss": 0.0089, "step": 18007 }, { "epoch": 3.67, "learning_rate": 5.056453243305919e-05, "loss": 0.0081, "step": 18008 }, { "epoch": 3.67, "learning_rate": 5.055001933829279e-05, "loss": 0.0033, "step": 18009 }, { "epoch": 3.67, "learning_rate": 5.0535507904528795e-05, "loss": 0.0088, "step": 18010 }, { "epoch": 3.67, "learning_rate": 5.052099813200956e-05, "loss": 0.002, "step": 18011 }, { "epoch": 3.67, "learning_rate": 5.050649002097743e-05, "loss": 0.0023, "step": 18012 }, { "epoch": 3.67, "learning_rate": 5.0491983571674744e-05, "loss": 0.0002, "step": 18013 }, { "epoch": 3.67, "learning_rate": 5.047747878434375e-05, "loss": 0.0009, "step": 18014 }, { "epoch": 3.67, "learning_rate": 5.046297565922672e-05, "loss": 0.002, "step": 18015 }, { "epoch": 3.67, "learning_rate": 5.0448474196565954e-05, "loss": 0.0007, "step": 18016 }, { "epoch": 3.67, "learning_rate": 5.043397439660348e-05, "loss": 0.005, "step": 18017 }, { "epoch": 3.67, "learning_rate": 5.041947625958167e-05, "loss": 0.0024, "step": 18018 }, { "epoch": 3.67, "learning_rate": 5.0404979785742536e-05, "loss": 0.002, "step": 18019 }, { "epoch": 3.67, "learning_rate": 5.0390484975328224e-05, "loss": 0.002, "step": 18020 }, { "epoch": 3.67, "learning_rate": 5.037599182858086e-05, "loss": 0.0171, "step": 18021 }, { "epoch": 3.67, "learning_rate": 5.036150034574247e-05, "loss": 0.0029, "step": 18022 }, { "epoch": 3.67, "learning_rate": 5.034701052705512e-05, "loss": 0.006, "step": 18023 }, { "epoch": 3.67, "learning_rate": 5.033252237276079e-05, "loss": 0.0019, "step": 18024 }, { "epoch": 3.67, "learning_rate": 5.031803588310148e-05, "loss": 0.0116, "step": 18025 }, { "epoch": 3.67, "learning_rate": 5.0303551058319116e-05, "loss": 0.0023, "step": 18026 }, { "epoch": 3.67, "learning_rate": 5.028906789865566e-05, "loss": 0.0043, "step": 18027 }, { "epoch": 3.67, "learning_rate": 5.027458640435297e-05, "loss": 0.0055, "step": 18028 }, { "epoch": 3.67, "learning_rate": 5.026010657565301e-05, "loss": 0.0033, "step": 18029 }, { "epoch": 3.67, "learning_rate": 5.024562841279742e-05, "loss": 0.0073, "step": 18030 }, { "epoch": 3.67, "learning_rate": 5.023115191602824e-05, "loss": 0.0058, "step": 18031 }, { "epoch": 3.67, "learning_rate": 5.021667708558705e-05, "loss": 0.0032, "step": 18032 }, { "epoch": 3.67, "learning_rate": 5.020220392171581e-05, "loss": 0.0001, "step": 18033 }, { "epoch": 3.67, "learning_rate": 5.018773242465609e-05, "loss": 0.0038, "step": 18034 }, { "epoch": 3.67, "learning_rate": 5.017326259464961e-05, "loss": 0.0029, "step": 18035 }, { "epoch": 3.67, "learning_rate": 5.015879443193817e-05, "loss": 0.0056, "step": 18036 }, { "epoch": 3.67, "learning_rate": 5.014432793676322e-05, "loss": 0.0067, "step": 18037 }, { "epoch": 3.67, "learning_rate": 5.012986310936659e-05, "loss": 0.0007, "step": 18038 }, { "epoch": 3.67, "learning_rate": 5.011539994998973e-05, "loss": 0.0049, "step": 18039 }, { "epoch": 3.67, "learning_rate": 5.0100938458874215e-05, "loss": 0.0033, "step": 18040 }, { "epoch": 3.67, "learning_rate": 5.008647863626162e-05, "loss": 0.0033, "step": 18041 }, { "epoch": 3.67, "learning_rate": 5.007202048239342e-05, "loss": 0.0032, "step": 18042 }, { "epoch": 3.67, "learning_rate": 5.00575639975111e-05, "loss": 0.0057, "step": 18043 }, { "epoch": 3.67, "learning_rate": 5.0043109181856124e-05, "loss": 0.011, "step": 18044 }, { "epoch": 3.67, "learning_rate": 5.00286560356699e-05, "loss": 0.0017, "step": 18045 }, { "epoch": 3.67, "learning_rate": 5.001420455919384e-05, "loss": 0.0056, "step": 18046 }, { "epoch": 3.67, "learning_rate": 4.999975475266936e-05, "loss": 0.003, "step": 18047 }, { "epoch": 3.67, "learning_rate": 4.998530661633762e-05, "loss": 0.0048, "step": 18048 }, { "epoch": 3.68, "learning_rate": 4.997086015044016e-05, "loss": 0.0062, "step": 18049 }, { "epoch": 3.68, "learning_rate": 4.995641535521805e-05, "loss": 0.0028, "step": 18050 }, { "epoch": 3.68, "learning_rate": 4.994197223091274e-05, "loss": 0.0007, "step": 18051 }, { "epoch": 3.68, "learning_rate": 4.992753077776533e-05, "loss": 0.0129, "step": 18052 }, { "epoch": 3.68, "learning_rate": 4.991309099601705e-05, "loss": 0.0101, "step": 18053 }, { "epoch": 3.68, "learning_rate": 4.989865288590908e-05, "loss": 0.0085, "step": 18054 }, { "epoch": 3.68, "learning_rate": 4.988421644768257e-05, "loss": 0.007, "step": 18055 }, { "epoch": 3.68, "learning_rate": 4.986978168157861e-05, "loss": 0.006, "step": 18056 }, { "epoch": 3.68, "learning_rate": 4.985534858783831e-05, "loss": 0.0064, "step": 18057 }, { "epoch": 3.68, "learning_rate": 4.984091716670274e-05, "loss": 0.0012, "step": 18058 }, { "epoch": 3.68, "learning_rate": 4.982648741841289e-05, "loss": 0.0033, "step": 18059 }, { "epoch": 3.68, "learning_rate": 4.981205934320981e-05, "loss": 0.0025, "step": 18060 }, { "epoch": 3.68, "learning_rate": 4.9797632941334447e-05, "loss": 0.0008, "step": 18061 }, { "epoch": 3.68, "learning_rate": 4.9783208213027834e-05, "loss": 0.0219, "step": 18062 }, { "epoch": 3.68, "learning_rate": 4.976878515853069e-05, "loss": 0.0058, "step": 18063 }, { "epoch": 3.68, "learning_rate": 4.97543637780841e-05, "loss": 0.0008, "step": 18064 }, { "epoch": 3.68, "learning_rate": 4.973994407192889e-05, "loss": 0.0033, "step": 18065 }, { "epoch": 3.68, "learning_rate": 4.972552604030578e-05, "loss": 0.0057, "step": 18066 }, { "epoch": 3.68, "learning_rate": 4.971110968345577e-05, "loss": 0.0034, "step": 18067 }, { "epoch": 3.68, "learning_rate": 4.969669500161945e-05, "loss": 0.0069, "step": 18068 }, { "epoch": 3.68, "learning_rate": 4.9682281995037737e-05, "loss": 0.0015, "step": 18069 }, { "epoch": 3.68, "learning_rate": 4.966787066395124e-05, "loss": 0.0094, "step": 18070 }, { "epoch": 3.68, "learning_rate": 4.9653461008600686e-05, "loss": 0.0014, "step": 18071 }, { "epoch": 3.68, "learning_rate": 4.9639053029226745e-05, "loss": 0.0056, "step": 18072 }, { "epoch": 3.68, "learning_rate": 4.962464672607008e-05, "loss": 0.0017, "step": 18073 }, { "epoch": 3.68, "learning_rate": 4.961024209937128e-05, "loss": 0.0032, "step": 18074 }, { "epoch": 3.68, "learning_rate": 4.959583914937094e-05, "loss": 0.0005, "step": 18075 }, { "epoch": 3.68, "learning_rate": 4.95814378763096e-05, "loss": 0.015, "step": 18076 }, { "epoch": 3.68, "learning_rate": 4.9567038280427807e-05, "loss": 0.0018, "step": 18077 }, { "epoch": 3.68, "learning_rate": 4.955264036196605e-05, "loss": 0.0031, "step": 18078 }, { "epoch": 3.68, "learning_rate": 4.9538244121164824e-05, "loss": 0.002, "step": 18079 }, { "epoch": 3.68, "learning_rate": 4.952384955826459e-05, "loss": 0.0098, "step": 18080 }, { "epoch": 3.68, "learning_rate": 4.950945667350564e-05, "loss": 0.0015, "step": 18081 }, { "epoch": 3.68, "learning_rate": 4.9495065467128544e-05, "loss": 0.0022, "step": 18082 }, { "epoch": 3.68, "learning_rate": 4.9480675939373484e-05, "loss": 0.0103, "step": 18083 }, { "epoch": 3.68, "learning_rate": 4.946628809048097e-05, "loss": 0.0057, "step": 18084 }, { "epoch": 3.68, "learning_rate": 4.9451901920691165e-05, "loss": 0.0028, "step": 18085 }, { "epoch": 3.68, "learning_rate": 4.94375174302444e-05, "loss": 0.0055, "step": 18086 }, { "epoch": 3.68, "learning_rate": 4.9423134619380914e-05, "loss": 0.0123, "step": 18087 }, { "epoch": 3.68, "learning_rate": 4.940875348834087e-05, "loss": 0.0029, "step": 18088 }, { "epoch": 3.68, "learning_rate": 4.939437403736464e-05, "loss": 0.0052, "step": 18089 }, { "epoch": 3.68, "learning_rate": 4.937999626669222e-05, "loss": 0.0033, "step": 18090 }, { "epoch": 3.68, "learning_rate": 4.936562017656381e-05, "loss": 0.0051, "step": 18091 }, { "epoch": 3.68, "learning_rate": 4.935124576721947e-05, "loss": 0.0037, "step": 18092 }, { "epoch": 3.68, "learning_rate": 4.933687303889939e-05, "loss": 0.0058, "step": 18093 }, { "epoch": 3.68, "learning_rate": 4.932250199184343e-05, "loss": 0.0015, "step": 18094 }, { "epoch": 3.68, "learning_rate": 4.9308132626291795e-05, "loss": 0.001, "step": 18095 }, { "epoch": 3.68, "learning_rate": 4.9293764942484406e-05, "loss": 0.0001, "step": 18096 }, { "epoch": 3.68, "learning_rate": 4.927939894066123e-05, "loss": 0.0041, "step": 18097 }, { "epoch": 3.69, "learning_rate": 4.926503462106228e-05, "loss": 0.0086, "step": 18098 }, { "epoch": 3.69, "learning_rate": 4.925067198392729e-05, "loss": 0.01, "step": 18099 }, { "epoch": 3.69, "learning_rate": 4.923631102949637e-05, "loss": 0.0046, "step": 18100 }, { "epoch": 3.69, "learning_rate": 4.922195175800915e-05, "loss": 0.0021, "step": 18101 }, { "epoch": 3.69, "learning_rate": 4.920759416970567e-05, "loss": 0.0056, "step": 18102 }, { "epoch": 3.69, "learning_rate": 4.919323826482558e-05, "loss": 0.0032, "step": 18103 }, { "epoch": 3.69, "learning_rate": 4.917888404360868e-05, "loss": 0.0038, "step": 18104 }, { "epoch": 3.69, "learning_rate": 4.9164531506294745e-05, "loss": 0.0053, "step": 18105 }, { "epoch": 3.69, "learning_rate": 4.915018065312347e-05, "loss": 0.0026, "step": 18106 }, { "epoch": 3.69, "learning_rate": 4.913583148433455e-05, "loss": 0.0058, "step": 18107 }, { "epoch": 3.69, "learning_rate": 4.912148400016765e-05, "loss": 0.0013, "step": 18108 }, { "epoch": 3.69, "learning_rate": 4.9107138200862364e-05, "loss": 0.0044, "step": 18109 }, { "epoch": 3.69, "learning_rate": 4.9092794086658324e-05, "loss": 0.0076, "step": 18110 }, { "epoch": 3.69, "learning_rate": 4.907845165779512e-05, "loss": 0.0017, "step": 18111 }, { "epoch": 3.69, "learning_rate": 4.906411091451226e-05, "loss": 0.0093, "step": 18112 }, { "epoch": 3.69, "learning_rate": 4.904977185704932e-05, "loss": 0.0013, "step": 18113 }, { "epoch": 3.69, "learning_rate": 4.903543448564567e-05, "loss": 0.0016, "step": 18114 }, { "epoch": 3.69, "learning_rate": 4.9021098800540934e-05, "loss": 0.0161, "step": 18115 }, { "epoch": 3.69, "learning_rate": 4.90067648019744e-05, "loss": 0.0005, "step": 18116 }, { "epoch": 3.69, "learning_rate": 4.899243249018549e-05, "loss": 0.003, "step": 18117 }, { "epoch": 3.69, "learning_rate": 4.897810186541374e-05, "loss": 0.0008, "step": 18118 }, { "epoch": 3.69, "learning_rate": 4.896377292789825e-05, "loss": 0.0055, "step": 18119 }, { "epoch": 3.69, "learning_rate": 4.8949445677878596e-05, "loss": 0.0023, "step": 18120 }, { "epoch": 3.69, "learning_rate": 4.893512011559389e-05, "loss": 0.0081, "step": 18121 }, { "epoch": 3.69, "learning_rate": 4.8920796241283444e-05, "loss": 0.0086, "step": 18122 }, { "epoch": 3.69, "learning_rate": 4.89064740551865e-05, "loss": 0.0064, "step": 18123 }, { "epoch": 3.69, "learning_rate": 4.8892153557542284e-05, "loss": 0.0083, "step": 18124 }, { "epoch": 3.69, "learning_rate": 4.887783474858994e-05, "loss": 0.0067, "step": 18125 }, { "epoch": 3.69, "learning_rate": 4.886351762856864e-05, "loss": 0.008, "step": 18126 }, { "epoch": 3.69, "learning_rate": 4.8849202197717506e-05, "loss": 0.0039, "step": 18127 }, { "epoch": 3.69, "learning_rate": 4.883488845627564e-05, "loss": 0.0004, "step": 18128 }, { "epoch": 3.69, "learning_rate": 4.882057640448209e-05, "loss": 0.0223, "step": 18129 }, { "epoch": 3.69, "learning_rate": 4.880626604257591e-05, "loss": 0.0027, "step": 18130 }, { "epoch": 3.69, "learning_rate": 4.8791957370796146e-05, "loss": 0.0007, "step": 18131 }, { "epoch": 3.69, "learning_rate": 4.877765038938165e-05, "loss": 0.0041, "step": 18132 }, { "epoch": 3.69, "learning_rate": 4.8763345098571546e-05, "loss": 0.0086, "step": 18133 }, { "epoch": 3.69, "learning_rate": 4.8749041498604585e-05, "loss": 0.0059, "step": 18134 }, { "epoch": 3.69, "learning_rate": 4.873473958971987e-05, "loss": 0.0071, "step": 18135 }, { "epoch": 3.69, "learning_rate": 4.8720439372156084e-05, "loss": 0.0002, "step": 18136 }, { "epoch": 3.69, "learning_rate": 4.870614084615214e-05, "loss": 0.0007, "step": 18137 }, { "epoch": 3.69, "learning_rate": 4.8691844011946865e-05, "loss": 0.003, "step": 18138 }, { "epoch": 3.69, "learning_rate": 4.867754886977902e-05, "loss": 0.0005, "step": 18139 }, { "epoch": 3.69, "learning_rate": 4.866325541988736e-05, "loss": 0.0006, "step": 18140 }, { "epoch": 3.69, "learning_rate": 4.864896366251064e-05, "loss": 0.0044, "step": 18141 }, { "epoch": 3.69, "learning_rate": 4.863467359788753e-05, "loss": 0.0047, "step": 18142 }, { "epoch": 3.69, "learning_rate": 4.8620385226256715e-05, "loss": 0.0028, "step": 18143 }, { "epoch": 3.69, "learning_rate": 4.860609854785687e-05, "loss": 0.005, "step": 18144 }, { "epoch": 3.69, "learning_rate": 4.859181356292649e-05, "loss": 0.0003, "step": 18145 }, { "epoch": 3.69, "learning_rate": 4.857753027170433e-05, "loss": 0.0076, "step": 18146 }, { "epoch": 3.7, "learning_rate": 4.8563248674428775e-05, "loss": 0.0045, "step": 18147 }, { "epoch": 3.7, "learning_rate": 4.8548968771338496e-05, "loss": 0.0023, "step": 18148 }, { "epoch": 3.7, "learning_rate": 4.853469056267199e-05, "loss": 0.0031, "step": 18149 }, { "epoch": 3.7, "learning_rate": 4.852041404866757e-05, "loss": 0.0074, "step": 18150 }, { "epoch": 3.7, "learning_rate": 4.85061392295639e-05, "loss": 0.0036, "step": 18151 }, { "epoch": 3.7, "learning_rate": 4.849186610559918e-05, "loss": 0.003, "step": 18152 }, { "epoch": 3.7, "learning_rate": 4.847759467701202e-05, "loss": 0.0113, "step": 18153 }, { "epoch": 3.7, "learning_rate": 4.84633249440406e-05, "loss": 0.0089, "step": 18154 }, { "epoch": 3.7, "learning_rate": 4.844905690692332e-05, "loss": 0.0031, "step": 18155 }, { "epoch": 3.7, "learning_rate": 4.8434790565898496e-05, "loss": 0.0027, "step": 18156 }, { "epoch": 3.7, "learning_rate": 4.842052592120438e-05, "loss": 0.0002, "step": 18157 }, { "epoch": 3.7, "learning_rate": 4.8406262973079216e-05, "loss": 0.0015, "step": 18158 }, { "epoch": 3.7, "learning_rate": 4.839200172176124e-05, "loss": 0.0019, "step": 18159 }, { "epoch": 3.7, "learning_rate": 4.8377742167488627e-05, "loss": 0.0022, "step": 18160 }, { "epoch": 3.7, "learning_rate": 4.836348431049956e-05, "loss": 0.0116, "step": 18161 }, { "epoch": 3.7, "learning_rate": 4.8349228151032145e-05, "loss": 0.0056, "step": 18162 }, { "epoch": 3.7, "learning_rate": 4.8334973689324496e-05, "loss": 0.0006, "step": 18163 }, { "epoch": 3.7, "learning_rate": 4.8320720925614756e-05, "loss": 0.0007, "step": 18164 }, { "epoch": 3.7, "learning_rate": 4.830646986014081e-05, "loss": 0.0215, "step": 18165 }, { "epoch": 3.7, "learning_rate": 4.829222049314087e-05, "loss": 0.0038, "step": 18166 }, { "epoch": 3.7, "learning_rate": 4.827797282485278e-05, "loss": 0.0027, "step": 18167 }, { "epoch": 3.7, "learning_rate": 4.8263726855514574e-05, "loss": 0.0051, "step": 18168 }, { "epoch": 3.7, "learning_rate": 4.824948258536416e-05, "loss": 0.0063, "step": 18169 }, { "epoch": 3.7, "learning_rate": 4.823524001463939e-05, "loss": 0.0052, "step": 18170 }, { "epoch": 3.7, "learning_rate": 4.822099914357832e-05, "loss": 0.0006, "step": 18171 }, { "epoch": 3.7, "learning_rate": 4.8206759972418654e-05, "loss": 0.0032, "step": 18172 }, { "epoch": 3.7, "learning_rate": 4.819252250139821e-05, "loss": 0.0004, "step": 18173 }, { "epoch": 3.7, "learning_rate": 4.817828673075485e-05, "loss": 0.0274, "step": 18174 }, { "epoch": 3.7, "learning_rate": 4.816405266072628e-05, "loss": 0.0056, "step": 18175 }, { "epoch": 3.7, "learning_rate": 4.8149820291550264e-05, "loss": 0.0002, "step": 18176 }, { "epoch": 3.7, "learning_rate": 4.813558962346451e-05, "loss": 0.0054, "step": 18177 }, { "epoch": 3.7, "learning_rate": 4.81213606567067e-05, "loss": 0.0064, "step": 18178 }, { "epoch": 3.7, "learning_rate": 4.810713339151446e-05, "loss": 0.0017, "step": 18179 }, { "epoch": 3.7, "learning_rate": 4.809290782812543e-05, "loss": 0.0062, "step": 18180 }, { "epoch": 3.7, "learning_rate": 4.8078683966777214e-05, "loss": 0.0008, "step": 18181 }, { "epoch": 3.7, "learning_rate": 4.8064461807707397e-05, "loss": 0.0078, "step": 18182 }, { "epoch": 3.7, "learning_rate": 4.8050241351153394e-05, "loss": 0.0052, "step": 18183 }, { "epoch": 3.7, "learning_rate": 4.8036022597352916e-05, "loss": 0.0066, "step": 18184 }, { "epoch": 3.7, "learning_rate": 4.802180554654323e-05, "loss": 0.0052, "step": 18185 }, { "epoch": 3.7, "learning_rate": 4.800759019896197e-05, "loss": 0.013, "step": 18186 }, { "epoch": 3.7, "learning_rate": 4.7993376554846447e-05, "loss": 0.0002, "step": 18187 }, { "epoch": 3.7, "learning_rate": 4.7979164614434066e-05, "loss": 0.0057, "step": 18188 }, { "epoch": 3.7, "learning_rate": 4.796495437796223e-05, "loss": 0.0025, "step": 18189 }, { "epoch": 3.7, "learning_rate": 4.7950745845668273e-05, "loss": 0.004, "step": 18190 }, { "epoch": 3.7, "learning_rate": 4.793653901778947e-05, "loss": 0.0032, "step": 18191 }, { "epoch": 3.7, "learning_rate": 4.792233389456313e-05, "loss": 0.0033, "step": 18192 }, { "epoch": 3.7, "learning_rate": 4.790813047622649e-05, "loss": 0.0015, "step": 18193 }, { "epoch": 3.7, "learning_rate": 4.7893928763016795e-05, "loss": 0.0095, "step": 18194 }, { "epoch": 3.7, "learning_rate": 4.787972875517129e-05, "loss": 0.0121, "step": 18195 }, { "epoch": 3.71, "learning_rate": 4.7865530452926955e-05, "loss": 0.0073, "step": 18196 }, { "epoch": 3.71, "learning_rate": 4.785133385652117e-05, "loss": 0.0101, "step": 18197 }, { "epoch": 3.71, "learning_rate": 4.7837138966190825e-05, "loss": 0.005, "step": 18198 }, { "epoch": 3.71, "learning_rate": 4.78229457821732e-05, "loss": 0.0067, "step": 18199 }, { "epoch": 3.71, "learning_rate": 4.780875430470521e-05, "loss": 0.0004, "step": 18200 }, { "epoch": 3.71, "learning_rate": 4.779456453402387e-05, "loss": 0.0096, "step": 18201 }, { "epoch": 3.71, "learning_rate": 4.778037647036633e-05, "loss": 0.0027, "step": 18202 }, { "epoch": 3.71, "learning_rate": 4.7766190113969357e-05, "loss": 0.0023, "step": 18203 }, { "epoch": 3.71, "learning_rate": 4.7752005465070094e-05, "loss": 0.0092, "step": 18204 }, { "epoch": 3.71, "learning_rate": 4.773782252390528e-05, "loss": 0.0071, "step": 18205 }, { "epoch": 3.71, "learning_rate": 4.7723641290711876e-05, "loss": 0.0063, "step": 18206 }, { "epoch": 3.71, "learning_rate": 4.770946176572672e-05, "loss": 0.0033, "step": 18207 }, { "epoch": 3.71, "learning_rate": 4.7695283949186636e-05, "loss": 0.0054, "step": 18208 }, { "epoch": 3.71, "learning_rate": 4.768110784132843e-05, "loss": 0.0032, "step": 18209 }, { "epoch": 3.71, "learning_rate": 4.766693344238887e-05, "loss": 0.0034, "step": 18210 }, { "epoch": 3.71, "learning_rate": 4.765276075260469e-05, "loss": 0.0018, "step": 18211 }, { "epoch": 3.71, "learning_rate": 4.763858977221258e-05, "loss": 0.0049, "step": 18212 }, { "epoch": 3.71, "learning_rate": 4.76244205014493e-05, "loss": 0.0012, "step": 18213 }, { "epoch": 3.71, "learning_rate": 4.761025294055135e-05, "loss": 0.0084, "step": 18214 }, { "epoch": 3.71, "learning_rate": 4.759608708975555e-05, "loss": 0.0017, "step": 18215 }, { "epoch": 3.71, "learning_rate": 4.75819229492983e-05, "loss": 0.0052, "step": 18216 }, { "epoch": 3.71, "learning_rate": 4.7567760519416344e-05, "loss": 0.0029, "step": 18217 }, { "epoch": 3.71, "learning_rate": 4.755359980034611e-05, "loss": 0.0099, "step": 18218 }, { "epoch": 3.71, "learning_rate": 4.753944079232414e-05, "loss": 0.0014, "step": 18219 }, { "epoch": 3.71, "learning_rate": 4.752528349558691e-05, "loss": 0.0027, "step": 18220 }, { "epoch": 3.71, "learning_rate": 4.751112791037088e-05, "loss": 0.0091, "step": 18221 }, { "epoch": 3.71, "learning_rate": 4.7496974036912474e-05, "loss": 0.0035, "step": 18222 }, { "epoch": 3.71, "learning_rate": 4.748282187544811e-05, "loss": 0.0037, "step": 18223 }, { "epoch": 3.71, "learning_rate": 4.746867142621411e-05, "loss": 0.0018, "step": 18224 }, { "epoch": 3.71, "learning_rate": 4.745452268944685e-05, "loss": 0.003, "step": 18225 }, { "epoch": 3.71, "learning_rate": 4.744037566538264e-05, "loss": 0.0042, "step": 18226 }, { "epoch": 3.71, "learning_rate": 4.7426230354257726e-05, "loss": 0.0068, "step": 18227 }, { "epoch": 3.71, "learning_rate": 4.7412086756308456e-05, "loss": 0.0018, "step": 18228 }, { "epoch": 3.71, "learning_rate": 4.739794487177088e-05, "loss": 0.0104, "step": 18229 }, { "epoch": 3.71, "learning_rate": 4.7383804700881406e-05, "loss": 0.0041, "step": 18230 }, { "epoch": 3.71, "learning_rate": 4.7369666243875987e-05, "loss": 0.0006, "step": 18231 }, { "epoch": 3.71, "learning_rate": 4.735552950099093e-05, "loss": 0.0056, "step": 18232 }, { "epoch": 3.71, "learning_rate": 4.734139447246231e-05, "loss": 0.0043, "step": 18233 }, { "epoch": 3.71, "learning_rate": 4.7327261158526116e-05, "loss": 0.0029, "step": 18234 }, { "epoch": 3.71, "learning_rate": 4.7313129559418545e-05, "loss": 0.0019, "step": 18235 }, { "epoch": 3.71, "learning_rate": 4.7298999675375466e-05, "loss": 0.0128, "step": 18236 }, { "epoch": 3.71, "learning_rate": 4.728487150663304e-05, "loss": 0.0036, "step": 18237 }, { "epoch": 3.71, "learning_rate": 4.727074505342711e-05, "loss": 0.0079, "step": 18238 }, { "epoch": 3.71, "learning_rate": 4.725662031599363e-05, "loss": 0.003, "step": 18239 }, { "epoch": 3.71, "learning_rate": 4.724249729456856e-05, "loss": 0.0087, "step": 18240 }, { "epoch": 3.71, "learning_rate": 4.722837598938773e-05, "loss": 0.001, "step": 18241 }, { "epoch": 3.71, "learning_rate": 4.721425640068703e-05, "loss": 0.0024, "step": 18242 }, { "epoch": 3.71, "learning_rate": 4.720013852870227e-05, "loss": 0.0076, "step": 18243 }, { "epoch": 3.71, "learning_rate": 4.7186022373669254e-05, "loss": 0.0096, "step": 18244 }, { "epoch": 3.72, "learning_rate": 4.7171907935823725e-05, "loss": 0.0521, "step": 18245 }, { "epoch": 3.72, "learning_rate": 4.715779521540149e-05, "loss": 0.0048, "step": 18246 }, { "epoch": 3.72, "learning_rate": 4.71436842126381e-05, "loss": 0.0071, "step": 18247 }, { "epoch": 3.72, "learning_rate": 4.712957492776944e-05, "loss": 0.0006, "step": 18248 }, { "epoch": 3.72, "learning_rate": 4.7115467361030964e-05, "loss": 0.0043, "step": 18249 }, { "epoch": 3.72, "learning_rate": 4.710136151265849e-05, "loss": 0.0018, "step": 18250 }, { "epoch": 3.72, "learning_rate": 4.7087257382887455e-05, "loss": 0.0018, "step": 18251 }, { "epoch": 3.72, "learning_rate": 4.70731549719535e-05, "loss": 0.0153, "step": 18252 }, { "epoch": 3.72, "learning_rate": 4.7059054280092124e-05, "loss": 0.0122, "step": 18253 }, { "epoch": 3.72, "learning_rate": 4.704495530753883e-05, "loss": 0.0026, "step": 18254 }, { "epoch": 3.72, "learning_rate": 4.7030858054529205e-05, "loss": 0.0095, "step": 18255 }, { "epoch": 3.72, "learning_rate": 4.701676252129857e-05, "loss": 0.0199, "step": 18256 }, { "epoch": 3.72, "learning_rate": 4.7002668708082405e-05, "loss": 0.003, "step": 18257 }, { "epoch": 3.72, "learning_rate": 4.698857661511609e-05, "loss": 0.0016, "step": 18258 }, { "epoch": 3.72, "learning_rate": 4.6974486242635004e-05, "loss": 0.0014, "step": 18259 }, { "epoch": 3.72, "learning_rate": 4.696039759087446e-05, "loss": 0.0059, "step": 18260 }, { "epoch": 3.72, "learning_rate": 4.694631066006978e-05, "loss": 0.0023, "step": 18261 }, { "epoch": 3.72, "learning_rate": 4.693222545045622e-05, "loss": 0.0036, "step": 18262 }, { "epoch": 3.72, "learning_rate": 4.691814196226908e-05, "loss": 0.0027, "step": 18263 }, { "epoch": 3.72, "learning_rate": 4.690406019574359e-05, "loss": 0.0007, "step": 18264 }, { "epoch": 3.72, "learning_rate": 4.688998015111479e-05, "loss": 0.0007, "step": 18265 }, { "epoch": 3.72, "learning_rate": 4.6875901828618064e-05, "loss": 0.0017, "step": 18266 }, { "epoch": 3.72, "learning_rate": 4.6861825228488345e-05, "loss": 0.0016, "step": 18267 }, { "epoch": 3.72, "learning_rate": 4.6847750350960924e-05, "loss": 0.0115, "step": 18268 }, { "epoch": 3.72, "learning_rate": 4.683367719627073e-05, "loss": 0.0021, "step": 18269 }, { "epoch": 3.72, "learning_rate": 4.681960576465288e-05, "loss": 0.0061, "step": 18270 }, { "epoch": 3.72, "learning_rate": 4.6805536056342385e-05, "loss": 0.0028, "step": 18271 }, { "epoch": 3.72, "learning_rate": 4.679146807157421e-05, "loss": 0.0008, "step": 18272 }, { "epoch": 3.72, "learning_rate": 4.677740181058336e-05, "loss": 0.0024, "step": 18273 }, { "epoch": 3.72, "learning_rate": 4.676333727360472e-05, "loss": 0.0091, "step": 18274 }, { "epoch": 3.72, "learning_rate": 4.674927446087325e-05, "loss": 0.0048, "step": 18275 }, { "epoch": 3.72, "learning_rate": 4.673521337262378e-05, "loss": 0.0023, "step": 18276 }, { "epoch": 3.72, "learning_rate": 4.672115400909117e-05, "loss": 0.0205, "step": 18277 }, { "epoch": 3.72, "learning_rate": 4.670709637051025e-05, "loss": 0.0019, "step": 18278 }, { "epoch": 3.72, "learning_rate": 4.669304045711584e-05, "loss": 0.0042, "step": 18279 }, { "epoch": 3.72, "learning_rate": 4.667898626914258e-05, "loss": 0.0003, "step": 18280 }, { "epoch": 3.72, "learning_rate": 4.666493380682536e-05, "loss": 0.0095, "step": 18281 }, { "epoch": 3.72, "learning_rate": 4.665088307039871e-05, "loss": 0.0049, "step": 18282 }, { "epoch": 3.72, "learning_rate": 4.66368340600975e-05, "loss": 0.0003, "step": 18283 }, { "epoch": 3.72, "learning_rate": 4.662278677615621e-05, "loss": 0.0018, "step": 18284 }, { "epoch": 3.72, "learning_rate": 4.660874121880949e-05, "loss": 0.0057, "step": 18285 }, { "epoch": 3.72, "learning_rate": 4.6594697388292054e-05, "loss": 0.003, "step": 18286 }, { "epoch": 3.72, "learning_rate": 4.6580655284838305e-05, "loss": 0.0084, "step": 18287 }, { "epoch": 3.72, "learning_rate": 4.6566614908682825e-05, "loss": 0.005, "step": 18288 }, { "epoch": 3.72, "learning_rate": 4.6552576260060135e-05, "loss": 0.0074, "step": 18289 }, { "epoch": 3.72, "learning_rate": 4.6538539339204686e-05, "loss": 0.0021, "step": 18290 }, { "epoch": 3.72, "learning_rate": 4.6524504146350924e-05, "loss": 0.0002, "step": 18291 }, { "epoch": 3.72, "learning_rate": 4.6510470681733274e-05, "loss": 0.0014, "step": 18292 }, { "epoch": 3.72, "learning_rate": 4.6496438945586106e-05, "loss": 0.0073, "step": 18293 }, { "epoch": 3.73, "learning_rate": 4.6482408938143785e-05, "loss": 0.0016, "step": 18294 }, { "epoch": 3.73, "learning_rate": 4.646838065964064e-05, "loss": 0.0032, "step": 18295 }, { "epoch": 3.73, "learning_rate": 4.645435411031098e-05, "loss": 0.0106, "step": 18296 }, { "epoch": 3.73, "learning_rate": 4.644032929038908e-05, "loss": 0.0053, "step": 18297 }, { "epoch": 3.73, "learning_rate": 4.6426306200109084e-05, "loss": 0.0022, "step": 18298 }, { "epoch": 3.73, "learning_rate": 4.64122848397054e-05, "loss": 0.0031, "step": 18299 }, { "epoch": 3.73, "learning_rate": 4.6398265209411966e-05, "loss": 0.0008, "step": 18300 }, { "epoch": 3.73, "learning_rate": 4.6384247309463186e-05, "loss": 0.0003, "step": 18301 }, { "epoch": 3.73, "learning_rate": 4.6370231140093e-05, "loss": 0.004, "step": 18302 }, { "epoch": 3.73, "learning_rate": 4.6356216701535576e-05, "loss": 0.0046, "step": 18303 }, { "epoch": 3.73, "learning_rate": 4.634220399402497e-05, "loss": 0.0015, "step": 18304 }, { "epoch": 3.73, "learning_rate": 4.632819301779524e-05, "loss": 0.01, "step": 18305 }, { "epoch": 3.73, "learning_rate": 4.631418377308037e-05, "loss": 0.001, "step": 18306 }, { "epoch": 3.73, "learning_rate": 4.630017626011435e-05, "loss": 0.0017, "step": 18307 }, { "epoch": 3.73, "learning_rate": 4.628617047913113e-05, "loss": 0.0015, "step": 18308 }, { "epoch": 3.73, "learning_rate": 4.627216643036465e-05, "loss": 0.0045, "step": 18309 }, { "epoch": 3.73, "learning_rate": 4.6258164114048784e-05, "loss": 0.0006, "step": 18310 }, { "epoch": 3.73, "learning_rate": 4.62441635304174e-05, "loss": 0.0172, "step": 18311 }, { "epoch": 3.73, "learning_rate": 4.623016467970439e-05, "loss": 0.0064, "step": 18312 }, { "epoch": 3.73, "learning_rate": 4.621616756214342e-05, "loss": 0.0047, "step": 18313 }, { "epoch": 3.73, "learning_rate": 4.62021721779684e-05, "loss": 0.0008, "step": 18314 }, { "epoch": 3.73, "learning_rate": 4.618817852741308e-05, "loss": 0.0057, "step": 18315 }, { "epoch": 3.73, "learning_rate": 4.617418661071105e-05, "loss": 0.0006, "step": 18316 }, { "epoch": 3.73, "learning_rate": 4.616019642809618e-05, "loss": 0.0076, "step": 18317 }, { "epoch": 3.73, "learning_rate": 4.614620797980193e-05, "loss": 0.0056, "step": 18318 }, { "epoch": 3.73, "learning_rate": 4.6132221266062166e-05, "loss": 0.0029, "step": 18319 }, { "epoch": 3.73, "learning_rate": 4.611823628711031e-05, "loss": 0.0203, "step": 18320 }, { "epoch": 3.73, "learning_rate": 4.610425304318e-05, "loss": 0.0031, "step": 18321 }, { "epoch": 3.73, "learning_rate": 4.609027153450478e-05, "loss": 0.0018, "step": 18322 }, { "epoch": 3.73, "learning_rate": 4.607629176131818e-05, "loss": 0.0011, "step": 18323 }, { "epoch": 3.73, "learning_rate": 4.606231372385366e-05, "loss": 0.0001, "step": 18324 }, { "epoch": 3.73, "learning_rate": 4.604833742234471e-05, "loss": 0.0066, "step": 18325 }, { "epoch": 3.73, "learning_rate": 4.603436285702474e-05, "loss": 0.0015, "step": 18326 }, { "epoch": 3.73, "learning_rate": 4.602039002812717e-05, "loss": 0.0004, "step": 18327 }, { "epoch": 3.73, "learning_rate": 4.6006418935885345e-05, "loss": 0.004, "step": 18328 }, { "epoch": 3.73, "learning_rate": 4.599244958053264e-05, "loss": 0.0065, "step": 18329 }, { "epoch": 3.73, "learning_rate": 4.5978481962302397e-05, "loss": 0.0033, "step": 18330 }, { "epoch": 3.73, "learning_rate": 4.5964516081427765e-05, "loss": 0.0094, "step": 18331 }, { "epoch": 3.73, "learning_rate": 4.595055193814219e-05, "loss": 0.0042, "step": 18332 }, { "epoch": 3.73, "learning_rate": 4.593658953267871e-05, "loss": 0.0059, "step": 18333 }, { "epoch": 3.73, "learning_rate": 4.592262886527072e-05, "loss": 0.0019, "step": 18334 }, { "epoch": 3.73, "learning_rate": 4.590866993615123e-05, "loss": 0.0054, "step": 18335 }, { "epoch": 3.73, "learning_rate": 4.589471274555344e-05, "loss": 0.0026, "step": 18336 }, { "epoch": 3.73, "learning_rate": 4.588075729371046e-05, "loss": 0.002, "step": 18337 }, { "epoch": 3.73, "learning_rate": 4.5866803580855386e-05, "loss": 0.0045, "step": 18338 }, { "epoch": 3.73, "learning_rate": 4.5852851607221246e-05, "loss": 0.0077, "step": 18339 }, { "epoch": 3.73, "learning_rate": 4.583890137304107e-05, "loss": 0.0039, "step": 18340 }, { "epoch": 3.73, "learning_rate": 4.582495287854787e-05, "loss": 0.0023, "step": 18341 }, { "epoch": 3.73, "learning_rate": 4.58110061239746e-05, "loss": 0.0021, "step": 18342 }, { "epoch": 3.73, "learning_rate": 4.579706110955425e-05, "loss": 0.0108, "step": 18343 }, { "epoch": 3.74, "learning_rate": 4.578311783551956e-05, "loss": 0.0022, "step": 18344 }, { "epoch": 3.74, "learning_rate": 4.5769176302103594e-05, "loss": 0.0003, "step": 18345 }, { "epoch": 3.74, "learning_rate": 4.5755236509539124e-05, "loss": 0.0018, "step": 18346 }, { "epoch": 3.74, "learning_rate": 4.5741298458058975e-05, "loss": 0.0148, "step": 18347 }, { "epoch": 3.74, "learning_rate": 4.5727362147896006e-05, "loss": 0.0082, "step": 18348 }, { "epoch": 3.74, "learning_rate": 4.5713427579282826e-05, "loss": 0.002, "step": 18349 }, { "epoch": 3.74, "learning_rate": 4.569949475245234e-05, "loss": 0.004, "step": 18350 }, { "epoch": 3.74, "learning_rate": 4.5685563667637075e-05, "loss": 0.0084, "step": 18351 }, { "epoch": 3.74, "learning_rate": 4.5671634325069925e-05, "loss": 0.0044, "step": 18352 }, { "epoch": 3.74, "learning_rate": 4.5657706724983344e-05, "loss": 0.0026, "step": 18353 }, { "epoch": 3.74, "learning_rate": 4.5643780867610024e-05, "loss": 0.0029, "step": 18354 }, { "epoch": 3.74, "learning_rate": 4.562985675318256e-05, "loss": 0.0017, "step": 18355 }, { "epoch": 3.74, "learning_rate": 4.5615934381933476e-05, "loss": 0.0032, "step": 18356 }, { "epoch": 3.74, "learning_rate": 4.5602013754095344e-05, "loss": 0.0024, "step": 18357 }, { "epoch": 3.74, "learning_rate": 4.558809486990066e-05, "loss": 0.001, "step": 18358 }, { "epoch": 3.74, "learning_rate": 4.5574177729581867e-05, "loss": 0.003, "step": 18359 }, { "epoch": 3.74, "learning_rate": 4.5560262333371434e-05, "loss": 0.004, "step": 18360 }, { "epoch": 3.74, "learning_rate": 4.5546348681501804e-05, "loss": 0.0077, "step": 18361 }, { "epoch": 3.74, "learning_rate": 4.553243677420523e-05, "loss": 0.0043, "step": 18362 }, { "epoch": 3.74, "learning_rate": 4.551852661171425e-05, "loss": 0.0051, "step": 18363 }, { "epoch": 3.74, "learning_rate": 4.5504618194261e-05, "loss": 0.0041, "step": 18364 }, { "epoch": 3.74, "learning_rate": 4.549071152207797e-05, "loss": 0.0002, "step": 18365 }, { "epoch": 3.74, "learning_rate": 4.5476806595397295e-05, "loss": 0.0005, "step": 18366 }, { "epoch": 3.74, "learning_rate": 4.54629034144512e-05, "loss": 0.0039, "step": 18367 }, { "epoch": 3.74, "learning_rate": 4.544900197947203e-05, "loss": 0.0099, "step": 18368 }, { "epoch": 3.74, "learning_rate": 4.543510229069181e-05, "loss": 0.0018, "step": 18369 }, { "epoch": 3.74, "learning_rate": 4.5421204348342824e-05, "loss": 0.0033, "step": 18370 }, { "epoch": 3.74, "learning_rate": 4.540730815265711e-05, "loss": 0.0136, "step": 18371 }, { "epoch": 3.74, "learning_rate": 4.5393413703866775e-05, "loss": 0.0039, "step": 18372 }, { "epoch": 3.74, "learning_rate": 4.5379521002203884e-05, "loss": 0.014, "step": 18373 }, { "epoch": 3.74, "learning_rate": 4.53656300479005e-05, "loss": 0.0066, "step": 18374 }, { "epoch": 3.74, "learning_rate": 4.535174084118858e-05, "loss": 0.0082, "step": 18375 }, { "epoch": 3.74, "learning_rate": 4.533785338230014e-05, "loss": 0.0045, "step": 18376 }, { "epoch": 3.74, "learning_rate": 4.532396767146709e-05, "loss": 0.005, "step": 18377 }, { "epoch": 3.74, "learning_rate": 4.53100837089214e-05, "loss": 0.0028, "step": 18378 }, { "epoch": 3.74, "learning_rate": 4.5296201494894915e-05, "loss": 0.0082, "step": 18379 }, { "epoch": 3.74, "learning_rate": 4.5282321029619505e-05, "loss": 0.0027, "step": 18380 }, { "epoch": 3.74, "learning_rate": 4.526844231332706e-05, "loss": 0.0005, "step": 18381 }, { "epoch": 3.74, "learning_rate": 4.5254565346249216e-05, "loss": 0.0013, "step": 18382 }, { "epoch": 3.74, "learning_rate": 4.524069012861794e-05, "loss": 0.0015, "step": 18383 }, { "epoch": 3.74, "learning_rate": 4.522681666066481e-05, "loss": 0.002, "step": 18384 }, { "epoch": 3.74, "learning_rate": 4.521294494262171e-05, "loss": 0.0043, "step": 18385 }, { "epoch": 3.74, "learning_rate": 4.519907497472017e-05, "loss": 0.0062, "step": 18386 }, { "epoch": 3.74, "learning_rate": 4.51852067571919e-05, "loss": 0.0179, "step": 18387 }, { "epoch": 3.74, "learning_rate": 4.517134029026854e-05, "loss": 0.0058, "step": 18388 }, { "epoch": 3.74, "learning_rate": 4.515747557418167e-05, "loss": 0.0104, "step": 18389 }, { "epoch": 3.74, "learning_rate": 4.514361260916287e-05, "loss": 0.0208, "step": 18390 }, { "epoch": 3.74, "learning_rate": 4.512975139544366e-05, "loss": 0.0107, "step": 18391 }, { "epoch": 3.74, "learning_rate": 4.511589193325556e-05, "loss": 0.0017, "step": 18392 }, { "epoch": 3.75, "learning_rate": 4.510203422283006e-05, "loss": 0.0032, "step": 18393 }, { "epoch": 3.75, "learning_rate": 4.5088178264398624e-05, "loss": 0.0116, "step": 18394 }, { "epoch": 3.75, "learning_rate": 4.507432405819257e-05, "loss": 0.0062, "step": 18395 }, { "epoch": 3.75, "learning_rate": 4.5060471604443444e-05, "loss": 0.0027, "step": 18396 }, { "epoch": 3.75, "learning_rate": 4.504662090338245e-05, "loss": 0.0027, "step": 18397 }, { "epoch": 3.75, "learning_rate": 4.503277195524104e-05, "loss": 0.0031, "step": 18398 }, { "epoch": 3.75, "learning_rate": 4.501892476025053e-05, "loss": 0.0019, "step": 18399 }, { "epoch": 3.75, "learning_rate": 4.500507931864204e-05, "loss": 0.0089, "step": 18400 }, { "epoch": 3.75, "learning_rate": 4.4991235630647023e-05, "loss": 0.0024, "step": 18401 }, { "epoch": 3.75, "learning_rate": 4.497739369649649e-05, "loss": 0.0025, "step": 18402 }, { "epoch": 3.75, "learning_rate": 4.496355351642181e-05, "loss": 0.0106, "step": 18403 }, { "epoch": 3.75, "learning_rate": 4.494971509065403e-05, "loss": 0.0009, "step": 18404 }, { "epoch": 3.75, "learning_rate": 4.493587841942428e-05, "loss": 0.0047, "step": 18405 }, { "epoch": 3.75, "learning_rate": 4.492204350296369e-05, "loss": 0.0064, "step": 18406 }, { "epoch": 3.75, "learning_rate": 4.4908210341503334e-05, "loss": 0.0068, "step": 18407 }, { "epoch": 3.75, "learning_rate": 4.489437893527423e-05, "loss": 0.0031, "step": 18408 }, { "epoch": 3.75, "learning_rate": 4.488054928450741e-05, "loss": 0.0021, "step": 18409 }, { "epoch": 3.75, "learning_rate": 4.486672138943383e-05, "loss": 0.0085, "step": 18410 }, { "epoch": 3.75, "learning_rate": 4.485289525028447e-05, "loss": 0.0007, "step": 18411 }, { "epoch": 3.75, "learning_rate": 4.483907086729027e-05, "loss": 0.0029, "step": 18412 }, { "epoch": 3.75, "learning_rate": 4.482524824068202e-05, "loss": 0.0019, "step": 18413 }, { "epoch": 3.75, "learning_rate": 4.481142737069072e-05, "loss": 0.003, "step": 18414 }, { "epoch": 3.75, "learning_rate": 4.479760825754707e-05, "loss": 0.0034, "step": 18415 }, { "epoch": 3.75, "learning_rate": 4.4783790901482016e-05, "loss": 0.0011, "step": 18416 }, { "epoch": 3.75, "learning_rate": 4.476997530272623e-05, "loss": 0.002, "step": 18417 }, { "epoch": 3.75, "learning_rate": 4.475616146151051e-05, "loss": 0.0136, "step": 18418 }, { "epoch": 3.75, "learning_rate": 4.474234937806554e-05, "loss": 0.0021, "step": 18419 }, { "epoch": 3.75, "learning_rate": 4.472853905262197e-05, "loss": 0.0049, "step": 18420 }, { "epoch": 3.75, "learning_rate": 4.4714730485410624e-05, "loss": 0.0032, "step": 18421 }, { "epoch": 3.75, "learning_rate": 4.470092367666196e-05, "loss": 0.0213, "step": 18422 }, { "epoch": 3.75, "learning_rate": 4.468711862660662e-05, "loss": 0.0002, "step": 18423 }, { "epoch": 3.75, "learning_rate": 4.4673315335475204e-05, "loss": 0.0071, "step": 18424 }, { "epoch": 3.75, "learning_rate": 4.465951380349825e-05, "loss": 0.0019, "step": 18425 }, { "epoch": 3.75, "learning_rate": 4.464571403090626e-05, "loss": 0.0054, "step": 18426 }, { "epoch": 3.75, "learning_rate": 4.463191601792971e-05, "loss": 0.0039, "step": 18427 }, { "epoch": 3.75, "learning_rate": 4.461811976479906e-05, "loss": 0.0001, "step": 18428 }, { "epoch": 3.75, "learning_rate": 4.460432527174473e-05, "loss": 0.0027, "step": 18429 }, { "epoch": 3.75, "learning_rate": 4.459053253899712e-05, "loss": 0.0021, "step": 18430 }, { "epoch": 3.75, "learning_rate": 4.457674156678658e-05, "loss": 0.0041, "step": 18431 }, { "epoch": 3.75, "learning_rate": 4.456295235534352e-05, "loss": 0.0075, "step": 18432 }, { "epoch": 3.75, "learning_rate": 4.454916490489807e-05, "loss": 0.0049, "step": 18433 }, { "epoch": 3.75, "learning_rate": 4.453537921568073e-05, "loss": 0.0011, "step": 18434 }, { "epoch": 3.75, "learning_rate": 4.4521595287921566e-05, "loss": 0.0057, "step": 18435 }, { "epoch": 3.75, "learning_rate": 4.450781312185089e-05, "loss": 0.0064, "step": 18436 }, { "epoch": 3.75, "learning_rate": 4.4494032717698855e-05, "loss": 0.0021, "step": 18437 }, { "epoch": 3.75, "learning_rate": 4.4480254075695624e-05, "loss": 0.0103, "step": 18438 }, { "epoch": 3.75, "learning_rate": 4.4466477196071345e-05, "loss": 0.0032, "step": 18439 }, { "epoch": 3.75, "learning_rate": 4.44527020790561e-05, "loss": 0.0038, "step": 18440 }, { "epoch": 3.75, "learning_rate": 4.443892872487997e-05, "loss": 0.0018, "step": 18441 }, { "epoch": 3.76, "learning_rate": 4.4425157133772976e-05, "loss": 0.0028, "step": 18442 }, { "epoch": 3.76, "learning_rate": 4.441138730596516e-05, "loss": 0.0046, "step": 18443 }, { "epoch": 3.76, "learning_rate": 4.4397619241686474e-05, "loss": 0.0024, "step": 18444 }, { "epoch": 3.76, "learning_rate": 4.4383852941166953e-05, "loss": 0.0071, "step": 18445 }, { "epoch": 3.76, "learning_rate": 4.437008840463635e-05, "loss": 0.0074, "step": 18446 }, { "epoch": 3.76, "learning_rate": 4.4356325632324755e-05, "loss": 0.0006, "step": 18447 }, { "epoch": 3.76, "learning_rate": 4.4342564624461826e-05, "loss": 0.0058, "step": 18448 }, { "epoch": 3.76, "learning_rate": 4.432880538127763e-05, "loss": 0.0038, "step": 18449 }, { "epoch": 3.76, "learning_rate": 4.4315047903001795e-05, "loss": 0.0117, "step": 18450 }, { "epoch": 3.76, "learning_rate": 4.430129218986411e-05, "loss": 0.0063, "step": 18451 }, { "epoch": 3.76, "learning_rate": 4.4287538242094454e-05, "loss": 0.0023, "step": 18452 }, { "epoch": 3.76, "learning_rate": 4.4273786059922354e-05, "loss": 0.0104, "step": 18453 }, { "epoch": 3.76, "learning_rate": 4.426003564357771e-05, "loss": 0.0033, "step": 18454 }, { "epoch": 3.76, "learning_rate": 4.424628699329002e-05, "loss": 0.0017, "step": 18455 }, { "epoch": 3.76, "learning_rate": 4.423254010928896e-05, "loss": 0.0116, "step": 18456 }, { "epoch": 3.76, "learning_rate": 4.421879499180413e-05, "loss": 0.0043, "step": 18457 }, { "epoch": 3.76, "learning_rate": 4.4205051641065096e-05, "loss": 0.0056, "step": 18458 }, { "epoch": 3.76, "learning_rate": 4.41913100573014e-05, "loss": 0.0013, "step": 18459 }, { "epoch": 3.76, "learning_rate": 4.4177570240742566e-05, "loss": 0.0006, "step": 18460 }, { "epoch": 3.76, "learning_rate": 4.416383219161805e-05, "loss": 0.0041, "step": 18461 }, { "epoch": 3.76, "learning_rate": 4.4150095910157314e-05, "loss": 0.0059, "step": 18462 }, { "epoch": 3.76, "learning_rate": 4.4136361396589845e-05, "loss": 0.0008, "step": 18463 }, { "epoch": 3.76, "learning_rate": 4.412262865114487e-05, "loss": 0.0062, "step": 18464 }, { "epoch": 3.76, "learning_rate": 4.4108897674051945e-05, "loss": 0.0028, "step": 18465 }, { "epoch": 3.76, "learning_rate": 4.409516846554022e-05, "loss": 0.0016, "step": 18466 }, { "epoch": 3.76, "learning_rate": 4.4081441025839194e-05, "loss": 0.0024, "step": 18467 }, { "epoch": 3.76, "learning_rate": 4.406771535517798e-05, "loss": 0.0001, "step": 18468 }, { "epoch": 3.76, "learning_rate": 4.405399145378588e-05, "loss": 0.001, "step": 18469 }, { "epoch": 3.76, "learning_rate": 4.404026932189211e-05, "loss": 0.0031, "step": 18470 }, { "epoch": 3.76, "learning_rate": 4.402654895972588e-05, "loss": 0.0054, "step": 18471 }, { "epoch": 3.76, "learning_rate": 4.401283036751629e-05, "loss": 0.0044, "step": 18472 }, { "epoch": 3.76, "learning_rate": 4.399911354549252e-05, "loss": 0.0006, "step": 18473 }, { "epoch": 3.76, "learning_rate": 4.398539849388362e-05, "loss": 0.0089, "step": 18474 }, { "epoch": 3.76, "learning_rate": 4.397168521291871e-05, "loss": 0.0043, "step": 18475 }, { "epoch": 3.76, "learning_rate": 4.395797370282678e-05, "loss": 0.0006, "step": 18476 }, { "epoch": 3.76, "learning_rate": 4.394426396383687e-05, "loss": 0.0088, "step": 18477 }, { "epoch": 3.76, "learning_rate": 4.3930555996177986e-05, "loss": 0.0017, "step": 18478 }, { "epoch": 3.76, "learning_rate": 4.3916849800078936e-05, "loss": 0.0057, "step": 18479 }, { "epoch": 3.76, "learning_rate": 4.39031453757688e-05, "loss": 0.0044, "step": 18480 }, { "epoch": 3.76, "learning_rate": 4.3889442723476395e-05, "loss": 0.0036, "step": 18481 }, { "epoch": 3.76, "learning_rate": 4.3875741843430614e-05, "loss": 0.0048, "step": 18482 }, { "epoch": 3.76, "learning_rate": 4.386204273586029e-05, "loss": 0.0014, "step": 18483 }, { "epoch": 3.76, "learning_rate": 4.384834540099414e-05, "loss": 0.0042, "step": 18484 }, { "epoch": 3.76, "learning_rate": 4.383464983906107e-05, "loss": 0.0011, "step": 18485 }, { "epoch": 3.76, "learning_rate": 4.38209560502897e-05, "loss": 0.004, "step": 18486 }, { "epoch": 3.76, "learning_rate": 4.38072640349088e-05, "loss": 0.0004, "step": 18487 }, { "epoch": 3.76, "learning_rate": 4.3793573793147035e-05, "loss": 0.0171, "step": 18488 }, { "epoch": 3.76, "learning_rate": 4.377988532523307e-05, "loss": 0.0007, "step": 18489 }, { "epoch": 3.76, "learning_rate": 4.3766198631395526e-05, "loss": 0.0022, "step": 18490 }, { "epoch": 3.77, "learning_rate": 4.3752513711863e-05, "loss": 0.001, "step": 18491 }, { "epoch": 3.77, "learning_rate": 4.3738830566864044e-05, "loss": 0.0008, "step": 18492 }, { "epoch": 3.77, "learning_rate": 4.37251491966272e-05, "loss": 0.0029, "step": 18493 }, { "epoch": 3.77, "learning_rate": 4.3711469601380984e-05, "loss": 0.0077, "step": 18494 }, { "epoch": 3.77, "learning_rate": 4.369779178135384e-05, "loss": 0.0063, "step": 18495 }, { "epoch": 3.77, "learning_rate": 4.368411573677429e-05, "loss": 0.0013, "step": 18496 }, { "epoch": 3.77, "learning_rate": 4.367044146787061e-05, "loss": 0.0041, "step": 18497 }, { "epoch": 3.77, "learning_rate": 4.365676897487135e-05, "loss": 0.0027, "step": 18498 }, { "epoch": 3.77, "learning_rate": 4.364309825800469e-05, "loss": 0.0024, "step": 18499 }, { "epoch": 3.77, "learning_rate": 4.3629429317499145e-05, "loss": 0.0029, "step": 18500 }, { "epoch": 3.77, "learning_rate": 4.361576215358288e-05, "loss": 0.001, "step": 18501 }, { "epoch": 3.77, "learning_rate": 4.3602096766484196e-05, "loss": 0.005, "step": 18502 }, { "epoch": 3.77, "learning_rate": 4.3588433156431333e-05, "loss": 0.0082, "step": 18503 }, { "epoch": 3.77, "learning_rate": 4.357477132365247e-05, "loss": 0.0071, "step": 18504 }, { "epoch": 3.77, "learning_rate": 4.35611112683759e-05, "loss": 0.0086, "step": 18505 }, { "epoch": 3.77, "learning_rate": 4.354745299082964e-05, "loss": 0.0115, "step": 18506 }, { "epoch": 3.77, "learning_rate": 4.353379649124186e-05, "loss": 0.0094, "step": 18507 }, { "epoch": 3.77, "learning_rate": 4.352014176984065e-05, "loss": 0.0015, "step": 18508 }, { "epoch": 3.77, "learning_rate": 4.350648882685412e-05, "loss": 0.0103, "step": 18509 }, { "epoch": 3.77, "learning_rate": 4.349283766251015e-05, "loss": 0.0048, "step": 18510 }, { "epoch": 3.77, "learning_rate": 4.347918827703687e-05, "loss": 0.0053, "step": 18511 }, { "epoch": 3.77, "learning_rate": 4.3465540670662245e-05, "loss": 0.0003, "step": 18512 }, { "epoch": 3.77, "learning_rate": 4.345189484361417e-05, "loss": 0.0024, "step": 18513 }, { "epoch": 3.77, "learning_rate": 4.343825079612063e-05, "loss": 0.0034, "step": 18514 }, { "epoch": 3.77, "learning_rate": 4.342460852840935e-05, "loss": 0.0091, "step": 18515 }, { "epoch": 3.77, "learning_rate": 4.341096804070839e-05, "loss": 0.0033, "step": 18516 }, { "epoch": 3.77, "learning_rate": 4.339732933324535e-05, "loss": 0.0061, "step": 18517 }, { "epoch": 3.77, "learning_rate": 4.338369240624824e-05, "loss": 0.0011, "step": 18518 }, { "epoch": 3.77, "learning_rate": 4.337005725994468e-05, "loss": 0.0076, "step": 18519 }, { "epoch": 3.77, "learning_rate": 4.335642389456244e-05, "loss": 0.0035, "step": 18520 }, { "epoch": 3.77, "learning_rate": 4.334279231032921e-05, "loss": 0.0002, "step": 18521 }, { "epoch": 3.77, "learning_rate": 4.332916250747269e-05, "loss": 0.005, "step": 18522 }, { "epoch": 3.77, "learning_rate": 4.331553448622052e-05, "loss": 0.0017, "step": 18523 }, { "epoch": 3.77, "learning_rate": 4.3301908246800296e-05, "loss": 0.0032, "step": 18524 }, { "epoch": 3.77, "learning_rate": 4.328828378943961e-05, "loss": 0.0038, "step": 18525 }, { "epoch": 3.77, "learning_rate": 4.3274661114366024e-05, "loss": 0.0026, "step": 18526 }, { "epoch": 3.77, "learning_rate": 4.326104022180705e-05, "loss": 0.0011, "step": 18527 }, { "epoch": 3.77, "learning_rate": 4.324742111199019e-05, "loss": 0.0012, "step": 18528 }, { "epoch": 3.77, "learning_rate": 4.323380378514295e-05, "loss": 0.0059, "step": 18529 }, { "epoch": 3.77, "learning_rate": 4.322018824149264e-05, "loss": 0.0037, "step": 18530 }, { "epoch": 3.77, "learning_rate": 4.320657448126683e-05, "loss": 0.0069, "step": 18531 }, { "epoch": 3.77, "learning_rate": 4.319296250469271e-05, "loss": 0.0064, "step": 18532 }, { "epoch": 3.77, "learning_rate": 4.317935231199781e-05, "loss": 0.0002, "step": 18533 }, { "epoch": 3.77, "learning_rate": 4.3165743903409377e-05, "loss": 0.0022, "step": 18534 }, { "epoch": 3.77, "learning_rate": 4.315213727915461e-05, "loss": 0.0037, "step": 18535 }, { "epoch": 3.77, "learning_rate": 4.3138532439460915e-05, "loss": 0.0005, "step": 18536 }, { "epoch": 3.77, "learning_rate": 4.3124929384555415e-05, "loss": 0.0031, "step": 18537 }, { "epoch": 3.77, "learning_rate": 4.311132811466534e-05, "loss": 0.0105, "step": 18538 }, { "epoch": 3.77, "learning_rate": 4.309772863001783e-05, "loss": 0.002, "step": 18539 }, { "epoch": 3.78, "learning_rate": 4.308413093084006e-05, "loss": 0.0009, "step": 18540 }, { "epoch": 3.78, "learning_rate": 4.3070535017359116e-05, "loss": 0.0059, "step": 18541 }, { "epoch": 3.78, "learning_rate": 4.305694088980208e-05, "loss": 0.001, "step": 18542 }, { "epoch": 3.78, "learning_rate": 4.3043348548396e-05, "loss": 0.0049, "step": 18543 }, { "epoch": 3.78, "learning_rate": 4.3029757993367906e-05, "loss": 0.0038, "step": 18544 }, { "epoch": 3.78, "learning_rate": 4.301616922494477e-05, "loss": 0.013, "step": 18545 }, { "epoch": 3.78, "learning_rate": 4.300258224335355e-05, "loss": 0.0038, "step": 18546 }, { "epoch": 3.78, "learning_rate": 4.2988997048821214e-05, "loss": 0.0065, "step": 18547 }, { "epoch": 3.78, "learning_rate": 4.297541364157455e-05, "loss": 0.0009, "step": 18548 }, { "epoch": 3.78, "learning_rate": 4.2961832021840575e-05, "loss": 0.0045, "step": 18549 }, { "epoch": 3.78, "learning_rate": 4.2948252189845974e-05, "loss": 0.0051, "step": 18550 }, { "epoch": 3.78, "learning_rate": 4.293467414581773e-05, "loss": 0.0047, "step": 18551 }, { "epoch": 3.78, "learning_rate": 4.2921097889982474e-05, "loss": 0.0034, "step": 18552 }, { "epoch": 3.78, "learning_rate": 4.290752342256702e-05, "loss": 0.0052, "step": 18553 }, { "epoch": 3.78, "learning_rate": 4.289395074379808e-05, "loss": 0.0092, "step": 18554 }, { "epoch": 3.78, "learning_rate": 4.2880379853902316e-05, "loss": 0.0223, "step": 18555 }, { "epoch": 3.78, "learning_rate": 4.286681075310643e-05, "loss": 0.009, "step": 18556 }, { "epoch": 3.78, "learning_rate": 4.2853243441637025e-05, "loss": 0.0113, "step": 18557 }, { "epoch": 3.78, "learning_rate": 4.283967791972071e-05, "loss": 0.0092, "step": 18558 }, { "epoch": 3.78, "learning_rate": 4.282611418758406e-05, "loss": 0.0207, "step": 18559 }, { "epoch": 3.78, "learning_rate": 4.281255224545364e-05, "loss": 0.0047, "step": 18560 }, { "epoch": 3.78, "learning_rate": 4.279899209355586e-05, "loss": 0.0034, "step": 18561 }, { "epoch": 3.78, "learning_rate": 4.278543373211734e-05, "loss": 0.0003, "step": 18562 }, { "epoch": 3.78, "learning_rate": 4.2771877161364364e-05, "loss": 0.0033, "step": 18563 }, { "epoch": 3.78, "learning_rate": 4.2758322381523494e-05, "loss": 0.004, "step": 18564 }, { "epoch": 3.78, "learning_rate": 4.274476939282113e-05, "loss": 0.002, "step": 18565 }, { "epoch": 3.78, "learning_rate": 4.273121819548349e-05, "loss": 0.0091, "step": 18566 }, { "epoch": 3.78, "learning_rate": 4.2717668789737055e-05, "loss": 0.0045, "step": 18567 }, { "epoch": 3.78, "learning_rate": 4.2704121175807984e-05, "loss": 0.0029, "step": 18568 }, { "epoch": 3.78, "learning_rate": 4.269057535392273e-05, "loss": 0.0033, "step": 18569 }, { "epoch": 3.78, "learning_rate": 4.267703132430737e-05, "loss": 0.0073, "step": 18570 }, { "epoch": 3.78, "learning_rate": 4.266348908718818e-05, "loss": 0.0085, "step": 18571 }, { "epoch": 3.78, "learning_rate": 4.2649948642791326e-05, "loss": 0.0018, "step": 18572 }, { "epoch": 3.78, "learning_rate": 4.263640999134296e-05, "loss": 0.001, "step": 18573 }, { "epoch": 3.78, "learning_rate": 4.262287313306922e-05, "loss": 0.0049, "step": 18574 }, { "epoch": 3.78, "learning_rate": 4.26093380681962e-05, "loss": 0.0039, "step": 18575 }, { "epoch": 3.78, "learning_rate": 4.2595804796949916e-05, "loss": 0.005, "step": 18576 }, { "epoch": 3.78, "learning_rate": 4.2582273319556454e-05, "loss": 0.0045, "step": 18577 }, { "epoch": 3.78, "learning_rate": 4.2568743636241794e-05, "loss": 0.0004, "step": 18578 }, { "epoch": 3.78, "learning_rate": 4.25552157472319e-05, "loss": 0.0054, "step": 18579 }, { "epoch": 3.78, "learning_rate": 4.254168965275277e-05, "loss": 0.0133, "step": 18580 }, { "epoch": 3.78, "learning_rate": 4.252816535303016e-05, "loss": 0.0019, "step": 18581 }, { "epoch": 3.78, "learning_rate": 4.251464284829017e-05, "loss": 0.0104, "step": 18582 }, { "epoch": 3.78, "learning_rate": 4.2501122138758477e-05, "loss": 0.0089, "step": 18583 }, { "epoch": 3.78, "learning_rate": 4.2487603224660965e-05, "loss": 0.0037, "step": 18584 }, { "epoch": 3.78, "learning_rate": 4.247408610622343e-05, "loss": 0.004, "step": 18585 }, { "epoch": 3.78, "learning_rate": 4.246057078367158e-05, "loss": 0.0042, "step": 18586 }, { "epoch": 3.78, "learning_rate": 4.244705725723127e-05, "loss": 0.0051, "step": 18587 }, { "epoch": 3.78, "learning_rate": 4.2433545527128094e-05, "loss": 0.0072, "step": 18588 }, { "epoch": 3.79, "learning_rate": 4.2420035593587746e-05, "loss": 0.0016, "step": 18589 }, { "epoch": 3.79, "learning_rate": 4.240652745683587e-05, "loss": 0.0008, "step": 18590 }, { "epoch": 3.79, "learning_rate": 4.23930211170981e-05, "loss": 0.0028, "step": 18591 }, { "epoch": 3.79, "learning_rate": 4.237951657459998e-05, "loss": 0.0003, "step": 18592 }, { "epoch": 3.79, "learning_rate": 4.236601382956709e-05, "loss": 0.008, "step": 18593 }, { "epoch": 3.79, "learning_rate": 4.235251288222495e-05, "loss": 0.002, "step": 18594 }, { "epoch": 3.79, "learning_rate": 4.233901373279904e-05, "loss": 0.0033, "step": 18595 }, { "epoch": 3.79, "learning_rate": 4.232551638151481e-05, "loss": 0.0026, "step": 18596 }, { "epoch": 3.79, "learning_rate": 4.231202082859773e-05, "loss": 0.0031, "step": 18597 }, { "epoch": 3.79, "learning_rate": 4.22985270742732e-05, "loss": 0.0022, "step": 18598 }, { "epoch": 3.79, "learning_rate": 4.2285035118766496e-05, "loss": 0.0025, "step": 18599 }, { "epoch": 3.79, "learning_rate": 4.227154496230311e-05, "loss": 0.0031, "step": 18600 }, { "epoch": 3.79, "learning_rate": 4.2258056605108195e-05, "loss": 0.0005, "step": 18601 }, { "epoch": 3.79, "learning_rate": 4.22445700474072e-05, "loss": 0.0033, "step": 18602 }, { "epoch": 3.79, "learning_rate": 4.223108528942524e-05, "loss": 0.0071, "step": 18603 }, { "epoch": 3.79, "learning_rate": 4.221760233138757e-05, "loss": 0.0056, "step": 18604 }, { "epoch": 3.79, "learning_rate": 4.2204121173519424e-05, "loss": 0.0013, "step": 18605 }, { "epoch": 3.79, "learning_rate": 4.219064181604591e-05, "loss": 0.0092, "step": 18606 }, { "epoch": 3.79, "learning_rate": 4.217716425919219e-05, "loss": 0.006, "step": 18607 }, { "epoch": 3.79, "learning_rate": 4.216368850318337e-05, "loss": 0.005, "step": 18608 }, { "epoch": 3.79, "learning_rate": 4.215021454824449e-05, "loss": 0.0025, "step": 18609 }, { "epoch": 3.79, "learning_rate": 4.2136742394600606e-05, "loss": 0.0057, "step": 18610 }, { "epoch": 3.79, "learning_rate": 4.2123272042476785e-05, "loss": 0.0008, "step": 18611 }, { "epoch": 3.79, "learning_rate": 4.210980349209787e-05, "loss": 0.0025, "step": 18612 }, { "epoch": 3.79, "learning_rate": 4.209633674368896e-05, "loss": 0.0035, "step": 18613 }, { "epoch": 3.79, "learning_rate": 4.208287179747485e-05, "loss": 0.002, "step": 18614 }, { "epoch": 3.79, "learning_rate": 4.206940865368055e-05, "loss": 0.0027, "step": 18615 }, { "epoch": 3.79, "learning_rate": 4.205594731253083e-05, "loss": 0.0053, "step": 18616 }, { "epoch": 3.79, "learning_rate": 4.2042487774250497e-05, "loss": 0.0092, "step": 18617 }, { "epoch": 3.79, "learning_rate": 4.202903003906449e-05, "loss": 0.0059, "step": 18618 }, { "epoch": 3.79, "learning_rate": 4.2015574107197414e-05, "loss": 0.0024, "step": 18619 }, { "epoch": 3.79, "learning_rate": 4.200211997887417e-05, "loss": 0.0072, "step": 18620 }, { "epoch": 3.79, "learning_rate": 4.1988667654319335e-05, "loss": 0.0135, "step": 18621 }, { "epoch": 3.79, "learning_rate": 4.1975217133757626e-05, "loss": 0.0077, "step": 18622 }, { "epoch": 3.79, "learning_rate": 4.1961768417413724e-05, "loss": 0.0112, "step": 18623 }, { "epoch": 3.79, "learning_rate": 4.194832150551221e-05, "loss": 0.0062, "step": 18624 }, { "epoch": 3.79, "learning_rate": 4.19348763982777e-05, "loss": 0.0012, "step": 18625 }, { "epoch": 3.79, "learning_rate": 4.192143309593473e-05, "loss": 0.0029, "step": 18626 }, { "epoch": 3.79, "learning_rate": 4.190799159870785e-05, "loss": 0.0047, "step": 18627 }, { "epoch": 3.79, "learning_rate": 4.189455190682153e-05, "loss": 0.0094, "step": 18628 }, { "epoch": 3.79, "learning_rate": 4.188111402050028e-05, "loss": 0.0034, "step": 18629 }, { "epoch": 3.79, "learning_rate": 4.186767793996851e-05, "loss": 0.0085, "step": 18630 }, { "epoch": 3.79, "learning_rate": 4.185424366545066e-05, "loss": 0.0028, "step": 18631 }, { "epoch": 3.79, "learning_rate": 4.1840811197171006e-05, "loss": 0.0073, "step": 18632 }, { "epoch": 3.79, "learning_rate": 4.182738053535406e-05, "loss": 0.0031, "step": 18633 }, { "epoch": 3.79, "learning_rate": 4.1813951680224e-05, "loss": 0.0006, "step": 18634 }, { "epoch": 3.79, "learning_rate": 4.180052463200516e-05, "loss": 0.0033, "step": 18635 }, { "epoch": 3.79, "learning_rate": 4.1787099390921815e-05, "loss": 0.0032, "step": 18636 }, { "epoch": 3.79, "learning_rate": 4.177367595719816e-05, "loss": 0.0015, "step": 18637 }, { "epoch": 3.8, "learning_rate": 4.1760254331058404e-05, "loss": 0.0052, "step": 18638 }, { "epoch": 3.8, "learning_rate": 4.174683451272674e-05, "loss": 0.0041, "step": 18639 }, { "epoch": 3.8, "learning_rate": 4.173341650242726e-05, "loss": 0.0006, "step": 18640 }, { "epoch": 3.8, "learning_rate": 4.17200003003841e-05, "loss": 0.0019, "step": 18641 }, { "epoch": 3.8, "learning_rate": 4.1706585906821334e-05, "loss": 0.0077, "step": 18642 }, { "epoch": 3.8, "learning_rate": 4.1693173321962985e-05, "loss": 0.0018, "step": 18643 }, { "epoch": 3.8, "learning_rate": 4.1679762546033145e-05, "loss": 0.0034, "step": 18644 }, { "epoch": 3.8, "learning_rate": 4.1666353579255654e-05, "loss": 0.0096, "step": 18645 }, { "epoch": 3.8, "learning_rate": 4.165294642185459e-05, "loss": 0.0015, "step": 18646 }, { "epoch": 3.8, "learning_rate": 4.1639541074053826e-05, "loss": 0.0033, "step": 18647 }, { "epoch": 3.8, "learning_rate": 4.162613753607729e-05, "loss": 0.0054, "step": 18648 }, { "epoch": 3.8, "learning_rate": 4.161273580814887e-05, "loss": 0.0043, "step": 18649 }, { "epoch": 3.8, "learning_rate": 4.159933589049226e-05, "loss": 0.0048, "step": 18650 }, { "epoch": 3.8, "learning_rate": 4.158593778333147e-05, "loss": 0.0067, "step": 18651 }, { "epoch": 3.8, "learning_rate": 4.157254148689006e-05, "loss": 0.0005, "step": 18652 }, { "epoch": 3.8, "learning_rate": 4.155914700139197e-05, "loss": 0.0002, "step": 18653 }, { "epoch": 3.8, "learning_rate": 4.1545754327060765e-05, "loss": 0.0165, "step": 18654 }, { "epoch": 3.8, "learning_rate": 4.15323634641202e-05, "loss": 0.0029, "step": 18655 }, { "epoch": 3.8, "learning_rate": 4.1518974412793906e-05, "loss": 0.0073, "step": 18656 }, { "epoch": 3.8, "learning_rate": 4.150558717330552e-05, "loss": 0.0017, "step": 18657 }, { "epoch": 3.8, "learning_rate": 4.1492201745878604e-05, "loss": 0.0032, "step": 18658 }, { "epoch": 3.8, "learning_rate": 4.1478818130736767e-05, "loss": 0.0227, "step": 18659 }, { "epoch": 3.8, "learning_rate": 4.146543632810351e-05, "loss": 0.0062, "step": 18660 }, { "epoch": 3.8, "learning_rate": 4.145205633820233e-05, "loss": 0.0091, "step": 18661 }, { "epoch": 3.8, "learning_rate": 4.1438678161256764e-05, "loss": 0.0018, "step": 18662 }, { "epoch": 3.8, "learning_rate": 4.142530179749009e-05, "loss": 0.0075, "step": 18663 }, { "epoch": 3.8, "learning_rate": 4.141192724712594e-05, "loss": 0.0029, "step": 18664 }, { "epoch": 3.8, "learning_rate": 4.1398554510387476e-05, "loss": 0.0003, "step": 18665 }, { "epoch": 3.8, "learning_rate": 4.1385183587498235e-05, "loss": 0.0009, "step": 18666 }, { "epoch": 3.8, "learning_rate": 4.1371814478681406e-05, "loss": 0.0019, "step": 18667 }, { "epoch": 3.8, "learning_rate": 4.135844718416034e-05, "loss": 0.0022, "step": 18668 }, { "epoch": 3.8, "learning_rate": 4.1345081704158275e-05, "loss": 0.0011, "step": 18669 }, { "epoch": 3.8, "learning_rate": 4.13317180388984e-05, "loss": 0.0055, "step": 18670 }, { "epoch": 3.8, "learning_rate": 4.1318356188604056e-05, "loss": 0.0068, "step": 18671 }, { "epoch": 3.8, "learning_rate": 4.130499615349826e-05, "loss": 0.0064, "step": 18672 }, { "epoch": 3.8, "learning_rate": 4.129163793380422e-05, "loss": 0.0064, "step": 18673 }, { "epoch": 3.8, "learning_rate": 4.127828152974502e-05, "loss": 0.0023, "step": 18674 }, { "epoch": 3.8, "learning_rate": 4.126492694154373e-05, "loss": 0.0051, "step": 18675 }, { "epoch": 3.8, "learning_rate": 4.125157416942343e-05, "loss": 0.0044, "step": 18676 }, { "epoch": 3.8, "learning_rate": 4.123822321360712e-05, "loss": 0.0033, "step": 18677 }, { "epoch": 3.8, "learning_rate": 4.122487407431777e-05, "loss": 0.0016, "step": 18678 }, { "epoch": 3.8, "learning_rate": 4.1211526751778354e-05, "loss": 0.0004, "step": 18679 }, { "epoch": 3.8, "learning_rate": 4.119818124621181e-05, "loss": 0.0031, "step": 18680 }, { "epoch": 3.8, "learning_rate": 4.1184837557841e-05, "loss": 0.0049, "step": 18681 }, { "epoch": 3.8, "learning_rate": 4.117149568688887e-05, "loss": 0.0022, "step": 18682 }, { "epoch": 3.8, "learning_rate": 4.115815563357809e-05, "loss": 0.0006, "step": 18683 }, { "epoch": 3.8, "learning_rate": 4.1144817398131634e-05, "loss": 0.0076, "step": 18684 }, { "epoch": 3.8, "learning_rate": 4.113148098077218e-05, "loss": 0.0024, "step": 18685 }, { "epoch": 3.8, "learning_rate": 4.1118146381722514e-05, "loss": 0.0015, "step": 18686 }, { "epoch": 3.81, "learning_rate": 4.11048136012053e-05, "loss": 0.0126, "step": 18687 }, { "epoch": 3.81, "learning_rate": 4.1091482639443266e-05, "loss": 0.0002, "step": 18688 }, { "epoch": 3.81, "learning_rate": 4.107815349665906e-05, "loss": 0.0146, "step": 18689 }, { "epoch": 3.81, "learning_rate": 4.1064826173075284e-05, "loss": 0.0037, "step": 18690 }, { "epoch": 3.81, "learning_rate": 4.1051500668914554e-05, "loss": 0.0048, "step": 18691 }, { "epoch": 3.81, "learning_rate": 4.1038176984399415e-05, "loss": 0.0006, "step": 18692 }, { "epoch": 3.81, "learning_rate": 4.102485511975239e-05, "loss": 0.0097, "step": 18693 }, { "epoch": 3.81, "learning_rate": 4.101153507519598e-05, "loss": 0.0023, "step": 18694 }, { "epoch": 3.81, "learning_rate": 4.0998216850952745e-05, "loss": 0.003, "step": 18695 }, { "epoch": 3.81, "learning_rate": 4.0984900447244924e-05, "loss": 0.0032, "step": 18696 }, { "epoch": 3.81, "learning_rate": 4.0971585864295145e-05, "loss": 0.0026, "step": 18697 }, { "epoch": 3.81, "learning_rate": 4.095827310232559e-05, "loss": 0.0093, "step": 18698 }, { "epoch": 3.81, "learning_rate": 4.094496216155877e-05, "loss": 0.0054, "step": 18699 }, { "epoch": 3.81, "learning_rate": 4.093165304221696e-05, "loss": 0.0079, "step": 18700 }, { "epoch": 3.81, "learning_rate": 4.091834574452235e-05, "loss": 0.0049, "step": 18701 }, { "epoch": 3.81, "learning_rate": 4.090504026869736e-05, "loss": 0.0164, "step": 18702 }, { "epoch": 3.81, "learning_rate": 4.089173661496404e-05, "loss": 0.004, "step": 18703 }, { "epoch": 3.81, "learning_rate": 4.087843478354476e-05, "loss": 0.0006, "step": 18704 }, { "epoch": 3.81, "learning_rate": 4.0865134774661553e-05, "loss": 0.0028, "step": 18705 }, { "epoch": 3.81, "learning_rate": 4.085183658853661e-05, "loss": 0.0044, "step": 18706 }, { "epoch": 3.81, "learning_rate": 4.083854022539202e-05, "loss": 0.0051, "step": 18707 }, { "epoch": 3.81, "learning_rate": 4.0825245685449866e-05, "loss": 0.0007, "step": 18708 }, { "epoch": 3.81, "learning_rate": 4.081195296893221e-05, "loss": 0.0002, "step": 18709 }, { "epoch": 3.81, "learning_rate": 4.079866207606101e-05, "loss": 0.0037, "step": 18710 }, { "epoch": 3.81, "learning_rate": 4.078537300705831e-05, "loss": 0.0011, "step": 18711 }, { "epoch": 3.81, "learning_rate": 4.077208576214604e-05, "loss": 0.0061, "step": 18712 }, { "epoch": 3.81, "learning_rate": 4.075880034154616e-05, "loss": 0.0066, "step": 18713 }, { "epoch": 3.81, "learning_rate": 4.074551674548043e-05, "loss": 0.0106, "step": 18714 }, { "epoch": 3.81, "learning_rate": 4.0732234974170894e-05, "loss": 0.0073, "step": 18715 }, { "epoch": 3.81, "learning_rate": 4.0718955027839206e-05, "loss": 0.0057, "step": 18716 }, { "epoch": 3.81, "learning_rate": 4.0705676906707326e-05, "loss": 0.0021, "step": 18717 }, { "epoch": 3.81, "learning_rate": 4.069240061099692e-05, "loss": 0.0006, "step": 18718 }, { "epoch": 3.81, "learning_rate": 4.0679126140929754e-05, "loss": 0.0107, "step": 18719 }, { "epoch": 3.81, "learning_rate": 4.066585349672754e-05, "loss": 0.0037, "step": 18720 }, { "epoch": 3.81, "learning_rate": 4.0652582678611954e-05, "loss": 0.0078, "step": 18721 }, { "epoch": 3.81, "learning_rate": 4.063931368680464e-05, "loss": 0.0031, "step": 18722 }, { "epoch": 3.81, "learning_rate": 4.0626046521527225e-05, "loss": 0.0067, "step": 18723 }, { "epoch": 3.81, "learning_rate": 4.0612781183001285e-05, "loss": 0.0042, "step": 18724 }, { "epoch": 3.81, "learning_rate": 4.059951767144839e-05, "loss": 0.0108, "step": 18725 }, { "epoch": 3.81, "learning_rate": 4.058625598709005e-05, "loss": 0.0039, "step": 18726 }, { "epoch": 3.81, "learning_rate": 4.057299613014777e-05, "loss": 0.0029, "step": 18727 }, { "epoch": 3.81, "learning_rate": 4.055973810084306e-05, "loss": 0.0033, "step": 18728 }, { "epoch": 3.81, "learning_rate": 4.054648189939722e-05, "loss": 0.0001, "step": 18729 }, { "epoch": 3.81, "learning_rate": 4.053322752603178e-05, "loss": 0.0041, "step": 18730 }, { "epoch": 3.81, "learning_rate": 4.051997498096808e-05, "loss": 0.004, "step": 18731 }, { "epoch": 3.81, "learning_rate": 4.050672426442745e-05, "loss": 0.0015, "step": 18732 }, { "epoch": 3.81, "learning_rate": 4.049347537663126e-05, "loss": 0.0022, "step": 18733 }, { "epoch": 3.81, "learning_rate": 4.048022831780065e-05, "loss": 0.0124, "step": 18734 }, { "epoch": 3.81, "learning_rate": 4.046698308815704e-05, "loss": 0.0037, "step": 18735 }, { "epoch": 3.82, "learning_rate": 4.045373968792154e-05, "loss": 0.0018, "step": 18736 }, { "epoch": 3.82, "learning_rate": 4.044049811731535e-05, "loss": 0.0041, "step": 18737 }, { "epoch": 3.82, "learning_rate": 4.042725837655967e-05, "loss": 0.0061, "step": 18738 }, { "epoch": 3.82, "learning_rate": 4.041402046587559e-05, "loss": 0.0014, "step": 18739 }, { "epoch": 3.82, "learning_rate": 4.0400784385484244e-05, "loss": 0.0048, "step": 18740 }, { "epoch": 3.82, "learning_rate": 4.038755013560668e-05, "loss": 0.0013, "step": 18741 }, { "epoch": 3.82, "learning_rate": 4.037431771646393e-05, "loss": 0.006, "step": 18742 }, { "epoch": 3.82, "learning_rate": 4.0361087128277e-05, "loss": 0.0113, "step": 18743 }, { "epoch": 3.82, "learning_rate": 4.034785837126688e-05, "loss": 0.0029, "step": 18744 }, { "epoch": 3.82, "learning_rate": 4.033463144565451e-05, "loss": 0.0007, "step": 18745 }, { "epoch": 3.82, "learning_rate": 4.0321406351660846e-05, "loss": 0.0039, "step": 18746 }, { "epoch": 3.82, "learning_rate": 4.0308183089506644e-05, "loss": 0.0065, "step": 18747 }, { "epoch": 3.82, "learning_rate": 4.029496165941293e-05, "loss": 0.0035, "step": 18748 }, { "epoch": 3.82, "learning_rate": 4.028174206160035e-05, "loss": 0.0004, "step": 18749 }, { "epoch": 3.82, "learning_rate": 4.026852429628986e-05, "loss": 0.0017, "step": 18750 }, { "epoch": 3.82, "learning_rate": 4.025530836370211e-05, "loss": 0.0038, "step": 18751 }, { "epoch": 3.82, "learning_rate": 4.0242094264057835e-05, "loss": 0.0012, "step": 18752 }, { "epoch": 3.82, "learning_rate": 4.022888199757785e-05, "loss": 0.0055, "step": 18753 }, { "epoch": 3.82, "learning_rate": 4.0215671564482654e-05, "loss": 0.0012, "step": 18754 }, { "epoch": 3.82, "learning_rate": 4.020246296499307e-05, "loss": 0.0061, "step": 18755 }, { "epoch": 3.82, "learning_rate": 4.0189256199329564e-05, "loss": 0.0003, "step": 18756 }, { "epoch": 3.82, "learning_rate": 4.017605126771277e-05, "loss": 0.0094, "step": 18757 }, { "epoch": 3.82, "learning_rate": 4.016284817036321e-05, "loss": 0.0061, "step": 18758 }, { "epoch": 3.82, "learning_rate": 4.014964690750148e-05, "loss": 0.0082, "step": 18759 }, { "epoch": 3.82, "learning_rate": 4.0136447479347904e-05, "loss": 0.0018, "step": 18760 }, { "epoch": 3.82, "learning_rate": 4.012324988612309e-05, "loss": 0.017, "step": 18761 }, { "epoch": 3.82, "learning_rate": 4.01100541280474e-05, "loss": 0.0079, "step": 18762 }, { "epoch": 3.82, "learning_rate": 4.009686020534124e-05, "loss": 0.0129, "step": 18763 }, { "epoch": 3.82, "learning_rate": 4.008366811822501e-05, "loss": 0.011, "step": 18764 }, { "epoch": 3.82, "learning_rate": 4.007047786691893e-05, "loss": 0.0064, "step": 18765 }, { "epoch": 3.82, "learning_rate": 4.0057289451643466e-05, "loss": 0.0003, "step": 18766 }, { "epoch": 3.82, "learning_rate": 4.00441028726187e-05, "loss": 0.0052, "step": 18767 }, { "epoch": 3.82, "learning_rate": 4.003091813006506e-05, "loss": 0.0007, "step": 18768 }, { "epoch": 3.82, "learning_rate": 4.001773522420263e-05, "loss": 0.0034, "step": 18769 }, { "epoch": 3.82, "learning_rate": 4.000455415525162e-05, "loss": 0.0061, "step": 18770 }, { "epoch": 3.82, "learning_rate": 3.9991374923432195e-05, "loss": 0.0056, "step": 18771 }, { "epoch": 3.82, "learning_rate": 3.997819752896446e-05, "loss": 0.0005, "step": 18772 }, { "epoch": 3.82, "learning_rate": 3.996502197206852e-05, "loss": 0.0067, "step": 18773 }, { "epoch": 3.82, "learning_rate": 3.99518482529644e-05, "loss": 0.0043, "step": 18774 }, { "epoch": 3.82, "learning_rate": 3.9938676371872155e-05, "loss": 0.0045, "step": 18775 }, { "epoch": 3.82, "learning_rate": 3.9925506329011767e-05, "loss": 0.0042, "step": 18776 }, { "epoch": 3.82, "learning_rate": 3.991233812460321e-05, "loss": 0.005, "step": 18777 }, { "epoch": 3.82, "learning_rate": 3.9899171758866406e-05, "loss": 0.0018, "step": 18778 }, { "epoch": 3.82, "learning_rate": 3.988600723202131e-05, "loss": 0.0025, "step": 18779 }, { "epoch": 3.82, "learning_rate": 3.9872844544287654e-05, "loss": 0.0032, "step": 18780 }, { "epoch": 3.82, "learning_rate": 3.985968369588547e-05, "loss": 0.0029, "step": 18781 }, { "epoch": 3.82, "learning_rate": 3.984652468703443e-05, "loss": 0.0002, "step": 18782 }, { "epoch": 3.82, "learning_rate": 3.983336751795431e-05, "loss": 0.0074, "step": 18783 }, { "epoch": 3.82, "learning_rate": 3.9820212188864984e-05, "loss": 0.0117, "step": 18784 }, { "epoch": 3.82, "learning_rate": 3.9807058699986014e-05, "loss": 0.0043, "step": 18785 }, { "epoch": 3.83, "learning_rate": 3.9793907051537263e-05, "loss": 0.0048, "step": 18786 }, { "epoch": 3.83, "learning_rate": 3.978075724373824e-05, "loss": 0.0074, "step": 18787 }, { "epoch": 3.83, "learning_rate": 3.976760927680863e-05, "loss": 0.0017, "step": 18788 }, { "epoch": 3.83, "learning_rate": 3.9754463150968016e-05, "loss": 0.0081, "step": 18789 }, { "epoch": 3.83, "learning_rate": 3.974131886643598e-05, "loss": 0.0072, "step": 18790 }, { "epoch": 3.83, "learning_rate": 3.972817642343203e-05, "loss": 0.0036, "step": 18791 }, { "epoch": 3.83, "learning_rate": 3.971503582217571e-05, "loss": 0.0004, "step": 18792 }, { "epoch": 3.83, "learning_rate": 3.970189706288645e-05, "loss": 0.0001, "step": 18793 }, { "epoch": 3.83, "learning_rate": 3.9688760145783724e-05, "loss": 0.0079, "step": 18794 }, { "epoch": 3.83, "learning_rate": 3.9675625071086934e-05, "loss": 0.0109, "step": 18795 }, { "epoch": 3.83, "learning_rate": 3.966249183901544e-05, "loss": 0.0027, "step": 18796 }, { "epoch": 3.83, "learning_rate": 3.964936044978867e-05, "loss": 0.0021, "step": 18797 }, { "epoch": 3.83, "learning_rate": 3.963623090362579e-05, "loss": 0.0042, "step": 18798 }, { "epoch": 3.83, "learning_rate": 3.9623103200746265e-05, "loss": 0.0004, "step": 18799 }, { "epoch": 3.83, "learning_rate": 3.960997734136918e-05, "loss": 0.002, "step": 18800 }, { "epoch": 3.83, "learning_rate": 3.959685332571393e-05, "loss": 0.0008, "step": 18801 }, { "epoch": 3.83, "learning_rate": 3.95837311539996e-05, "loss": 0.0016, "step": 18802 }, { "epoch": 3.83, "learning_rate": 3.9570610826445375e-05, "loss": 0.0088, "step": 18803 }, { "epoch": 3.83, "learning_rate": 3.95574923432704e-05, "loss": 0.004, "step": 18804 }, { "epoch": 3.83, "learning_rate": 3.954437570469379e-05, "loss": 0.0042, "step": 18805 }, { "epoch": 3.83, "learning_rate": 3.9531260910934586e-05, "loss": 0.0023, "step": 18806 }, { "epoch": 3.83, "learning_rate": 3.951814796221186e-05, "loss": 0.0031, "step": 18807 }, { "epoch": 3.83, "learning_rate": 3.9505036858744615e-05, "loss": 0.0036, "step": 18808 }, { "epoch": 3.83, "learning_rate": 3.9491927600751824e-05, "loss": 0.0068, "step": 18809 }, { "epoch": 3.83, "learning_rate": 3.9478820188452485e-05, "loss": 0.0044, "step": 18810 }, { "epoch": 3.83, "learning_rate": 3.946571462206539e-05, "loss": 0.0071, "step": 18811 }, { "epoch": 3.83, "learning_rate": 3.945261090180958e-05, "loss": 0.002, "step": 18812 }, { "epoch": 3.83, "learning_rate": 3.943950902790377e-05, "loss": 0.0003, "step": 18813 }, { "epoch": 3.83, "learning_rate": 3.9426409000566906e-05, "loss": 0.0021, "step": 18814 }, { "epoch": 3.83, "learning_rate": 3.9413310820017765e-05, "loss": 0.0024, "step": 18815 }, { "epoch": 3.83, "learning_rate": 3.9400214486474983e-05, "loss": 0.0037, "step": 18816 }, { "epoch": 3.83, "learning_rate": 3.9387120000157496e-05, "loss": 0.0033, "step": 18817 }, { "epoch": 3.83, "learning_rate": 3.9374027361283825e-05, "loss": 0.0025, "step": 18818 }, { "epoch": 3.83, "learning_rate": 3.936093657007279e-05, "loss": 0.0013, "step": 18819 }, { "epoch": 3.83, "learning_rate": 3.93478476267429e-05, "loss": 0.0021, "step": 18820 }, { "epoch": 3.83, "learning_rate": 3.9334760531512855e-05, "loss": 0.0075, "step": 18821 }, { "epoch": 3.83, "learning_rate": 3.932167528460119e-05, "loss": 0.0016, "step": 18822 }, { "epoch": 3.83, "learning_rate": 3.930859188622646e-05, "loss": 0.0061, "step": 18823 }, { "epoch": 3.83, "learning_rate": 3.9295510336607204e-05, "loss": 0.005, "step": 18824 }, { "epoch": 3.83, "learning_rate": 3.92824306359619e-05, "loss": 0.0085, "step": 18825 }, { "epoch": 3.83, "learning_rate": 3.926935278450898e-05, "loss": 0.0053, "step": 18826 }, { "epoch": 3.83, "learning_rate": 3.9256276782466905e-05, "loss": 0.0048, "step": 18827 }, { "epoch": 3.83, "learning_rate": 3.924320263005404e-05, "loss": 0.0049, "step": 18828 }, { "epoch": 3.83, "learning_rate": 3.923013032748876e-05, "loss": 0.0023, "step": 18829 }, { "epoch": 3.83, "learning_rate": 3.9217059874989455e-05, "loss": 0.0051, "step": 18830 }, { "epoch": 3.83, "learning_rate": 3.920399127277426e-05, "loss": 0.0091, "step": 18831 }, { "epoch": 3.83, "learning_rate": 3.919092452106165e-05, "loss": 0.0161, "step": 18832 }, { "epoch": 3.83, "learning_rate": 3.917785962006972e-05, "loss": 0.0017, "step": 18833 }, { "epoch": 3.83, "learning_rate": 3.9164796570016735e-05, "loss": 0.0013, "step": 18834 }, { "epoch": 3.84, "learning_rate": 3.9151735371120854e-05, "loss": 0.0301, "step": 18835 }, { "epoch": 3.84, "learning_rate": 3.913867602360019e-05, "loss": 0.0017, "step": 18836 }, { "epoch": 3.84, "learning_rate": 3.9125618527673e-05, "loss": 0.0002, "step": 18837 }, { "epoch": 3.84, "learning_rate": 3.9112562883557216e-05, "loss": 0.0021, "step": 18838 }, { "epoch": 3.84, "learning_rate": 3.9099509091470944e-05, "loss": 0.0037, "step": 18839 }, { "epoch": 3.84, "learning_rate": 3.908645715163223e-05, "loss": 0.0003, "step": 18840 }, { "epoch": 3.84, "learning_rate": 3.9073407064259026e-05, "loss": 0.0021, "step": 18841 }, { "epoch": 3.84, "learning_rate": 3.906035882956932e-05, "loss": 0.0038, "step": 18842 }, { "epoch": 3.84, "learning_rate": 3.904731244778102e-05, "loss": 0.0041, "step": 18843 }, { "epoch": 3.84, "learning_rate": 3.9034267919112066e-05, "loss": 0.0023, "step": 18844 }, { "epoch": 3.84, "learning_rate": 3.902122524378028e-05, "loss": 0.0091, "step": 18845 }, { "epoch": 3.84, "learning_rate": 3.900818442200354e-05, "loss": 0.0021, "step": 18846 }, { "epoch": 3.84, "learning_rate": 3.899514545399961e-05, "loss": 0.0017, "step": 18847 }, { "epoch": 3.84, "learning_rate": 3.898210833998634e-05, "loss": 0.0018, "step": 18848 }, { "epoch": 3.84, "learning_rate": 3.896907308018134e-05, "loss": 0.0057, "step": 18849 }, { "epoch": 3.84, "learning_rate": 3.895603967480248e-05, "loss": 0.005, "step": 18850 }, { "epoch": 3.84, "learning_rate": 3.894300812406729e-05, "loss": 0.0058, "step": 18851 }, { "epoch": 3.84, "learning_rate": 3.892997842819358e-05, "loss": 0.0006, "step": 18852 }, { "epoch": 3.84, "learning_rate": 3.891695058739886e-05, "loss": 0.0084, "step": 18853 }, { "epoch": 3.84, "learning_rate": 3.8903924601900736e-05, "loss": 0.0082, "step": 18854 }, { "epoch": 3.84, "learning_rate": 3.8890900471916774e-05, "loss": 0.0028, "step": 18855 }, { "epoch": 3.84, "learning_rate": 3.887787819766453e-05, "loss": 0.002, "step": 18856 }, { "epoch": 3.84, "learning_rate": 3.886485777936146e-05, "loss": 0.0038, "step": 18857 }, { "epoch": 3.84, "learning_rate": 3.885183921722505e-05, "loss": 0.0015, "step": 18858 }, { "epoch": 3.84, "learning_rate": 3.883882251147273e-05, "loss": 0.001, "step": 18859 }, { "epoch": 3.84, "learning_rate": 3.8825807662321925e-05, "loss": 0.0005, "step": 18860 }, { "epoch": 3.84, "learning_rate": 3.881279466999001e-05, "loss": 0.0048, "step": 18861 }, { "epoch": 3.84, "learning_rate": 3.8799783534694225e-05, "loss": 0.0023, "step": 18862 }, { "epoch": 3.84, "learning_rate": 3.8786774256652055e-05, "loss": 0.001, "step": 18863 }, { "epoch": 3.84, "learning_rate": 3.877376683608058e-05, "loss": 0.0009, "step": 18864 }, { "epoch": 3.84, "learning_rate": 3.876076127319725e-05, "loss": 0.006, "step": 18865 }, { "epoch": 3.84, "learning_rate": 3.874775756821915e-05, "loss": 0.0042, "step": 18866 }, { "epoch": 3.84, "learning_rate": 3.8734755721363444e-05, "loss": 0.0062, "step": 18867 }, { "epoch": 3.84, "learning_rate": 3.872175573284744e-05, "loss": 0.0005, "step": 18868 }, { "epoch": 3.84, "learning_rate": 3.8708757602888074e-05, "loss": 0.0014, "step": 18869 }, { "epoch": 3.84, "learning_rate": 3.869576133170263e-05, "loss": 0.008, "step": 18870 }, { "epoch": 3.84, "learning_rate": 3.868276691950803e-05, "loss": 0.0072, "step": 18871 }, { "epoch": 3.84, "learning_rate": 3.866977436652135e-05, "loss": 0.0049, "step": 18872 }, { "epoch": 3.84, "learning_rate": 3.8656783672959585e-05, "loss": 0.0029, "step": 18873 }, { "epoch": 3.84, "learning_rate": 3.864379483903971e-05, "loss": 0.0019, "step": 18874 }, { "epoch": 3.84, "learning_rate": 3.863080786497865e-05, "loss": 0.0066, "step": 18875 }, { "epoch": 3.84, "learning_rate": 3.8617822750993324e-05, "loss": 0.003, "step": 18876 }, { "epoch": 3.84, "learning_rate": 3.8604839497300626e-05, "loss": 0.0079, "step": 18877 }, { "epoch": 3.84, "learning_rate": 3.859185810411736e-05, "loss": 0.0082, "step": 18878 }, { "epoch": 3.84, "learning_rate": 3.857887857166037e-05, "loss": 0.0039, "step": 18879 }, { "epoch": 3.84, "learning_rate": 3.856590090014643e-05, "loss": 0.0079, "step": 18880 }, { "epoch": 3.84, "learning_rate": 3.8552925089792346e-05, "loss": 0.004, "step": 18881 }, { "epoch": 3.84, "learning_rate": 3.853995114081469e-05, "loss": 0.0039, "step": 18882 }, { "epoch": 3.84, "learning_rate": 3.852697905343032e-05, "loss": 0.0026, "step": 18883 }, { "epoch": 3.85, "learning_rate": 3.851400882785579e-05, "loss": 0.0004, "step": 18884 }, { "epoch": 3.85, "learning_rate": 3.850104046430775e-05, "loss": 0.0026, "step": 18885 }, { "epoch": 3.85, "learning_rate": 3.848807396300281e-05, "loss": 0.01, "step": 18886 }, { "epoch": 3.85, "learning_rate": 3.8475109324157515e-05, "loss": 0.0035, "step": 18887 }, { "epoch": 3.85, "learning_rate": 3.846214654798843e-05, "loss": 0.0016, "step": 18888 }, { "epoch": 3.85, "learning_rate": 3.844918563471204e-05, "loss": 0.01, "step": 18889 }, { "epoch": 3.85, "learning_rate": 3.84362265845448e-05, "loss": 0.0024, "step": 18890 }, { "epoch": 3.85, "learning_rate": 3.8423269397703175e-05, "loss": 0.0017, "step": 18891 }, { "epoch": 3.85, "learning_rate": 3.841031407440358e-05, "loss": 0.0017, "step": 18892 }, { "epoch": 3.85, "learning_rate": 3.8397360614862365e-05, "loss": 0.0041, "step": 18893 }, { "epoch": 3.85, "learning_rate": 3.838440901929594e-05, "loss": 0.0027, "step": 18894 }, { "epoch": 3.85, "learning_rate": 3.837145928792048e-05, "loss": 0.0053, "step": 18895 }, { "epoch": 3.85, "learning_rate": 3.835851142095242e-05, "loss": 0.007, "step": 18896 }, { "epoch": 3.85, "learning_rate": 3.834556541860796e-05, "loss": 0.0048, "step": 18897 }, { "epoch": 3.85, "learning_rate": 3.833262128110332e-05, "loss": 0.0061, "step": 18898 }, { "epoch": 3.85, "learning_rate": 3.831967900865472e-05, "loss": 0.0003, "step": 18899 }, { "epoch": 3.85, "learning_rate": 3.830673860147821e-05, "loss": 0.0122, "step": 18900 }, { "epoch": 3.85, "learning_rate": 3.82938000597901e-05, "loss": 0.0009, "step": 18901 }, { "epoch": 3.85, "learning_rate": 3.8280863383806295e-05, "loss": 0.0159, "step": 18902 }, { "epoch": 3.85, "learning_rate": 3.826792857374304e-05, "loss": 0.005, "step": 18903 }, { "epoch": 3.85, "learning_rate": 3.825499562981623e-05, "loss": 0.0046, "step": 18904 }, { "epoch": 3.85, "learning_rate": 3.824206455224195e-05, "loss": 0.0028, "step": 18905 }, { "epoch": 3.85, "learning_rate": 3.8229135341236146e-05, "loss": 0.0014, "step": 18906 }, { "epoch": 3.85, "learning_rate": 3.8216207997014755e-05, "loss": 0.0239, "step": 18907 }, { "epoch": 3.85, "learning_rate": 3.82032825197937e-05, "loss": 0.0074, "step": 18908 }, { "epoch": 3.85, "learning_rate": 3.819035890978886e-05, "loss": 0.0051, "step": 18909 }, { "epoch": 3.85, "learning_rate": 3.8177437167216094e-05, "loss": 0.0049, "step": 18910 }, { "epoch": 3.85, "learning_rate": 3.8164517292291185e-05, "loss": 0.0023, "step": 18911 }, { "epoch": 3.85, "learning_rate": 3.815159928523e-05, "loss": 0.0043, "step": 18912 }, { "epoch": 3.85, "learning_rate": 3.813868314624815e-05, "loss": 0.0065, "step": 18913 }, { "epoch": 3.85, "learning_rate": 3.812576887556153e-05, "loss": 0.006, "step": 18914 }, { "epoch": 3.85, "learning_rate": 3.811285647338566e-05, "loss": 0.0049, "step": 18915 }, { "epoch": 3.85, "learning_rate": 3.809994593993637e-05, "loss": 0.0006, "step": 18916 }, { "epoch": 3.85, "learning_rate": 3.808703727542917e-05, "loss": 0.0025, "step": 18917 }, { "epoch": 3.85, "learning_rate": 3.80741304800797e-05, "loss": 0.004, "step": 18918 }, { "epoch": 3.85, "learning_rate": 3.806122555410352e-05, "loss": 0.0128, "step": 18919 }, { "epoch": 3.85, "learning_rate": 3.804832249771612e-05, "loss": 0.0077, "step": 18920 }, { "epoch": 3.85, "learning_rate": 3.803542131113317e-05, "loss": 0.0016, "step": 18921 }, { "epoch": 3.85, "learning_rate": 3.8022521994569974e-05, "loss": 0.0027, "step": 18922 }, { "epoch": 3.85, "learning_rate": 3.800962454824202e-05, "loss": 0.0028, "step": 18923 }, { "epoch": 3.85, "learning_rate": 3.799672897236475e-05, "loss": 0.0087, "step": 18924 }, { "epoch": 3.85, "learning_rate": 3.798383526715354e-05, "loss": 0.0059, "step": 18925 }, { "epoch": 3.85, "learning_rate": 3.797094343282371e-05, "loss": 0.0095, "step": 18926 }, { "epoch": 3.85, "learning_rate": 3.795805346959059e-05, "loss": 0.0041, "step": 18927 }, { "epoch": 3.85, "learning_rate": 3.7945165377669475e-05, "loss": 0.0125, "step": 18928 }, { "epoch": 3.85, "learning_rate": 3.7932279157275626e-05, "loss": 0.0041, "step": 18929 }, { "epoch": 3.85, "learning_rate": 3.7919394808624284e-05, "loss": 0.0237, "step": 18930 }, { "epoch": 3.85, "learning_rate": 3.7906512331930555e-05, "loss": 0.0024, "step": 18931 }, { "epoch": 3.85, "learning_rate": 3.789363172740972e-05, "loss": 0.0065, "step": 18932 }, { "epoch": 3.86, "learning_rate": 3.7880752995276785e-05, "loss": 0.0041, "step": 18933 }, { "epoch": 3.86, "learning_rate": 3.786787613574699e-05, "loss": 0.0005, "step": 18934 }, { "epoch": 3.86, "learning_rate": 3.785500114903529e-05, "loss": 0.0039, "step": 18935 }, { "epoch": 3.86, "learning_rate": 3.784212803535675e-05, "loss": 0.0071, "step": 18936 }, { "epoch": 3.86, "learning_rate": 3.7829256794926394e-05, "loss": 0.0005, "step": 18937 }, { "epoch": 3.86, "learning_rate": 3.78163874279592e-05, "loss": 0.0082, "step": 18938 }, { "epoch": 3.86, "learning_rate": 3.780351993467007e-05, "loss": 0.0078, "step": 18939 }, { "epoch": 3.86, "learning_rate": 3.779065431527396e-05, "loss": 0.0013, "step": 18940 }, { "epoch": 3.86, "learning_rate": 3.7777790569985725e-05, "loss": 0.0102, "step": 18941 }, { "epoch": 3.86, "learning_rate": 3.776492869902023e-05, "loss": 0.0005, "step": 18942 }, { "epoch": 3.86, "learning_rate": 3.775206870259228e-05, "loss": 0.0144, "step": 18943 }, { "epoch": 3.86, "learning_rate": 3.773921058091667e-05, "loss": 0.0024, "step": 18944 }, { "epoch": 3.86, "learning_rate": 3.7726354334208185e-05, "loss": 0.0014, "step": 18945 }, { "epoch": 3.86, "learning_rate": 3.771349996268143e-05, "loss": 0.0037, "step": 18946 }, { "epoch": 3.86, "learning_rate": 3.770064746655128e-05, "loss": 0.0038, "step": 18947 }, { "epoch": 3.86, "learning_rate": 3.76877968460322e-05, "loss": 0.0071, "step": 18948 }, { "epoch": 3.86, "learning_rate": 3.767494810133896e-05, "loss": 0.0048, "step": 18949 }, { "epoch": 3.86, "learning_rate": 3.766210123268616e-05, "loss": 0.0056, "step": 18950 }, { "epoch": 3.86, "learning_rate": 3.764925624028823e-05, "loss": 0.0028, "step": 18951 }, { "epoch": 3.86, "learning_rate": 3.763641312435989e-05, "loss": 0.0013, "step": 18952 }, { "epoch": 3.86, "learning_rate": 3.7623571885115465e-05, "loss": 0.0075, "step": 18953 }, { "epoch": 3.86, "learning_rate": 3.761073252276961e-05, "loss": 0.0015, "step": 18954 }, { "epoch": 3.86, "learning_rate": 3.759789503753662e-05, "loss": 0.0023, "step": 18955 }, { "epoch": 3.86, "learning_rate": 3.7585059429630955e-05, "loss": 0.0022, "step": 18956 }, { "epoch": 3.86, "learning_rate": 3.7572225699266993e-05, "loss": 0.0012, "step": 18957 }, { "epoch": 3.86, "learning_rate": 3.7559393846659086e-05, "loss": 0.0017, "step": 18958 }, { "epoch": 3.86, "learning_rate": 3.7546563872021554e-05, "loss": 0.0032, "step": 18959 }, { "epoch": 3.86, "learning_rate": 3.753373577556867e-05, "loss": 0.0017, "step": 18960 }, { "epoch": 3.86, "learning_rate": 3.75209095575147e-05, "loss": 0.0072, "step": 18961 }, { "epoch": 3.86, "learning_rate": 3.7508085218073863e-05, "loss": 0.0034, "step": 18962 }, { "epoch": 3.86, "learning_rate": 3.749526275746039e-05, "loss": 0.0027, "step": 18963 }, { "epoch": 3.86, "learning_rate": 3.74824421758883e-05, "loss": 0.0029, "step": 18964 }, { "epoch": 3.86, "learning_rate": 3.7469623473571914e-05, "loss": 0.0022, "step": 18965 }, { "epoch": 3.86, "learning_rate": 3.745680665072513e-05, "loss": 0.0018, "step": 18966 }, { "epoch": 3.86, "learning_rate": 3.744399170756221e-05, "loss": 0.001, "step": 18967 }, { "epoch": 3.86, "learning_rate": 3.743117864429705e-05, "loss": 0.0021, "step": 18968 }, { "epoch": 3.86, "learning_rate": 3.741836746114371e-05, "loss": 0.0042, "step": 18969 }, { "epoch": 3.86, "learning_rate": 3.740555815831612e-05, "loss": 0.0002, "step": 18970 }, { "epoch": 3.86, "learning_rate": 3.7392750736028265e-05, "loss": 0.0029, "step": 18971 }, { "epoch": 3.86, "learning_rate": 3.7379945194494026e-05, "loss": 0.0023, "step": 18972 }, { "epoch": 3.86, "learning_rate": 3.736714153392729e-05, "loss": 0.0082, "step": 18973 }, { "epoch": 3.86, "learning_rate": 3.7354339754541905e-05, "loss": 0.0032, "step": 18974 }, { "epoch": 3.86, "learning_rate": 3.734153985655167e-05, "loss": 0.0053, "step": 18975 }, { "epoch": 3.86, "learning_rate": 3.732874184017038e-05, "loss": 0.0032, "step": 18976 }, { "epoch": 3.86, "learning_rate": 3.731594570561179e-05, "loss": 0.0066, "step": 18977 }, { "epoch": 3.86, "learning_rate": 3.7303151453089645e-05, "loss": 0.0054, "step": 18978 }, { "epoch": 3.86, "learning_rate": 3.7290359082817514e-05, "loss": 0.0019, "step": 18979 }, { "epoch": 3.86, "learning_rate": 3.727756859500919e-05, "loss": 0.0015, "step": 18980 }, { "epoch": 3.86, "learning_rate": 3.72647799898783e-05, "loss": 0.0072, "step": 18981 }, { "epoch": 3.87, "learning_rate": 3.7251993267638304e-05, "loss": 0.0008, "step": 18982 }, { "epoch": 3.87, "learning_rate": 3.7239208428502925e-05, "loss": 0.0077, "step": 18983 }, { "epoch": 3.87, "learning_rate": 3.722642547268552e-05, "loss": 0.0036, "step": 18984 }, { "epoch": 3.87, "learning_rate": 3.721364440039979e-05, "loss": 0.0023, "step": 18985 }, { "epoch": 3.87, "learning_rate": 3.7200865211859036e-05, "loss": 0.0057, "step": 18986 }, { "epoch": 3.87, "learning_rate": 3.718808790727676e-05, "loss": 0.0031, "step": 18987 }, { "epoch": 3.87, "learning_rate": 3.717531248686637e-05, "loss": 0.0005, "step": 18988 }, { "epoch": 3.87, "learning_rate": 3.716253895084124e-05, "loss": 0.0036, "step": 18989 }, { "epoch": 3.87, "learning_rate": 3.7149767299414686e-05, "loss": 0.0008, "step": 18990 }, { "epoch": 3.87, "learning_rate": 3.7136997532800053e-05, "loss": 0.0016, "step": 18991 }, { "epoch": 3.87, "learning_rate": 3.71242296512106e-05, "loss": 0.0036, "step": 18992 }, { "epoch": 3.87, "learning_rate": 3.711146365485959e-05, "loss": 0.0024, "step": 18993 }, { "epoch": 3.87, "learning_rate": 3.709869954396022e-05, "loss": 0.004, "step": 18994 }, { "epoch": 3.87, "learning_rate": 3.7085937318725675e-05, "loss": 0.008, "step": 18995 }, { "epoch": 3.87, "learning_rate": 3.707317697936917e-05, "loss": 0.0022, "step": 18996 }, { "epoch": 3.87, "learning_rate": 3.706041852610369e-05, "loss": 0.011, "step": 18997 }, { "epoch": 3.87, "learning_rate": 3.7047661959142495e-05, "loss": 0.0024, "step": 18998 }, { "epoch": 3.87, "learning_rate": 3.7034907278698464e-05, "loss": 0.0018, "step": 18999 }, { "epoch": 3.87, "learning_rate": 3.7022154484984815e-05, "loss": 0.0202, "step": 19000 }, { "epoch": 3.87, "learning_rate": 3.700940357821439e-05, "loss": 0.0033, "step": 19001 }, { "epoch": 3.87, "learning_rate": 3.699665455860018e-05, "loss": 0.0009, "step": 19002 }, { "epoch": 3.87, "learning_rate": 3.698390742635523e-05, "loss": 0.0067, "step": 19003 }, { "epoch": 3.87, "learning_rate": 3.697116218169232e-05, "loss": 0.0107, "step": 19004 }, { "epoch": 3.87, "learning_rate": 3.695841882482435e-05, "loss": 0.0015, "step": 19005 }, { "epoch": 3.87, "learning_rate": 3.694567735596418e-05, "loss": 0.0029, "step": 19006 }, { "epoch": 3.87, "learning_rate": 3.693293777532458e-05, "loss": 0.0033, "step": 19007 }, { "epoch": 3.87, "learning_rate": 3.692020008311837e-05, "loss": 0.0042, "step": 19008 }, { "epoch": 3.87, "learning_rate": 3.690746427955826e-05, "loss": 0.0004, "step": 19009 }, { "epoch": 3.87, "learning_rate": 3.689473036485698e-05, "loss": 0.0044, "step": 19010 }, { "epoch": 3.87, "learning_rate": 3.688199833922719e-05, "loss": 0.006, "step": 19011 }, { "epoch": 3.87, "learning_rate": 3.686926820288158e-05, "loss": 0.0052, "step": 19012 }, { "epoch": 3.87, "learning_rate": 3.685653995603273e-05, "loss": 0.0044, "step": 19013 }, { "epoch": 3.87, "learning_rate": 3.684381359889326e-05, "loss": 0.0096, "step": 19014 }, { "epoch": 3.87, "learning_rate": 3.683108913167563e-05, "loss": 0.0076, "step": 19015 }, { "epoch": 3.87, "learning_rate": 3.681836655459252e-05, "loss": 0.0018, "step": 19016 }, { "epoch": 3.87, "learning_rate": 3.680564586785625e-05, "loss": 0.0045, "step": 19017 }, { "epoch": 3.87, "learning_rate": 3.6792927071679443e-05, "loss": 0.0002, "step": 19018 }, { "epoch": 3.87, "learning_rate": 3.678021016627441e-05, "loss": 0.0024, "step": 19019 }, { "epoch": 3.87, "learning_rate": 3.6767495151853576e-05, "loss": 0.0057, "step": 19020 }, { "epoch": 3.87, "learning_rate": 3.675478202862933e-05, "loss": 0.0027, "step": 19021 }, { "epoch": 3.87, "learning_rate": 3.674207079681397e-05, "loss": 0.002, "step": 19022 }, { "epoch": 3.87, "learning_rate": 3.672936145661983e-05, "loss": 0.0034, "step": 19023 }, { "epoch": 3.87, "learning_rate": 3.6716654008259155e-05, "loss": 0.0045, "step": 19024 }, { "epoch": 3.87, "learning_rate": 3.670394845194422e-05, "loss": 0.0119, "step": 19025 }, { "epoch": 3.87, "learning_rate": 3.6691244787887183e-05, "loss": 0.003, "step": 19026 }, { "epoch": 3.87, "learning_rate": 3.667854301630025e-05, "loss": 0.002, "step": 19027 }, { "epoch": 3.87, "learning_rate": 3.6665843137395556e-05, "loss": 0.0062, "step": 19028 }, { "epoch": 3.87, "learning_rate": 3.665314515138527e-05, "loss": 0.0013, "step": 19029 }, { "epoch": 3.87, "learning_rate": 3.6640449058481326e-05, "loss": 0.0058, "step": 19030 }, { "epoch": 3.88, "learning_rate": 3.6627754858895945e-05, "loss": 0.0015, "step": 19031 }, { "epoch": 3.88, "learning_rate": 3.661506255284102e-05, "loss": 0.0031, "step": 19032 }, { "epoch": 3.88, "learning_rate": 3.660237214052855e-05, "loss": 0.0012, "step": 19033 }, { "epoch": 3.88, "learning_rate": 3.6589683622170596e-05, "loss": 0.0011, "step": 19034 }, { "epoch": 3.88, "learning_rate": 3.6576996997978916e-05, "loss": 0.0072, "step": 19035 }, { "epoch": 3.88, "learning_rate": 3.656431226816557e-05, "loss": 0.0029, "step": 19036 }, { "epoch": 3.88, "learning_rate": 3.6551629432942294e-05, "loss": 0.0038, "step": 19037 }, { "epoch": 3.88, "learning_rate": 3.653894849252095e-05, "loss": 0.0015, "step": 19038 }, { "epoch": 3.88, "learning_rate": 3.652626944711333e-05, "loss": 0.0004, "step": 19039 }, { "epoch": 3.88, "learning_rate": 3.651359229693123e-05, "loss": 0.008, "step": 19040 }, { "epoch": 3.88, "learning_rate": 3.650091704218634e-05, "loss": 0.0021, "step": 19041 }, { "epoch": 3.88, "learning_rate": 3.64882436830904e-05, "loss": 0.0025, "step": 19042 }, { "epoch": 3.88, "learning_rate": 3.647557221985504e-05, "loss": 0.0081, "step": 19043 }, { "epoch": 3.88, "learning_rate": 3.6462902652691935e-05, "loss": 0.0006, "step": 19044 }, { "epoch": 3.88, "learning_rate": 3.645023498181267e-05, "loss": 0.0089, "step": 19045 }, { "epoch": 3.88, "learning_rate": 3.64375692074288e-05, "loss": 0.0063, "step": 19046 }, { "epoch": 3.88, "learning_rate": 3.642490532975196e-05, "loss": 0.0079, "step": 19047 }, { "epoch": 3.88, "learning_rate": 3.6412243348993486e-05, "loss": 0.0032, "step": 19048 }, { "epoch": 3.88, "learning_rate": 3.639958326536505e-05, "loss": 0.0024, "step": 19049 }, { "epoch": 3.88, "learning_rate": 3.6386925079077916e-05, "loss": 0.0099, "step": 19050 }, { "epoch": 3.88, "learning_rate": 3.637426879034368e-05, "loss": 0.0063, "step": 19051 }, { "epoch": 3.88, "learning_rate": 3.636161439937361e-05, "loss": 0.0055, "step": 19052 }, { "epoch": 3.88, "learning_rate": 3.634896190637908e-05, "loss": 0.0021, "step": 19053 }, { "epoch": 3.88, "learning_rate": 3.63363113115714e-05, "loss": 0.0088, "step": 19054 }, { "epoch": 3.88, "learning_rate": 3.63236626151619e-05, "loss": 0.0057, "step": 19055 }, { "epoch": 3.88, "learning_rate": 3.63110158173618e-05, "loss": 0.0047, "step": 19056 }, { "epoch": 3.88, "learning_rate": 3.629837091838236e-05, "loss": 0.0073, "step": 19057 }, { "epoch": 3.88, "learning_rate": 3.6285727918434726e-05, "loss": 0.0042, "step": 19058 }, { "epoch": 3.88, "learning_rate": 3.6273086817730105e-05, "loss": 0.0102, "step": 19059 }, { "epoch": 3.88, "learning_rate": 3.626044761647965e-05, "loss": 0.009, "step": 19060 }, { "epoch": 3.88, "learning_rate": 3.624781031489433e-05, "loss": 0.002, "step": 19061 }, { "epoch": 3.88, "learning_rate": 3.623517491318534e-05, "loss": 0.0026, "step": 19062 }, { "epoch": 3.88, "learning_rate": 3.6222541411563666e-05, "loss": 0.007, "step": 19063 }, { "epoch": 3.88, "learning_rate": 3.620990981024035e-05, "loss": 0.008, "step": 19064 }, { "epoch": 3.88, "learning_rate": 3.619728010942634e-05, "loss": 0.0045, "step": 19065 }, { "epoch": 3.88, "learning_rate": 3.6184652309332503e-05, "loss": 0.0011, "step": 19066 }, { "epoch": 3.88, "learning_rate": 3.617202641016991e-05, "loss": 0.0133, "step": 19067 }, { "epoch": 3.88, "learning_rate": 3.615940241214924e-05, "loss": 0.0027, "step": 19068 }, { "epoch": 3.88, "learning_rate": 3.614678031548153e-05, "loss": 0.0015, "step": 19069 }, { "epoch": 3.88, "learning_rate": 3.6134160120377464e-05, "loss": 0.0044, "step": 19070 }, { "epoch": 3.88, "learning_rate": 3.612154182704785e-05, "loss": 0.0066, "step": 19071 }, { "epoch": 3.88, "learning_rate": 3.610892543570346e-05, "loss": 0.0039, "step": 19072 }, { "epoch": 3.88, "learning_rate": 3.6096310946555e-05, "loss": 0.0072, "step": 19073 }, { "epoch": 3.88, "learning_rate": 3.6083698359813134e-05, "loss": 0.0059, "step": 19074 }, { "epoch": 3.88, "learning_rate": 3.6071087675688555e-05, "loss": 0.002, "step": 19075 }, { "epoch": 3.88, "learning_rate": 3.605847889439187e-05, "loss": 0.0025, "step": 19076 }, { "epoch": 3.88, "learning_rate": 3.604587201613366e-05, "loss": 0.009, "step": 19077 }, { "epoch": 3.88, "learning_rate": 3.603326704112454e-05, "loss": 0.0008, "step": 19078 }, { "epoch": 3.88, "learning_rate": 3.6020663969574895e-05, "loss": 0.0016, "step": 19079 }, { "epoch": 3.89, "learning_rate": 3.600806280169541e-05, "loss": 0.0041, "step": 19080 }, { "epoch": 3.89, "learning_rate": 3.5995463537696356e-05, "loss": 0.0029, "step": 19081 }, { "epoch": 3.89, "learning_rate": 3.598286617778836e-05, "loss": 0.001, "step": 19082 }, { "epoch": 3.89, "learning_rate": 3.5970270722181654e-05, "loss": 0.0005, "step": 19083 }, { "epoch": 3.89, "learning_rate": 3.595767717108668e-05, "loss": 0.002, "step": 19084 }, { "epoch": 3.89, "learning_rate": 3.594508552471378e-05, "loss": 0.0017, "step": 19085 }, { "epoch": 3.89, "learning_rate": 3.59324957832732e-05, "loss": 0.0057, "step": 19086 }, { "epoch": 3.89, "learning_rate": 3.5919907946975334e-05, "loss": 0.0044, "step": 19087 }, { "epoch": 3.89, "learning_rate": 3.590732201603031e-05, "loss": 0.0018, "step": 19088 }, { "epoch": 3.89, "learning_rate": 3.5894737990648374e-05, "loss": 0.0051, "step": 19089 }, { "epoch": 3.89, "learning_rate": 3.5882155871039694e-05, "loss": 0.0017, "step": 19090 }, { "epoch": 3.89, "learning_rate": 3.586957565741444e-05, "loss": 0.0008, "step": 19091 }, { "epoch": 3.89, "learning_rate": 3.58569973499827e-05, "loss": 0.0087, "step": 19092 }, { "epoch": 3.89, "learning_rate": 3.5844420948954565e-05, "loss": 0.0012, "step": 19093 }, { "epoch": 3.89, "learning_rate": 3.583184645454008e-05, "loss": 0.003, "step": 19094 }, { "epoch": 3.89, "learning_rate": 3.581927386694928e-05, "loss": 0.0013, "step": 19095 }, { "epoch": 3.89, "learning_rate": 3.580670318639212e-05, "loss": 0.0115, "step": 19096 }, { "epoch": 3.89, "learning_rate": 3.579413441307858e-05, "loss": 0.0037, "step": 19097 }, { "epoch": 3.89, "learning_rate": 3.5781567547218615e-05, "loss": 0.0018, "step": 19098 }, { "epoch": 3.89, "learning_rate": 3.5769002589022e-05, "loss": 0.0046, "step": 19099 }, { "epoch": 3.89, "learning_rate": 3.575643953869875e-05, "loss": 0.0083, "step": 19100 }, { "epoch": 3.89, "learning_rate": 3.5743878396458516e-05, "loss": 0.0013, "step": 19101 }, { "epoch": 3.89, "learning_rate": 3.573131916251127e-05, "loss": 0.0044, "step": 19102 }, { "epoch": 3.89, "learning_rate": 3.5718761837066664e-05, "loss": 0.0015, "step": 19103 }, { "epoch": 3.89, "learning_rate": 3.5706206420334445e-05, "loss": 0.0018, "step": 19104 }, { "epoch": 3.89, "learning_rate": 3.569365291252431e-05, "loss": 0.001, "step": 19105 }, { "epoch": 3.89, "learning_rate": 3.5681101313845964e-05, "loss": 0.0005, "step": 19106 }, { "epoch": 3.89, "learning_rate": 3.566855162450901e-05, "loss": 0.0024, "step": 19107 }, { "epoch": 3.89, "learning_rate": 3.565600384472306e-05, "loss": 0.0069, "step": 19108 }, { "epoch": 3.89, "learning_rate": 3.5643457974697686e-05, "loss": 0.0052, "step": 19109 }, { "epoch": 3.89, "learning_rate": 3.5630914014642424e-05, "loss": 0.0051, "step": 19110 }, { "epoch": 3.89, "learning_rate": 3.5618371964766825e-05, "loss": 0.0019, "step": 19111 }, { "epoch": 3.89, "learning_rate": 3.560583182528025e-05, "loss": 0.0011, "step": 19112 }, { "epoch": 3.89, "learning_rate": 3.559329359639229e-05, "loss": 0.0028, "step": 19113 }, { "epoch": 3.89, "learning_rate": 3.55807572783122e-05, "loss": 0.0009, "step": 19114 }, { "epoch": 3.89, "learning_rate": 3.55682228712495e-05, "loss": 0.0123, "step": 19115 }, { "epoch": 3.89, "learning_rate": 3.5555690375413515e-05, "loss": 0.0086, "step": 19116 }, { "epoch": 3.89, "learning_rate": 3.554315979101345e-05, "loss": 0.0022, "step": 19117 }, { "epoch": 3.89, "learning_rate": 3.553063111825875e-05, "loss": 0.0136, "step": 19118 }, { "epoch": 3.89, "learning_rate": 3.5518104357358503e-05, "loss": 0.0044, "step": 19119 }, { "epoch": 3.89, "learning_rate": 3.55055795085221e-05, "loss": 0.0039, "step": 19120 }, { "epoch": 3.89, "learning_rate": 3.5493056571958605e-05, "loss": 0.0041, "step": 19121 }, { "epoch": 3.89, "learning_rate": 3.548053554787722e-05, "loss": 0.0184, "step": 19122 }, { "epoch": 3.89, "learning_rate": 3.5468016436487045e-05, "loss": 0.0036, "step": 19123 }, { "epoch": 3.89, "learning_rate": 3.54554992379972e-05, "loss": 0.0068, "step": 19124 }, { "epoch": 3.89, "learning_rate": 3.544298395261672e-05, "loss": 0.0089, "step": 19125 }, { "epoch": 3.89, "learning_rate": 3.5430470580554665e-05, "loss": 0.0081, "step": 19126 }, { "epoch": 3.89, "learning_rate": 3.541795912202001e-05, "loss": 0.003, "step": 19127 }, { "epoch": 3.89, "learning_rate": 3.540544957722173e-05, "loss": 0.0056, "step": 19128 }, { "epoch": 3.9, "learning_rate": 3.5392941946368794e-05, "loss": 0.0014, "step": 19129 }, { "epoch": 3.9, "learning_rate": 3.5380436229669985e-05, "loss": 0.0041, "step": 19130 }, { "epoch": 3.9, "learning_rate": 3.536793242733432e-05, "loss": 0.0009, "step": 19131 }, { "epoch": 3.9, "learning_rate": 3.5355430539570496e-05, "loss": 0.0014, "step": 19132 }, { "epoch": 3.9, "learning_rate": 3.5342930566587466e-05, "loss": 0.0006, "step": 19133 }, { "epoch": 3.9, "learning_rate": 3.533043250859389e-05, "loss": 0.003, "step": 19134 }, { "epoch": 3.9, "learning_rate": 3.531793636579855e-05, "loss": 0.0053, "step": 19135 }, { "epoch": 3.9, "learning_rate": 3.530544213841014e-05, "loss": 0.007, "step": 19136 }, { "epoch": 3.9, "learning_rate": 3.529294982663736e-05, "loss": 0.0143, "step": 19137 }, { "epoch": 3.9, "learning_rate": 3.5280459430688833e-05, "loss": 0.0033, "step": 19138 }, { "epoch": 3.9, "learning_rate": 3.526797095077319e-05, "loss": 0.0007, "step": 19139 }, { "epoch": 3.9, "learning_rate": 3.5255484387098994e-05, "loss": 0.0023, "step": 19140 }, { "epoch": 3.9, "learning_rate": 3.5242999739874814e-05, "loss": 0.0044, "step": 19141 }, { "epoch": 3.9, "learning_rate": 3.5230517009309144e-05, "loss": 0.0041, "step": 19142 }, { "epoch": 3.9, "learning_rate": 3.5218036195610495e-05, "loss": 0.003, "step": 19143 }, { "epoch": 3.9, "learning_rate": 3.520555729898734e-05, "loss": 0.0022, "step": 19144 }, { "epoch": 3.9, "learning_rate": 3.519308031964799e-05, "loss": 0.0087, "step": 19145 }, { "epoch": 3.9, "learning_rate": 3.518060525780095e-05, "loss": 0.0001, "step": 19146 }, { "epoch": 3.9, "learning_rate": 3.516813211365454e-05, "loss": 0.002, "step": 19147 }, { "epoch": 3.9, "learning_rate": 3.515566088741708e-05, "loss": 0.0026, "step": 19148 }, { "epoch": 3.9, "learning_rate": 3.514319157929692e-05, "loss": 0.0026, "step": 19149 }, { "epoch": 3.9, "learning_rate": 3.513072418950219e-05, "loss": 0.0119, "step": 19150 }, { "epoch": 3.9, "learning_rate": 3.511825871824126e-05, "loss": 0.0088, "step": 19151 }, { "epoch": 3.9, "learning_rate": 3.5105795165722245e-05, "loss": 0.0082, "step": 19152 }, { "epoch": 3.9, "learning_rate": 3.509333353215331e-05, "loss": 0.0015, "step": 19153 }, { "epoch": 3.9, "learning_rate": 3.508087381774261e-05, "loss": 0.0012, "step": 19154 }, { "epoch": 3.9, "learning_rate": 3.506841602269824e-05, "loss": 0.0042, "step": 19155 }, { "epoch": 3.9, "learning_rate": 3.505596014722829e-05, "loss": 0.0006, "step": 19156 }, { "epoch": 3.9, "learning_rate": 3.5043506191540754e-05, "loss": 0.005, "step": 19157 }, { "epoch": 3.9, "learning_rate": 3.5031054155843686e-05, "loss": 0.0009, "step": 19158 }, { "epoch": 3.9, "learning_rate": 3.5018604040345014e-05, "loss": 0.009, "step": 19159 }, { "epoch": 3.9, "learning_rate": 3.5006155845252695e-05, "loss": 0.0043, "step": 19160 }, { "epoch": 3.9, "learning_rate": 3.499370957077465e-05, "loss": 0.0033, "step": 19161 }, { "epoch": 3.9, "learning_rate": 3.4981265217118784e-05, "loss": 0.0001, "step": 19162 }, { "epoch": 3.9, "learning_rate": 3.4968822784492815e-05, "loss": 0.0053, "step": 19163 }, { "epoch": 3.9, "learning_rate": 3.495638227310474e-05, "loss": 0.0033, "step": 19164 }, { "epoch": 3.9, "learning_rate": 3.494394368316213e-05, "loss": 0.0053, "step": 19165 }, { "epoch": 3.9, "learning_rate": 3.493150701487296e-05, "loss": 0.0062, "step": 19166 }, { "epoch": 3.9, "learning_rate": 3.491907226844477e-05, "loss": 0.0092, "step": 19167 }, { "epoch": 3.9, "learning_rate": 3.4906639444085255e-05, "loss": 0.0101, "step": 19168 }, { "epoch": 3.9, "learning_rate": 3.489420854200221e-05, "loss": 0.0061, "step": 19169 }, { "epoch": 3.9, "learning_rate": 3.4881779562403075e-05, "loss": 0.0008, "step": 19170 }, { "epoch": 3.9, "learning_rate": 3.4869352505495606e-05, "loss": 0.0012, "step": 19171 }, { "epoch": 3.9, "learning_rate": 3.485692737148723e-05, "loss": 0.0034, "step": 19172 }, { "epoch": 3.9, "learning_rate": 3.484450416058551e-05, "loss": 0.0026, "step": 19173 }, { "epoch": 3.9, "learning_rate": 3.4832082872997955e-05, "loss": 0.0033, "step": 19174 }, { "epoch": 3.9, "learning_rate": 3.4819663508932e-05, "loss": 0.0008, "step": 19175 }, { "epoch": 3.9, "learning_rate": 3.480724606859509e-05, "loss": 0.0019, "step": 19176 }, { "epoch": 3.9, "learning_rate": 3.4794830552194605e-05, "loss": 0.0046, "step": 19177 }, { "epoch": 3.91, "learning_rate": 3.478241695993794e-05, "loss": 0.0033, "step": 19178 }, { "epoch": 3.91, "learning_rate": 3.477000529203238e-05, "loss": 0.0037, "step": 19179 }, { "epoch": 3.91, "learning_rate": 3.475759554868528e-05, "loss": 0.0074, "step": 19180 }, { "epoch": 3.91, "learning_rate": 3.474518773010378e-05, "loss": 0.0187, "step": 19181 }, { "epoch": 3.91, "learning_rate": 3.473278183649531e-05, "loss": 0.0015, "step": 19182 }, { "epoch": 3.91, "learning_rate": 3.4720377868066874e-05, "loss": 0.0009, "step": 19183 }, { "epoch": 3.91, "learning_rate": 3.4707975825025803e-05, "loss": 0.0012, "step": 19184 }, { "epoch": 3.91, "learning_rate": 3.469557570757913e-05, "loss": 0.0114, "step": 19185 }, { "epoch": 3.91, "learning_rate": 3.468317751593401e-05, "loss": 0.0024, "step": 19186 }, { "epoch": 3.91, "learning_rate": 3.467078125029748e-05, "loss": 0.0002, "step": 19187 }, { "epoch": 3.91, "learning_rate": 3.465838691087662e-05, "loss": 0.0055, "step": 19188 }, { "epoch": 3.91, "learning_rate": 3.464599449787841e-05, "loss": 0.0045, "step": 19189 }, { "epoch": 3.91, "learning_rate": 3.463360401150984e-05, "loss": 0.0006, "step": 19190 }, { "epoch": 3.91, "learning_rate": 3.4621215451977866e-05, "loss": 0.0058, "step": 19191 }, { "epoch": 3.91, "learning_rate": 3.460882881948938e-05, "loss": 0.0098, "step": 19192 }, { "epoch": 3.91, "learning_rate": 3.4596444114251267e-05, "loss": 0.0011, "step": 19193 }, { "epoch": 3.91, "learning_rate": 3.458406133647037e-05, "loss": 0.0005, "step": 19194 }, { "epoch": 3.91, "learning_rate": 3.457168048635356e-05, "loss": 0.0002, "step": 19195 }, { "epoch": 3.91, "learning_rate": 3.4559301564107486e-05, "loss": 0.0048, "step": 19196 }, { "epoch": 3.91, "learning_rate": 3.454692456993907e-05, "loss": 0.0143, "step": 19197 }, { "epoch": 3.91, "learning_rate": 3.453454950405486e-05, "loss": 0.0162, "step": 19198 }, { "epoch": 3.91, "learning_rate": 3.452217636666168e-05, "loss": 0.002, "step": 19199 }, { "epoch": 3.91, "learning_rate": 3.450980515796617e-05, "loss": 0.0067, "step": 19200 }, { "epoch": 3.91, "learning_rate": 3.449743587817483e-05, "loss": 0.0014, "step": 19201 }, { "epoch": 3.91, "learning_rate": 3.448506852749442e-05, "loss": 0.0015, "step": 19202 }, { "epoch": 3.91, "learning_rate": 3.447270310613138e-05, "loss": 0.0023, "step": 19203 }, { "epoch": 3.91, "learning_rate": 3.446033961429227e-05, "loss": 0.0004, "step": 19204 }, { "epoch": 3.91, "learning_rate": 3.444797805218359e-05, "loss": 0.0051, "step": 19205 }, { "epoch": 3.91, "learning_rate": 3.44356184200118e-05, "loss": 0.0028, "step": 19206 }, { "epoch": 3.91, "learning_rate": 3.442326071798331e-05, "loss": 0.0052, "step": 19207 }, { "epoch": 3.91, "learning_rate": 3.441090494630455e-05, "loss": 0.0056, "step": 19208 }, { "epoch": 3.91, "learning_rate": 3.4398551105181847e-05, "loss": 0.0017, "step": 19209 }, { "epoch": 3.91, "learning_rate": 3.4386199194821566e-05, "loss": 0.0088, "step": 19210 }, { "epoch": 3.91, "learning_rate": 3.437384921542999e-05, "loss": 0.0012, "step": 19211 }, { "epoch": 3.91, "learning_rate": 3.436150116721339e-05, "loss": 0.0002, "step": 19212 }, { "epoch": 3.91, "learning_rate": 3.434915505037806e-05, "loss": 0.0011, "step": 19213 }, { "epoch": 3.91, "learning_rate": 3.433681086513006e-05, "loss": 0.0048, "step": 19214 }, { "epoch": 3.91, "learning_rate": 3.432446861167572e-05, "loss": 0.0011, "step": 19215 }, { "epoch": 3.91, "learning_rate": 3.431212829022102e-05, "loss": 0.0053, "step": 19216 }, { "epoch": 3.91, "learning_rate": 3.429978990097226e-05, "loss": 0.0109, "step": 19217 }, { "epoch": 3.91, "learning_rate": 3.4287453444135354e-05, "loss": 0.009, "step": 19218 }, { "epoch": 3.91, "learning_rate": 3.42751189199164e-05, "loss": 0.0043, "step": 19219 }, { "epoch": 3.91, "learning_rate": 3.42627863285214e-05, "loss": 0.0077, "step": 19220 }, { "epoch": 3.91, "learning_rate": 3.42504556701563e-05, "loss": 0.0016, "step": 19221 }, { "epoch": 3.91, "learning_rate": 3.423812694502717e-05, "loss": 0.0076, "step": 19222 }, { "epoch": 3.91, "learning_rate": 3.422580015333979e-05, "loss": 0.0061, "step": 19223 }, { "epoch": 3.91, "learning_rate": 3.421347529530008e-05, "loss": 0.0002, "step": 19224 }, { "epoch": 3.91, "learning_rate": 3.420115237111391e-05, "loss": 0.0032, "step": 19225 }, { "epoch": 3.91, "learning_rate": 3.418883138098712e-05, "loss": 0.0041, "step": 19226 }, { "epoch": 3.91, "learning_rate": 3.4176512325125364e-05, "loss": 0.0066, "step": 19227 }, { "epoch": 3.92, "learning_rate": 3.4164195203734565e-05, "loss": 0.001, "step": 19228 }, { "epoch": 3.92, "learning_rate": 3.415188001702029e-05, "loss": 0.0026, "step": 19229 }, { "epoch": 3.92, "learning_rate": 3.413956676518832e-05, "loss": 0.0022, "step": 19230 }, { "epoch": 3.92, "learning_rate": 3.4127255448444346e-05, "loss": 0.0016, "step": 19231 }, { "epoch": 3.92, "learning_rate": 3.411494606699386e-05, "loss": 0.0148, "step": 19232 }, { "epoch": 3.92, "learning_rate": 3.410263862104258e-05, "loss": 0.0064, "step": 19233 }, { "epoch": 3.92, "learning_rate": 3.409033311079594e-05, "loss": 0.0026, "step": 19234 }, { "epoch": 3.92, "learning_rate": 3.4078029536459604e-05, "loss": 0.0041, "step": 19235 }, { "epoch": 3.92, "learning_rate": 3.406572789823896e-05, "loss": 0.0035, "step": 19236 }, { "epoch": 3.92, "learning_rate": 3.40534281963395e-05, "loss": 0.0041, "step": 19237 }, { "epoch": 3.92, "learning_rate": 3.404113043096665e-05, "loss": 0.003, "step": 19238 }, { "epoch": 3.92, "learning_rate": 3.4028834602325815e-05, "loss": 0.002, "step": 19239 }, { "epoch": 3.92, "learning_rate": 3.401654071062235e-05, "loss": 0.0021, "step": 19240 }, { "epoch": 3.92, "learning_rate": 3.400424875606159e-05, "loss": 0.0035, "step": 19241 }, { "epoch": 3.92, "learning_rate": 3.3991958738848836e-05, "loss": 0.0059, "step": 19242 }, { "epoch": 3.92, "learning_rate": 3.3979670659189345e-05, "loss": 0.0008, "step": 19243 }, { "epoch": 3.92, "learning_rate": 3.396738451728836e-05, "loss": 0.0041, "step": 19244 }, { "epoch": 3.92, "learning_rate": 3.395510031335108e-05, "loss": 0.0071, "step": 19245 }, { "epoch": 3.92, "learning_rate": 3.3942818047582725e-05, "loss": 0.0004, "step": 19246 }, { "epoch": 3.92, "learning_rate": 3.39305377201883e-05, "loss": 0.002, "step": 19247 }, { "epoch": 3.92, "learning_rate": 3.3918259331373056e-05, "loss": 0.0084, "step": 19248 }, { "epoch": 3.92, "learning_rate": 3.390598288134194e-05, "loss": 0.0024, "step": 19249 }, { "epoch": 3.92, "learning_rate": 3.3893708370300117e-05, "loss": 0.0024, "step": 19250 }, { "epoch": 3.92, "learning_rate": 3.38814357984525e-05, "loss": 0.017, "step": 19251 }, { "epoch": 3.92, "learning_rate": 3.3869165166004046e-05, "loss": 0.0043, "step": 19252 }, { "epoch": 3.92, "learning_rate": 3.385689647315984e-05, "loss": 0.0006, "step": 19253 }, { "epoch": 3.92, "learning_rate": 3.3844629720124654e-05, "loss": 0.0001, "step": 19254 }, { "epoch": 3.92, "learning_rate": 3.38323649071034e-05, "loss": 0.0054, "step": 19255 }, { "epoch": 3.92, "learning_rate": 3.382010203430094e-05, "loss": 0.0009, "step": 19256 }, { "epoch": 3.92, "learning_rate": 3.3807841101922096e-05, "loss": 0.0045, "step": 19257 }, { "epoch": 3.92, "learning_rate": 3.3795582110171606e-05, "loss": 0.0059, "step": 19258 }, { "epoch": 3.92, "learning_rate": 3.378332505925427e-05, "loss": 0.0022, "step": 19259 }, { "epoch": 3.92, "learning_rate": 3.3771069949374776e-05, "loss": 0.0038, "step": 19260 }, { "epoch": 3.92, "learning_rate": 3.375881678073779e-05, "loss": 0.0013, "step": 19261 }, { "epoch": 3.92, "learning_rate": 3.374656555354801e-05, "loss": 0.0052, "step": 19262 }, { "epoch": 3.92, "learning_rate": 3.373431626801002e-05, "loss": 0.0091, "step": 19263 }, { "epoch": 3.92, "learning_rate": 3.372206892432846e-05, "loss": 0.0036, "step": 19264 }, { "epoch": 3.92, "learning_rate": 3.370982352270775e-05, "loss": 0.0053, "step": 19265 }, { "epoch": 3.92, "learning_rate": 3.369758006335258e-05, "loss": 0.0043, "step": 19266 }, { "epoch": 3.92, "learning_rate": 3.3685338546467275e-05, "loss": 0.0045, "step": 19267 }, { "epoch": 3.92, "learning_rate": 3.367309897225648e-05, "loss": 0.0038, "step": 19268 }, { "epoch": 3.92, "learning_rate": 3.3660861340924454e-05, "loss": 0.0022, "step": 19269 }, { "epoch": 3.92, "learning_rate": 3.364862565267566e-05, "loss": 0.0015, "step": 19270 }, { "epoch": 3.92, "learning_rate": 3.3636391907714426e-05, "loss": 0.001, "step": 19271 }, { "epoch": 3.92, "learning_rate": 3.362416010624513e-05, "loss": 0.0049, "step": 19272 }, { "epoch": 3.92, "learning_rate": 3.361193024847202e-05, "loss": 0.0003, "step": 19273 }, { "epoch": 3.92, "learning_rate": 3.359970233459937e-05, "loss": 0.006, "step": 19274 }, { "epoch": 3.92, "learning_rate": 3.3587476364831406e-05, "loss": 0.0059, "step": 19275 }, { "epoch": 3.92, "learning_rate": 3.357525233937234e-05, "loss": 0.0075, "step": 19276 }, { "epoch": 3.93, "learning_rate": 3.356303025842636e-05, "loss": 0.0057, "step": 19277 }, { "epoch": 3.93, "learning_rate": 3.355081012219749e-05, "loss": 0.0034, "step": 19278 }, { "epoch": 3.93, "learning_rate": 3.353859193088999e-05, "loss": 0.0043, "step": 19279 }, { "epoch": 3.93, "learning_rate": 3.3526375684707766e-05, "loss": 0.0032, "step": 19280 }, { "epoch": 3.93, "learning_rate": 3.3514161383854994e-05, "loss": 0.0126, "step": 19281 }, { "epoch": 3.93, "learning_rate": 3.350194902853557e-05, "loss": 0.0048, "step": 19282 }, { "epoch": 3.93, "learning_rate": 3.3489738618953466e-05, "loss": 0.005, "step": 19283 }, { "epoch": 3.93, "learning_rate": 3.3477530155312735e-05, "loss": 0.0024, "step": 19284 }, { "epoch": 3.93, "learning_rate": 3.346532363781714e-05, "loss": 0.0023, "step": 19285 }, { "epoch": 3.93, "learning_rate": 3.3453119066670667e-05, "loss": 0.0002, "step": 19286 }, { "epoch": 3.93, "learning_rate": 3.3440916442077084e-05, "loss": 0.0019, "step": 19287 }, { "epoch": 3.93, "learning_rate": 3.342871576424021e-05, "loss": 0.0049, "step": 19288 }, { "epoch": 3.93, "learning_rate": 3.341651703336383e-05, "loss": 0.0025, "step": 19289 }, { "epoch": 3.93, "learning_rate": 3.3404320249651675e-05, "loss": 0.0011, "step": 19290 }, { "epoch": 3.93, "learning_rate": 3.339212541330745e-05, "loss": 0.0086, "step": 19291 }, { "epoch": 3.93, "learning_rate": 3.3379932524534866e-05, "loss": 0.0029, "step": 19292 }, { "epoch": 3.93, "learning_rate": 3.3367741583537526e-05, "loss": 0.012, "step": 19293 }, { "epoch": 3.93, "learning_rate": 3.335555259051908e-05, "loss": 0.02, "step": 19294 }, { "epoch": 3.93, "learning_rate": 3.334336554568308e-05, "loss": 0.0043, "step": 19295 }, { "epoch": 3.93, "learning_rate": 3.333118044923309e-05, "loss": 0.008, "step": 19296 }, { "epoch": 3.93, "learning_rate": 3.331899730137263e-05, "loss": 0.0015, "step": 19297 }, { "epoch": 3.93, "learning_rate": 3.33068161023051e-05, "loss": 0.0006, "step": 19298 }, { "epoch": 3.93, "learning_rate": 3.3294636852234105e-05, "loss": 0.0024, "step": 19299 }, { "epoch": 3.93, "learning_rate": 3.328245955136287e-05, "loss": 0.0053, "step": 19300 }, { "epoch": 3.93, "learning_rate": 3.327028419989498e-05, "loss": 0.0022, "step": 19301 }, { "epoch": 3.93, "learning_rate": 3.325811079803363e-05, "loss": 0.0077, "step": 19302 }, { "epoch": 3.93, "learning_rate": 3.3245939345982215e-05, "loss": 0.0016, "step": 19303 }, { "epoch": 3.93, "learning_rate": 3.323376984394398e-05, "loss": 0.0068, "step": 19304 }, { "epoch": 3.93, "learning_rate": 3.3221602292122215e-05, "loss": 0.005, "step": 19305 }, { "epoch": 3.93, "learning_rate": 3.320943669072013e-05, "loss": 0.0046, "step": 19306 }, { "epoch": 3.93, "learning_rate": 3.319727303994091e-05, "loss": 0.0013, "step": 19307 }, { "epoch": 3.93, "learning_rate": 3.31851113399877e-05, "loss": 0.002, "step": 19308 }, { "epoch": 3.93, "learning_rate": 3.317295159106364e-05, "loss": 0.0088, "step": 19309 }, { "epoch": 3.93, "learning_rate": 3.316079379337184e-05, "loss": 0.0029, "step": 19310 }, { "epoch": 3.93, "learning_rate": 3.314863794711528e-05, "loss": 0.005, "step": 19311 }, { "epoch": 3.93, "learning_rate": 3.313648405249707e-05, "loss": 0.0002, "step": 19312 }, { "epoch": 3.93, "learning_rate": 3.312433210972017e-05, "loss": 0.0002, "step": 19313 }, { "epoch": 3.93, "learning_rate": 3.311218211898754e-05, "loss": 0.0045, "step": 19314 }, { "epoch": 3.93, "learning_rate": 3.310003408050214e-05, "loss": 0.0072, "step": 19315 }, { "epoch": 3.93, "learning_rate": 3.3087887994466773e-05, "loss": 0.0018, "step": 19316 }, { "epoch": 3.93, "learning_rate": 3.307574386108443e-05, "loss": 0.0033, "step": 19317 }, { "epoch": 3.93, "learning_rate": 3.30636016805578e-05, "loss": 0.0009, "step": 19318 }, { "epoch": 3.93, "learning_rate": 3.3051461453089836e-05, "loss": 0.0013, "step": 19319 }, { "epoch": 3.93, "learning_rate": 3.3039323178883184e-05, "loss": 0.024, "step": 19320 }, { "epoch": 3.93, "learning_rate": 3.3027186858140615e-05, "loss": 0.004, "step": 19321 }, { "epoch": 3.93, "learning_rate": 3.301505249106482e-05, "loss": 0.0019, "step": 19322 }, { "epoch": 3.93, "learning_rate": 3.300292007785847e-05, "loss": 0.0075, "step": 19323 }, { "epoch": 3.93, "learning_rate": 3.2990789618724214e-05, "loss": 0.0025, "step": 19324 }, { "epoch": 3.93, "learning_rate": 3.2978661113864637e-05, "loss": 0.0011, "step": 19325 }, { "epoch": 3.94, "learning_rate": 3.2966534563482315e-05, "loss": 0.0041, "step": 19326 }, { "epoch": 3.94, "learning_rate": 3.295440996777978e-05, "loss": 0.0086, "step": 19327 }, { "epoch": 3.94, "learning_rate": 3.294228732695957e-05, "loss": 0.0018, "step": 19328 }, { "epoch": 3.94, "learning_rate": 3.293016664122405e-05, "loss": 0.0046, "step": 19329 }, { "epoch": 3.94, "learning_rate": 3.2918047910775816e-05, "loss": 0.0004, "step": 19330 }, { "epoch": 3.94, "learning_rate": 3.29059311358171e-05, "loss": 0.0022, "step": 19331 }, { "epoch": 3.94, "learning_rate": 3.289381631655047e-05, "loss": 0.0003, "step": 19332 }, { "epoch": 3.94, "learning_rate": 3.2881703453178106e-05, "loss": 0.0027, "step": 19333 }, { "epoch": 3.94, "learning_rate": 3.286959254590236e-05, "loss": 0.0039, "step": 19334 }, { "epoch": 3.94, "learning_rate": 3.2857483594925525e-05, "loss": 0.0021, "step": 19335 }, { "epoch": 3.94, "learning_rate": 3.28453766004498e-05, "loss": 0.0056, "step": 19336 }, { "epoch": 3.94, "learning_rate": 3.283327156267751e-05, "loss": 0.0036, "step": 19337 }, { "epoch": 3.94, "learning_rate": 3.282116848181071e-05, "loss": 0.0007, "step": 19338 }, { "epoch": 3.94, "learning_rate": 3.2809067358051574e-05, "loss": 0.0059, "step": 19339 }, { "epoch": 3.94, "learning_rate": 3.2796968191602245e-05, "loss": 0.0103, "step": 19340 }, { "epoch": 3.94, "learning_rate": 3.2784870982664785e-05, "loss": 0.0046, "step": 19341 }, { "epoch": 3.94, "learning_rate": 3.277277573144123e-05, "loss": 0.0114, "step": 19342 }, { "epoch": 3.94, "learning_rate": 3.276068243813361e-05, "loss": 0.0022, "step": 19343 }, { "epoch": 3.94, "learning_rate": 3.274859110294388e-05, "loss": 0.0006, "step": 19344 }, { "epoch": 3.94, "learning_rate": 3.273650172607403e-05, "loss": 0.001, "step": 19345 }, { "epoch": 3.94, "learning_rate": 3.2724414307725944e-05, "loss": 0.0066, "step": 19346 }, { "epoch": 3.94, "learning_rate": 3.27123288481015e-05, "loss": 0.0044, "step": 19347 }, { "epoch": 3.94, "learning_rate": 3.270024534740262e-05, "loss": 0.0053, "step": 19348 }, { "epoch": 3.94, "learning_rate": 3.268816380583096e-05, "loss": 0.0005, "step": 19349 }, { "epoch": 3.94, "learning_rate": 3.267608422358851e-05, "loss": 0.001, "step": 19350 }, { "epoch": 3.94, "learning_rate": 3.266400660087685e-05, "loss": 0.0052, "step": 19351 }, { "epoch": 3.94, "learning_rate": 3.265193093789779e-05, "loss": 0.0002, "step": 19352 }, { "epoch": 3.94, "learning_rate": 3.2639857234853e-05, "loss": 0.0041, "step": 19353 }, { "epoch": 3.94, "learning_rate": 3.26277854919441e-05, "loss": 0.0106, "step": 19354 }, { "epoch": 3.94, "learning_rate": 3.2615715709372754e-05, "loss": 0.0072, "step": 19355 }, { "epoch": 3.94, "learning_rate": 3.260364788734053e-05, "loss": 0.0034, "step": 19356 }, { "epoch": 3.94, "learning_rate": 3.2591582026048986e-05, "loss": 0.0037, "step": 19357 }, { "epoch": 3.94, "learning_rate": 3.257951812569966e-05, "loss": 0.0004, "step": 19358 }, { "epoch": 3.94, "learning_rate": 3.256745618649402e-05, "loss": 0.0024, "step": 19359 }, { "epoch": 3.94, "learning_rate": 3.2555396208633525e-05, "loss": 0.0095, "step": 19360 }, { "epoch": 3.94, "learning_rate": 3.2543338192319645e-05, "loss": 0.0096, "step": 19361 }, { "epoch": 3.94, "learning_rate": 3.253128213775366e-05, "loss": 0.0075, "step": 19362 }, { "epoch": 3.94, "learning_rate": 3.251922804513708e-05, "loss": 0.005, "step": 19363 }, { "epoch": 3.94, "learning_rate": 3.2507175914671074e-05, "loss": 0.0061, "step": 19364 }, { "epoch": 3.94, "learning_rate": 3.249512574655705e-05, "loss": 0.003, "step": 19365 }, { "epoch": 3.94, "learning_rate": 3.248307754099626e-05, "loss": 0.0009, "step": 19366 }, { "epoch": 3.94, "learning_rate": 3.247103129818985e-05, "loss": 0.0008, "step": 19367 }, { "epoch": 3.94, "learning_rate": 3.245898701833913e-05, "loss": 0.0025, "step": 19368 }, { "epoch": 3.94, "learning_rate": 3.2446944701645125e-05, "loss": 0.0003, "step": 19369 }, { "epoch": 3.94, "learning_rate": 3.2434904348309124e-05, "loss": 0.0056, "step": 19370 }, { "epoch": 3.94, "learning_rate": 3.2422865958532104e-05, "loss": 0.0024, "step": 19371 }, { "epoch": 3.94, "learning_rate": 3.241082953251515e-05, "loss": 0.0051, "step": 19372 }, { "epoch": 3.94, "learning_rate": 3.2398795070459316e-05, "loss": 0.0032, "step": 19373 }, { "epoch": 3.94, "learning_rate": 3.23867625725656e-05, "loss": 0.002, "step": 19374 }, { "epoch": 3.95, "learning_rate": 3.237473203903496e-05, "loss": 0.0083, "step": 19375 }, { "epoch": 3.95, "learning_rate": 3.236270347006832e-05, "loss": 0.0029, "step": 19376 }, { "epoch": 3.95, "learning_rate": 3.2350676865866585e-05, "loss": 0.0028, "step": 19377 }, { "epoch": 3.95, "learning_rate": 3.233865222663064e-05, "loss": 0.0017, "step": 19378 }, { "epoch": 3.95, "learning_rate": 3.232662955256132e-05, "loss": 0.0047, "step": 19379 }, { "epoch": 3.95, "learning_rate": 3.231460884385936e-05, "loss": 0.0003, "step": 19380 }, { "epoch": 3.95, "learning_rate": 3.230259010072563e-05, "loss": 0.0033, "step": 19381 }, { "epoch": 3.95, "learning_rate": 3.2290573323360755e-05, "loss": 0.0022, "step": 19382 }, { "epoch": 3.95, "learning_rate": 3.227855851196557e-05, "loss": 0.0045, "step": 19383 }, { "epoch": 3.95, "learning_rate": 3.226654566674064e-05, "loss": 0.0024, "step": 19384 }, { "epoch": 3.95, "learning_rate": 3.225453478788663e-05, "loss": 0.0004, "step": 19385 }, { "epoch": 3.95, "learning_rate": 3.224252587560415e-05, "loss": 0.0037, "step": 19386 }, { "epoch": 3.95, "learning_rate": 3.2230518930093776e-05, "loss": 0.0042, "step": 19387 }, { "epoch": 3.95, "learning_rate": 3.221851395155603e-05, "loss": 0.0096, "step": 19388 }, { "epoch": 3.95, "learning_rate": 3.2206510940191445e-05, "loss": 0.0044, "step": 19389 }, { "epoch": 3.95, "learning_rate": 3.2194509896200455e-05, "loss": 0.0053, "step": 19390 }, { "epoch": 3.95, "learning_rate": 3.218251081978354e-05, "loss": 0.0003, "step": 19391 }, { "epoch": 3.95, "learning_rate": 3.2170513711141095e-05, "loss": 0.003, "step": 19392 }, { "epoch": 3.95, "learning_rate": 3.215851857047349e-05, "loss": 0.0002, "step": 19393 }, { "epoch": 3.95, "learning_rate": 3.214652539798108e-05, "loss": 0.0026, "step": 19394 }, { "epoch": 3.95, "learning_rate": 3.213453419386411e-05, "loss": 0.0021, "step": 19395 }, { "epoch": 3.95, "learning_rate": 3.2122544958322936e-05, "loss": 0.0017, "step": 19396 }, { "epoch": 3.95, "learning_rate": 3.211055769155776e-05, "loss": 0.0035, "step": 19397 }, { "epoch": 3.95, "learning_rate": 3.2098572393768813e-05, "loss": 0.0187, "step": 19398 }, { "epoch": 3.95, "learning_rate": 3.2086589065156304e-05, "loss": 0.0013, "step": 19399 }, { "epoch": 3.95, "learning_rate": 3.207460770592026e-05, "loss": 0.001, "step": 19400 }, { "epoch": 3.95, "learning_rate": 3.206262831626093e-05, "loss": 0.0002, "step": 19401 }, { "epoch": 3.95, "learning_rate": 3.205065089637829e-05, "loss": 0.0015, "step": 19402 }, { "epoch": 3.95, "learning_rate": 3.203867544647244e-05, "loss": 0.0085, "step": 19403 }, { "epoch": 3.95, "learning_rate": 3.2026701966743374e-05, "loss": 0.0001, "step": 19404 }, { "epoch": 3.95, "learning_rate": 3.201473045739107e-05, "loss": 0.0092, "step": 19405 }, { "epoch": 3.95, "learning_rate": 3.200276091861548e-05, "loss": 0.0058, "step": 19406 }, { "epoch": 3.95, "learning_rate": 3.199079335061652e-05, "loss": 0.0031, "step": 19407 }, { "epoch": 3.95, "learning_rate": 3.197882775359408e-05, "loss": 0.0002, "step": 19408 }, { "epoch": 3.95, "learning_rate": 3.1966864127747987e-05, "loss": 0.0008, "step": 19409 }, { "epoch": 3.95, "learning_rate": 3.1954902473278074e-05, "loss": 0.0093, "step": 19410 }, { "epoch": 3.95, "learning_rate": 3.19429427903841e-05, "loss": 0.0049, "step": 19411 }, { "epoch": 3.95, "learning_rate": 3.193098507926589e-05, "loss": 0.0001, "step": 19412 }, { "epoch": 3.95, "learning_rate": 3.191902934012301e-05, "loss": 0.0026, "step": 19413 }, { "epoch": 3.95, "learning_rate": 3.190707557315531e-05, "loss": 0.0104, "step": 19414 }, { "epoch": 3.95, "learning_rate": 3.189512377856228e-05, "loss": 0.0011, "step": 19415 }, { "epoch": 3.95, "learning_rate": 3.188317395654371e-05, "loss": 0.0019, "step": 19416 }, { "epoch": 3.95, "learning_rate": 3.1871226107299056e-05, "loss": 0.0015, "step": 19417 }, { "epoch": 3.95, "learning_rate": 3.185928023102788e-05, "loss": 0.0011, "step": 19418 }, { "epoch": 3.95, "learning_rate": 3.184733632792979e-05, "loss": 0.0125, "step": 19419 }, { "epoch": 3.95, "learning_rate": 3.1835394398204134e-05, "loss": 0.0018, "step": 19420 }, { "epoch": 3.95, "learning_rate": 3.1823454442050536e-05, "loss": 0.0009, "step": 19421 }, { "epoch": 3.95, "learning_rate": 3.1811516459668276e-05, "loss": 0.0067, "step": 19422 }, { "epoch": 3.95, "learning_rate": 3.1799580451256794e-05, "loss": 0.0037, "step": 19423 }, { "epoch": 3.96, "learning_rate": 3.178764641701544e-05, "loss": 0.0023, "step": 19424 }, { "epoch": 3.96, "learning_rate": 3.1775714357143514e-05, "loss": 0.0079, "step": 19425 }, { "epoch": 3.96, "learning_rate": 3.1763784271840336e-05, "loss": 0.002, "step": 19426 }, { "epoch": 3.96, "learning_rate": 3.175185616130514e-05, "loss": 0.0013, "step": 19427 }, { "epoch": 3.96, "learning_rate": 3.1739930025737163e-05, "loss": 0.0024, "step": 19428 }, { "epoch": 3.96, "learning_rate": 3.1728005865335587e-05, "loss": 0.0094, "step": 19429 }, { "epoch": 3.96, "learning_rate": 3.17160836802996e-05, "loss": 0.0006, "step": 19430 }, { "epoch": 3.96, "learning_rate": 3.170416347082822e-05, "loss": 0.002, "step": 19431 }, { "epoch": 3.96, "learning_rate": 3.16922452371207e-05, "loss": 0.0061, "step": 19432 }, { "epoch": 3.96, "learning_rate": 3.1680328979375895e-05, "loss": 0.0098, "step": 19433 }, { "epoch": 3.96, "learning_rate": 3.166841469779305e-05, "loss": 0.0023, "step": 19434 }, { "epoch": 3.96, "learning_rate": 3.1656502392570975e-05, "loss": 0.0011, "step": 19435 }, { "epoch": 3.96, "learning_rate": 3.164459206390872e-05, "loss": 0.0039, "step": 19436 }, { "epoch": 3.96, "learning_rate": 3.163268371200519e-05, "loss": 0.0018, "step": 19437 }, { "epoch": 3.96, "learning_rate": 3.162077733705928e-05, "loss": 0.0054, "step": 19438 }, { "epoch": 3.96, "learning_rate": 3.160887293926983e-05, "loss": 0.0003, "step": 19439 }, { "epoch": 3.96, "learning_rate": 3.159697051883569e-05, "loss": 0.0016, "step": 19440 }, { "epoch": 3.96, "learning_rate": 3.1585070075955635e-05, "loss": 0.0058, "step": 19441 }, { "epoch": 3.96, "learning_rate": 3.157317161082845e-05, "loss": 0.0003, "step": 19442 }, { "epoch": 3.96, "learning_rate": 3.1561275123652835e-05, "loss": 0.0162, "step": 19443 }, { "epoch": 3.96, "learning_rate": 3.1549380614627495e-05, "loss": 0.0014, "step": 19444 }, { "epoch": 3.96, "learning_rate": 3.153748808395114e-05, "loss": 0.0012, "step": 19445 }, { "epoch": 3.96, "learning_rate": 3.152559753182226e-05, "loss": 0.0022, "step": 19446 }, { "epoch": 3.96, "learning_rate": 3.151370895843962e-05, "loss": 0.003, "step": 19447 }, { "epoch": 3.96, "learning_rate": 3.150182236400161e-05, "loss": 0.0012, "step": 19448 }, { "epoch": 3.96, "learning_rate": 3.148993774870689e-05, "loss": 0.0105, "step": 19449 }, { "epoch": 3.96, "learning_rate": 3.147805511275396e-05, "loss": 0.0038, "step": 19450 }, { "epoch": 3.96, "learning_rate": 3.1466174456341144e-05, "loss": 0.0003, "step": 19451 }, { "epoch": 3.96, "learning_rate": 3.145429577966706e-05, "loss": 0.0038, "step": 19452 }, { "epoch": 3.96, "learning_rate": 3.1442419082929954e-05, "loss": 0.0011, "step": 19453 }, { "epoch": 3.96, "learning_rate": 3.143054436632825e-05, "loss": 0.0095, "step": 19454 }, { "epoch": 3.96, "learning_rate": 3.141867163006027e-05, "loss": 0.0027, "step": 19455 }, { "epoch": 3.96, "learning_rate": 3.1406800874324314e-05, "loss": 0.001, "step": 19456 }, { "epoch": 3.96, "learning_rate": 3.1394932099318646e-05, "loss": 0.0058, "step": 19457 }, { "epoch": 3.96, "learning_rate": 3.1383065305241474e-05, "loss": 0.0033, "step": 19458 }, { "epoch": 3.96, "learning_rate": 3.137120049229103e-05, "loss": 0.0065, "step": 19459 }, { "epoch": 3.96, "learning_rate": 3.1359337660665476e-05, "loss": 0.0013, "step": 19460 }, { "epoch": 3.96, "learning_rate": 3.134747681056292e-05, "loss": 0.0058, "step": 19461 }, { "epoch": 3.96, "learning_rate": 3.1335617942181485e-05, "loss": 0.0075, "step": 19462 }, { "epoch": 3.96, "learning_rate": 3.132376105571926e-05, "loss": 0.0045, "step": 19463 }, { "epoch": 3.96, "learning_rate": 3.1311906151374156e-05, "loss": 0.028, "step": 19464 }, { "epoch": 3.96, "learning_rate": 3.130005322934435e-05, "loss": 0.0022, "step": 19465 }, { "epoch": 3.96, "learning_rate": 3.1288202289827626e-05, "loss": 0.0065, "step": 19466 }, { "epoch": 3.96, "learning_rate": 3.12763533330221e-05, "loss": 0.0035, "step": 19467 }, { "epoch": 3.96, "learning_rate": 3.1264506359125525e-05, "loss": 0.0031, "step": 19468 }, { "epoch": 3.96, "learning_rate": 3.125266136833583e-05, "loss": 0.0015, "step": 19469 }, { "epoch": 3.96, "learning_rate": 3.124081836085084e-05, "loss": 0.0074, "step": 19470 }, { "epoch": 3.96, "learning_rate": 3.122897733686833e-05, "loss": 0.0039, "step": 19471 }, { "epoch": 3.96, "learning_rate": 3.1217138296586154e-05, "loss": 0.0036, "step": 19472 }, { "epoch": 3.97, "learning_rate": 3.1205301240201956e-05, "loss": 0.0018, "step": 19473 }, { "epoch": 3.97, "learning_rate": 3.1193466167913466e-05, "loss": 0.0027, "step": 19474 }, { "epoch": 3.97, "learning_rate": 3.1181633079918375e-05, "loss": 0.0043, "step": 19475 }, { "epoch": 3.97, "learning_rate": 3.116980197641431e-05, "loss": 0.0031, "step": 19476 }, { "epoch": 3.97, "learning_rate": 3.115797285759879e-05, "loss": 0.0001, "step": 19477 }, { "epoch": 3.97, "learning_rate": 3.11461457236695e-05, "loss": 0.0008, "step": 19478 }, { "epoch": 3.97, "learning_rate": 3.113432057482391e-05, "loss": 0.0016, "step": 19479 }, { "epoch": 3.97, "learning_rate": 3.112249741125956e-05, "loss": 0.0019, "step": 19480 }, { "epoch": 3.97, "learning_rate": 3.111067623317394e-05, "loss": 0.0024, "step": 19481 }, { "epoch": 3.97, "learning_rate": 3.1098857040764366e-05, "loss": 0.0021, "step": 19482 }, { "epoch": 3.97, "learning_rate": 3.1087039834228386e-05, "loss": 0.0108, "step": 19483 }, { "epoch": 3.97, "learning_rate": 3.107522461376323e-05, "loss": 0.0014, "step": 19484 }, { "epoch": 3.97, "learning_rate": 3.10634113795664e-05, "loss": 0.0046, "step": 19485 }, { "epoch": 3.97, "learning_rate": 3.105160013183506e-05, "loss": 0.0421, "step": 19486 }, { "epoch": 3.97, "learning_rate": 3.1039790870766526e-05, "loss": 0.0009, "step": 19487 }, { "epoch": 3.97, "learning_rate": 3.1027983596558056e-05, "loss": 0.0033, "step": 19488 }, { "epoch": 3.97, "learning_rate": 3.101617830940683e-05, "loss": 0.0063, "step": 19489 }, { "epoch": 3.97, "learning_rate": 3.100437500951e-05, "loss": 0.0005, "step": 19490 }, { "epoch": 3.97, "learning_rate": 3.0992573697064746e-05, "loss": 0.0028, "step": 19491 }, { "epoch": 3.97, "learning_rate": 3.098077437226816e-05, "loss": 0.0028, "step": 19492 }, { "epoch": 3.97, "learning_rate": 3.096897703531729e-05, "loss": 0.0024, "step": 19493 }, { "epoch": 3.97, "learning_rate": 3.09571816864092e-05, "loss": 0.0088, "step": 19494 }, { "epoch": 3.97, "learning_rate": 3.094538832574088e-05, "loss": 0.0014, "step": 19495 }, { "epoch": 3.97, "learning_rate": 3.093359695350937e-05, "loss": 0.0005, "step": 19496 }, { "epoch": 3.97, "learning_rate": 3.092180756991144e-05, "loss": 0.0081, "step": 19497 }, { "epoch": 3.97, "learning_rate": 3.0910020175144176e-05, "loss": 0.0029, "step": 19498 }, { "epoch": 3.97, "learning_rate": 3.0898234769404344e-05, "loss": 0.0022, "step": 19499 }, { "epoch": 3.97, "learning_rate": 3.0886451352888816e-05, "loss": 0.0049, "step": 19500 }, { "epoch": 3.97, "learning_rate": 3.0874669925794393e-05, "loss": 0.0049, "step": 19501 }, { "epoch": 3.97, "learning_rate": 3.086289048831779e-05, "loss": 0.0046, "step": 19502 }, { "epoch": 3.97, "learning_rate": 3.08511130406559e-05, "loss": 0.0045, "step": 19503 }, { "epoch": 3.97, "learning_rate": 3.083933758300529e-05, "loss": 0.0163, "step": 19504 }, { "epoch": 3.97, "learning_rate": 3.082756411556266e-05, "loss": 0.0117, "step": 19505 }, { "epoch": 3.97, "learning_rate": 3.081579263852468e-05, "loss": 0.0006, "step": 19506 }, { "epoch": 3.97, "learning_rate": 3.0804023152087925e-05, "loss": 0.0001, "step": 19507 }, { "epoch": 3.97, "learning_rate": 3.079225565644899e-05, "loss": 0.0046, "step": 19508 }, { "epoch": 3.97, "learning_rate": 3.078049015180442e-05, "loss": 0.0068, "step": 19509 }, { "epoch": 3.97, "learning_rate": 3.076872663835068e-05, "loss": 0.0004, "step": 19510 }, { "epoch": 3.97, "learning_rate": 3.075696511628429e-05, "loss": 0.001, "step": 19511 }, { "epoch": 3.97, "learning_rate": 3.0745205585801656e-05, "loss": 0.0017, "step": 19512 }, { "epoch": 3.97, "learning_rate": 3.073344804709922e-05, "loss": 0.0004, "step": 19513 }, { "epoch": 3.97, "learning_rate": 3.072169250037335e-05, "loss": 0.0004, "step": 19514 }, { "epoch": 3.97, "learning_rate": 3.07099389458203e-05, "loss": 0.0027, "step": 19515 }, { "epoch": 3.97, "learning_rate": 3.0698187383636524e-05, "loss": 0.0067, "step": 19516 }, { "epoch": 3.97, "learning_rate": 3.068643781401813e-05, "loss": 0.0016, "step": 19517 }, { "epoch": 3.97, "learning_rate": 3.067469023716154e-05, "loss": 0.0089, "step": 19518 }, { "epoch": 3.97, "learning_rate": 3.066294465326281e-05, "loss": 0.0054, "step": 19519 }, { "epoch": 3.97, "learning_rate": 3.065120106251818e-05, "loss": 0.0009, "step": 19520 }, { "epoch": 3.97, "learning_rate": 3.063945946512376e-05, "loss": 0.0006, "step": 19521 }, { "epoch": 3.98, "learning_rate": 3.062771986127569e-05, "loss": 0.0018, "step": 19522 }, { "epoch": 3.98, "learning_rate": 3.061598225117004e-05, "loss": 0.0011, "step": 19523 }, { "epoch": 3.98, "learning_rate": 3.060424663500282e-05, "loss": 0.0035, "step": 19524 }, { "epoch": 3.98, "learning_rate": 3.059251301297006e-05, "loss": 0.0052, "step": 19525 }, { "epoch": 3.98, "learning_rate": 3.058078138526775e-05, "loss": 0.044, "step": 19526 }, { "epoch": 3.98, "learning_rate": 3.0569051752091834e-05, "loss": 0.0045, "step": 19527 }, { "epoch": 3.98, "learning_rate": 3.055732411363812e-05, "loss": 0.0003, "step": 19528 }, { "epoch": 3.98, "learning_rate": 3.0545598470102624e-05, "loss": 0.0049, "step": 19529 }, { "epoch": 3.98, "learning_rate": 3.0533874821681046e-05, "loss": 0.0031, "step": 19530 }, { "epoch": 3.98, "learning_rate": 3.052215316856932e-05, "loss": 0.0017, "step": 19531 }, { "epoch": 3.98, "learning_rate": 3.0510433510963195e-05, "loss": 0.0147, "step": 19532 }, { "epoch": 3.98, "learning_rate": 3.0498715849058302e-05, "loss": 0.009, "step": 19533 }, { "epoch": 3.98, "learning_rate": 3.0487000183050526e-05, "loss": 0.0034, "step": 19534 }, { "epoch": 3.98, "learning_rate": 3.047528651313534e-05, "loss": 0.0079, "step": 19535 }, { "epoch": 3.98, "learning_rate": 3.0463574839508587e-05, "loss": 0.0058, "step": 19536 }, { "epoch": 3.98, "learning_rate": 3.045186516236573e-05, "loss": 0.0064, "step": 19537 }, { "epoch": 3.98, "learning_rate": 3.0440157481902376e-05, "loss": 0.0047, "step": 19538 }, { "epoch": 3.98, "learning_rate": 3.042845179831409e-05, "loss": 0.0134, "step": 19539 }, { "epoch": 3.98, "learning_rate": 3.0416748111796363e-05, "loss": 0.0105, "step": 19540 }, { "epoch": 3.98, "learning_rate": 3.040504642254467e-05, "loss": 0.0075, "step": 19541 }, { "epoch": 3.98, "learning_rate": 3.0393346730754458e-05, "loss": 0.0117, "step": 19542 }, { "epoch": 3.98, "learning_rate": 3.038164903662112e-05, "loss": 0.0017, "step": 19543 }, { "epoch": 3.98, "learning_rate": 3.0369953340340048e-05, "loss": 0.0041, "step": 19544 }, { "epoch": 3.98, "learning_rate": 3.0358259642106568e-05, "loss": 0.008, "step": 19545 }, { "epoch": 3.98, "learning_rate": 3.0346567942115995e-05, "loss": 0.0023, "step": 19546 }, { "epoch": 3.98, "learning_rate": 3.033487824056364e-05, "loss": 0.0019, "step": 19547 }, { "epoch": 3.98, "learning_rate": 3.032319053764462e-05, "loss": 0.0032, "step": 19548 }, { "epoch": 3.98, "learning_rate": 3.0311504833554305e-05, "loss": 0.0009, "step": 19549 }, { "epoch": 3.98, "learning_rate": 3.029982112848774e-05, "loss": 0.0051, "step": 19550 }, { "epoch": 3.98, "learning_rate": 3.028813942264013e-05, "loss": 0.0024, "step": 19551 }, { "epoch": 3.98, "learning_rate": 3.0276459716206535e-05, "loss": 0.0085, "step": 19552 }, { "epoch": 3.98, "learning_rate": 3.026478200938209e-05, "loss": 0.0058, "step": 19553 }, { "epoch": 3.98, "learning_rate": 3.025310630236178e-05, "loss": 0.0036, "step": 19554 }, { "epoch": 3.98, "learning_rate": 3.0241432595340636e-05, "loss": 0.0032, "step": 19555 }, { "epoch": 3.98, "learning_rate": 3.022976088851364e-05, "loss": 0.0003, "step": 19556 }, { "epoch": 3.98, "learning_rate": 3.021809118207569e-05, "loss": 0.0015, "step": 19557 }, { "epoch": 3.98, "learning_rate": 3.0206423476221746e-05, "loss": 0.0036, "step": 19558 }, { "epoch": 3.98, "learning_rate": 3.019475777114666e-05, "loss": 0.0179, "step": 19559 }, { "epoch": 3.98, "learning_rate": 3.0183094067045293e-05, "loss": 0.0038, "step": 19560 }, { "epoch": 3.98, "learning_rate": 3.0171432364112357e-05, "loss": 0.0033, "step": 19561 }, { "epoch": 3.98, "learning_rate": 3.015977266254273e-05, "loss": 0.0022, "step": 19562 }, { "epoch": 3.98, "learning_rate": 3.0148114962531106e-05, "loss": 0.0032, "step": 19563 }, { "epoch": 3.98, "learning_rate": 3.0136459264272213e-05, "loss": 0.0038, "step": 19564 }, { "epoch": 3.98, "learning_rate": 3.012480556796074e-05, "loss": 0.0013, "step": 19565 }, { "epoch": 3.98, "learning_rate": 3.0113153873791206e-05, "loss": 0.0041, "step": 19566 }, { "epoch": 3.98, "learning_rate": 3.0101504181958402e-05, "loss": 0.0019, "step": 19567 }, { "epoch": 3.98, "learning_rate": 3.008985649265672e-05, "loss": 0.0062, "step": 19568 }, { "epoch": 3.98, "learning_rate": 3.0078210806080842e-05, "loss": 0.0058, "step": 19569 }, { "epoch": 3.98, "learning_rate": 3.0066567122425196e-05, "loss": 0.0028, "step": 19570 }, { "epoch": 3.99, "learning_rate": 3.0054925441884252e-05, "loss": 0.0035, "step": 19571 }, { "epoch": 3.99, "learning_rate": 3.004328576465248e-05, "loss": 0.0051, "step": 19572 }, { "epoch": 3.99, "learning_rate": 3.0031648090924254e-05, "loss": 0.012, "step": 19573 }, { "epoch": 3.99, "learning_rate": 3.0020012420893968e-05, "loss": 0.0042, "step": 19574 }, { "epoch": 3.99, "learning_rate": 3.0008378754755967e-05, "loss": 0.0007, "step": 19575 }, { "epoch": 3.99, "learning_rate": 2.9996747092704516e-05, "loss": 0.003, "step": 19576 }, { "epoch": 3.99, "learning_rate": 2.9985117434933937e-05, "loss": 0.0036, "step": 19577 }, { "epoch": 3.99, "learning_rate": 2.997348978163846e-05, "loss": 0.0043, "step": 19578 }, { "epoch": 3.99, "learning_rate": 2.99618641330122e-05, "loss": 0.0017, "step": 19579 }, { "epoch": 3.99, "learning_rate": 2.995024048924948e-05, "loss": 0.0031, "step": 19580 }, { "epoch": 3.99, "learning_rate": 2.993861885054426e-05, "loss": 0.0065, "step": 19581 }, { "epoch": 3.99, "learning_rate": 2.9926999217090825e-05, "loss": 0.0047, "step": 19582 }, { "epoch": 3.99, "learning_rate": 2.9915381589083113e-05, "loss": 0.0047, "step": 19583 }, { "epoch": 3.99, "learning_rate": 2.9903765966715176e-05, "loss": 0.0014, "step": 19584 }, { "epoch": 3.99, "learning_rate": 2.989215235018112e-05, "loss": 0.0015, "step": 19585 }, { "epoch": 3.99, "learning_rate": 2.9880540739674742e-05, "loss": 0.0011, "step": 19586 }, { "epoch": 3.99, "learning_rate": 2.9868931135390183e-05, "loss": 0.0103, "step": 19587 }, { "epoch": 3.99, "learning_rate": 2.9857323537521178e-05, "loss": 0.0017, "step": 19588 }, { "epoch": 3.99, "learning_rate": 2.9845717946261665e-05, "loss": 0.0209, "step": 19589 }, { "epoch": 3.99, "learning_rate": 2.9834114361805463e-05, "loss": 0.0023, "step": 19590 }, { "epoch": 3.99, "learning_rate": 2.9822512784346374e-05, "loss": 0.002, "step": 19591 }, { "epoch": 3.99, "learning_rate": 2.9810913214078187e-05, "loss": 0.0099, "step": 19592 }, { "epoch": 3.99, "learning_rate": 2.9799315651194622e-05, "loss": 0.0034, "step": 19593 }, { "epoch": 3.99, "learning_rate": 2.978772009588938e-05, "loss": 0.004, "step": 19594 }, { "epoch": 3.99, "learning_rate": 2.9776126548356115e-05, "loss": 0.0015, "step": 19595 }, { "epoch": 3.99, "learning_rate": 2.9764535008788497e-05, "loss": 0.0004, "step": 19596 }, { "epoch": 3.99, "learning_rate": 2.9752945477380086e-05, "loss": 0.0051, "step": 19597 }, { "epoch": 3.99, "learning_rate": 2.974135795432451e-05, "loss": 0.0012, "step": 19598 }, { "epoch": 3.99, "learning_rate": 2.972977243981519e-05, "loss": 0.0031, "step": 19599 }, { "epoch": 3.99, "learning_rate": 2.9718188934045765e-05, "loss": 0.0011, "step": 19600 }, { "epoch": 3.99, "learning_rate": 2.9706607437209612e-05, "loss": 0.0081, "step": 19601 }, { "epoch": 3.99, "learning_rate": 2.9695027949500173e-05, "loss": 0.001, "step": 19602 }, { "epoch": 3.99, "learning_rate": 2.968345047111086e-05, "loss": 0.0022, "step": 19603 }, { "epoch": 3.99, "learning_rate": 2.9671875002235033e-05, "loss": 0.0007, "step": 19604 }, { "epoch": 3.99, "learning_rate": 2.9660301543066027e-05, "loss": 0.0076, "step": 19605 }, { "epoch": 3.99, "learning_rate": 2.964873009379715e-05, "loss": 0.0033, "step": 19606 }, { "epoch": 3.99, "learning_rate": 2.963716065462165e-05, "loss": 0.0019, "step": 19607 }, { "epoch": 3.99, "learning_rate": 2.9625593225732787e-05, "loss": 0.0017, "step": 19608 }, { "epoch": 3.99, "learning_rate": 2.961402780732372e-05, "loss": 0.0068, "step": 19609 }, { "epoch": 3.99, "learning_rate": 2.960246439958765e-05, "loss": 0.013, "step": 19610 }, { "epoch": 3.99, "learning_rate": 2.959090300271772e-05, "loss": 0.0063, "step": 19611 }, { "epoch": 3.99, "learning_rate": 2.957934361690691e-05, "loss": 0.0029, "step": 19612 }, { "epoch": 3.99, "learning_rate": 2.9567786242348462e-05, "loss": 0.0016, "step": 19613 }, { "epoch": 3.99, "learning_rate": 2.9556230879235245e-05, "loss": 0.0033, "step": 19614 }, { "epoch": 3.99, "learning_rate": 2.9544677527760346e-05, "loss": 0.0043, "step": 19615 }, { "epoch": 3.99, "learning_rate": 2.953312618811677e-05, "loss": 0.0045, "step": 19616 }, { "epoch": 3.99, "learning_rate": 2.9521576860497288e-05, "loss": 0.0035, "step": 19617 }, { "epoch": 3.99, "learning_rate": 2.951002954509498e-05, "loss": 0.0003, "step": 19618 }, { "epoch": 3.99, "learning_rate": 2.9498484242102533e-05, "loss": 0.0129, "step": 19619 }, { "epoch": 4.0, "learning_rate": 2.948694095171295e-05, "loss": 0.0067, "step": 19620 }, { "epoch": 4.0, "learning_rate": 2.9475399674118882e-05, "loss": 0.0123, "step": 19621 }, { "epoch": 4.0, "learning_rate": 2.9463860409513157e-05, "loss": 0.0037, "step": 19622 }, { "epoch": 4.0, "learning_rate": 2.9452323158088487e-05, "loss": 0.0005, "step": 19623 }, { "epoch": 4.0, "learning_rate": 2.9440787920037584e-05, "loss": 0.0091, "step": 19624 }, { "epoch": 4.0, "learning_rate": 2.942925469555308e-05, "loss": 0.0016, "step": 19625 }, { "epoch": 4.0, "learning_rate": 2.9417723484827616e-05, "loss": 0.0024, "step": 19626 }, { "epoch": 4.0, "learning_rate": 2.940619428805379e-05, "loss": 0.0008, "step": 19627 }, { "epoch": 4.0, "learning_rate": 2.939466710542415e-05, "loss": 0.0043, "step": 19628 }, { "epoch": 4.0, "learning_rate": 2.9383141937131278e-05, "loss": 0.0079, "step": 19629 }, { "epoch": 4.0, "learning_rate": 2.937161878336753e-05, "loss": 0.0046, "step": 19630 }, { "epoch": 4.0, "learning_rate": 2.9360097644325537e-05, "loss": 0.0153, "step": 19631 }, { "epoch": 4.0, "learning_rate": 2.9348578520197548e-05, "loss": 0.0072, "step": 19632 }, { "epoch": 4.0, "learning_rate": 2.9337061411176122e-05, "loss": 0.0039, "step": 19633 }, { "epoch": 4.0, "learning_rate": 2.9325546317453507e-05, "loss": 0.0031, "step": 19634 }, { "epoch": 4.0, "learning_rate": 2.931403323922205e-05, "loss": 0.008, "step": 19635 }, { "epoch": 4.0, "learning_rate": 2.9302522176674047e-05, "loss": 0.002, "step": 19636 }, { "epoch": 4.0, "learning_rate": 2.929101313000173e-05, "loss": 0.0025, "step": 19637 }, { "epoch": 4.0, "learning_rate": 2.9279506099397422e-05, "loss": 0.0004, "step": 19638 }, { "epoch": 4.0, "learning_rate": 2.9268001085053188e-05, "loss": 0.0002, "step": 19639 }, { "epoch": 4.0, "learning_rate": 2.9256498087161247e-05, "loss": 0.0027, "step": 19640 }, { "epoch": 4.0, "learning_rate": 2.9244997105913705e-05, "loss": 0.0014, "step": 19641 }, { "epoch": 4.0, "learning_rate": 2.9233498141502643e-05, "loss": 0.0002, "step": 19642 }, { "epoch": 4.0, "learning_rate": 2.9222001194120143e-05, "loss": 0.0026, "step": 19643 }, { "epoch": 4.0, "learning_rate": 2.9210506263958184e-05, "loss": 0.0017, "step": 19644 }, { "epoch": 4.0, "learning_rate": 2.9199013351208793e-05, "loss": 0.0056, "step": 19645 }, { "epoch": 4.0, "learning_rate": 2.9187522456063906e-05, "loss": 0.0016, "step": 19646 }, { "epoch": 4.0, "learning_rate": 2.917603357871548e-05, "loss": 0.0006, "step": 19647 }, { "epoch": 4.0, "learning_rate": 2.916454671935528e-05, "loss": 0.0002, "step": 19648 }, { "epoch": 4.0, "learning_rate": 2.9153061878175337e-05, "loss": 0.0025, "step": 19649 }, { "epoch": 4.0, "learning_rate": 2.9141579055367283e-05, "loss": 0.0015, "step": 19650 }, { "epoch": 4.0, "learning_rate": 2.9130098251123075e-05, "loss": 0.0005, "step": 19651 }, { "epoch": 4.0, "learning_rate": 2.9118619465634348e-05, "loss": 0.0015, "step": 19652 }, { "epoch": 4.0, "learning_rate": 2.9107142699092862e-05, "loss": 0.0011, "step": 19653 }, { "epoch": 4.0, "learning_rate": 2.909566795169028e-05, "loss": 0.0016, "step": 19654 }, { "epoch": 4.0, "learning_rate": 2.908419522361829e-05, "loss": 0.0033, "step": 19655 }, { "epoch": 4.0, "learning_rate": 2.9072724515068463e-05, "loss": 0.0028, "step": 19656 }, { "epoch": 4.0, "learning_rate": 2.9061255826232416e-05, "loss": 0.0011, "step": 19657 }, { "epoch": 4.0, "learning_rate": 2.904978915730168e-05, "loss": 0.0003, "step": 19658 }, { "epoch": 4.0, "learning_rate": 2.9038324508467764e-05, "loss": 0.0005, "step": 19659 }, { "epoch": 4.0, "learning_rate": 2.902686187992217e-05, "loss": 0.0006, "step": 19660 }, { "epoch": 4.0, "learning_rate": 2.9015401271856325e-05, "loss": 0.0005, "step": 19661 }, { "epoch": 4.0, "learning_rate": 2.900394268446171e-05, "loss": 0.003, "step": 19662 }, { "epoch": 4.0, "learning_rate": 2.8992486117929557e-05, "loss": 0.0014, "step": 19663 }, { "epoch": 4.0, "learning_rate": 2.8981031572451395e-05, "loss": 0.0021, "step": 19664 }, { "epoch": 4.0, "learning_rate": 2.8969579048218354e-05, "loss": 0.0006, "step": 19665 }, { "epoch": 4.0, "learning_rate": 2.8958128545421882e-05, "loss": 0.0011, "step": 19666 }, { "epoch": 4.0, "learning_rate": 2.8946680064253125e-05, "loss": 0.0018, "step": 19667 }, { "epoch": 4.0, "learning_rate": 2.8935233604903264e-05, "loss": 0.0022, "step": 19668 }, { "epoch": 4.0, "learning_rate": 2.8923789167563594e-05, "loss": 0.0065, "step": 19669 }, { "epoch": 4.01, "learning_rate": 2.891234675242513e-05, "loss": 0.0058, "step": 19670 }, { "epoch": 4.01, "learning_rate": 2.890090635967912e-05, "loss": 0.0001, "step": 19671 }, { "epoch": 4.01, "learning_rate": 2.8889467989516528e-05, "loss": 0.002, "step": 19672 }, { "epoch": 4.01, "learning_rate": 2.887803164212842e-05, "loss": 0.0008, "step": 19673 }, { "epoch": 4.01, "learning_rate": 2.8866597317705837e-05, "loss": 0.0016, "step": 19674 }, { "epoch": 4.01, "learning_rate": 2.8855165016439712e-05, "loss": 0.0029, "step": 19675 }, { "epoch": 4.01, "learning_rate": 2.884373473852103e-05, "loss": 0.0024, "step": 19676 }, { "epoch": 4.01, "learning_rate": 2.8832306484140666e-05, "loss": 0.009, "step": 19677 }, { "epoch": 4.01, "learning_rate": 2.8820880253489503e-05, "loss": 0.0007, "step": 19678 }, { "epoch": 4.01, "learning_rate": 2.8809456046758372e-05, "loss": 0.0003, "step": 19679 }, { "epoch": 4.01, "learning_rate": 2.879803386413814e-05, "loss": 0.0026, "step": 19680 }, { "epoch": 4.01, "learning_rate": 2.8786613705819445e-05, "loss": 0.0012, "step": 19681 }, { "epoch": 4.01, "learning_rate": 2.8775195571993192e-05, "loss": 0.0009, "step": 19682 }, { "epoch": 4.01, "learning_rate": 2.8763779462849912e-05, "loss": 0.0019, "step": 19683 }, { "epoch": 4.01, "learning_rate": 2.875236537858045e-05, "loss": 0.0028, "step": 19684 }, { "epoch": 4.01, "learning_rate": 2.874095331937532e-05, "loss": 0.0039, "step": 19685 }, { "epoch": 4.01, "learning_rate": 2.872954328542517e-05, "loss": 0.0026, "step": 19686 }, { "epoch": 4.01, "learning_rate": 2.871813527692055e-05, "loss": 0.0005, "step": 19687 }, { "epoch": 4.01, "learning_rate": 2.8706729294052004e-05, "loss": 0.0027, "step": 19688 }, { "epoch": 4.01, "learning_rate": 2.8695325337010033e-05, "loss": 0.0011, "step": 19689 }, { "epoch": 4.01, "learning_rate": 2.8683923405985115e-05, "loss": 0.0011, "step": 19690 }, { "epoch": 4.01, "learning_rate": 2.8672523501167684e-05, "loss": 0.0015, "step": 19691 }, { "epoch": 4.01, "learning_rate": 2.8661125622748117e-05, "loss": 0.0024, "step": 19692 }, { "epoch": 4.01, "learning_rate": 2.8649729770916812e-05, "loss": 0.0024, "step": 19693 }, { "epoch": 4.01, "learning_rate": 2.8638335945864073e-05, "loss": 0.0004, "step": 19694 }, { "epoch": 4.01, "learning_rate": 2.8626944147780255e-05, "loss": 0.0012, "step": 19695 }, { "epoch": 4.01, "learning_rate": 2.8615554376855497e-05, "loss": 0.0001, "step": 19696 }, { "epoch": 4.01, "learning_rate": 2.8604166633280144e-05, "loss": 0.0038, "step": 19697 }, { "epoch": 4.01, "learning_rate": 2.8592780917244396e-05, "loss": 0.0041, "step": 19698 }, { "epoch": 4.01, "learning_rate": 2.8581397228938314e-05, "loss": 0.0003, "step": 19699 }, { "epoch": 4.01, "learning_rate": 2.8570015568552164e-05, "loss": 0.0017, "step": 19700 }, { "epoch": 4.01, "learning_rate": 2.8558635936275892e-05, "loss": 0.0013, "step": 19701 }, { "epoch": 4.01, "learning_rate": 2.8547258332299718e-05, "loss": 0.0031, "step": 19702 }, { "epoch": 4.01, "learning_rate": 2.8535882756813533e-05, "loss": 0.0004, "step": 19703 }, { "epoch": 4.01, "learning_rate": 2.852450921000741e-05, "loss": 0.0063, "step": 19704 }, { "epoch": 4.01, "learning_rate": 2.851313769207127e-05, "loss": 0.0005, "step": 19705 }, { "epoch": 4.01, "learning_rate": 2.8501768203195053e-05, "loss": 0.0014, "step": 19706 }, { "epoch": 4.01, "learning_rate": 2.8490400743568653e-05, "loss": 0.0034, "step": 19707 }, { "epoch": 4.01, "learning_rate": 2.847903531338192e-05, "loss": 0.0036, "step": 19708 }, { "epoch": 4.01, "learning_rate": 2.8467671912824703e-05, "loss": 0.0047, "step": 19709 }, { "epoch": 4.01, "learning_rate": 2.8456310542086763e-05, "loss": 0.0008, "step": 19710 }, { "epoch": 4.01, "learning_rate": 2.844495120135785e-05, "loss": 0.0018, "step": 19711 }, { "epoch": 4.01, "learning_rate": 2.843359389082773e-05, "loss": 0.0002, "step": 19712 }, { "epoch": 4.01, "learning_rate": 2.8422238610686087e-05, "loss": 0.0009, "step": 19713 }, { "epoch": 4.01, "learning_rate": 2.8410885361122483e-05, "loss": 0.0013, "step": 19714 }, { "epoch": 4.01, "learning_rate": 2.839953414232668e-05, "loss": 0.0006, "step": 19715 }, { "epoch": 4.01, "learning_rate": 2.838818495448813e-05, "loss": 0.0013, "step": 19716 }, { "epoch": 4.01, "learning_rate": 2.8376837797796515e-05, "loss": 0.0024, "step": 19717 }, { "epoch": 4.01, "learning_rate": 2.8365492672441265e-05, "loss": 0.0002, "step": 19718 }, { "epoch": 4.02, "learning_rate": 2.8354149578611863e-05, "loss": 0.0014, "step": 19719 }, { "epoch": 4.02, "learning_rate": 2.8342808516497805e-05, "loss": 0.0023, "step": 19720 }, { "epoch": 4.02, "learning_rate": 2.8331469486288493e-05, "loss": 0.0004, "step": 19721 }, { "epoch": 4.02, "learning_rate": 2.832013248817329e-05, "loss": 0.0002, "step": 19722 }, { "epoch": 4.02, "learning_rate": 2.8308797522341564e-05, "loss": 0.0029, "step": 19723 }, { "epoch": 4.02, "learning_rate": 2.8297464588982645e-05, "loss": 0.0045, "step": 19724 }, { "epoch": 4.02, "learning_rate": 2.8286133688285777e-05, "loss": 0.007, "step": 19725 }, { "epoch": 4.02, "learning_rate": 2.8274804820440284e-05, "loss": 0.0002, "step": 19726 }, { "epoch": 4.02, "learning_rate": 2.8263477985635224e-05, "loss": 0.0022, "step": 19727 }, { "epoch": 4.02, "learning_rate": 2.8252153184059933e-05, "loss": 0.003, "step": 19728 }, { "epoch": 4.02, "learning_rate": 2.8240830415903492e-05, "loss": 0.001, "step": 19729 }, { "epoch": 4.02, "learning_rate": 2.8229509681355016e-05, "loss": 0.0028, "step": 19730 }, { "epoch": 4.02, "learning_rate": 2.821819098060364e-05, "loss": 0.0035, "step": 19731 }, { "epoch": 4.02, "learning_rate": 2.8206874313838258e-05, "loss": 0.0016, "step": 19732 }, { "epoch": 4.02, "learning_rate": 2.819555968124807e-05, "loss": 0.0021, "step": 19733 }, { "epoch": 4.02, "learning_rate": 2.818424708302186e-05, "loss": 0.0044, "step": 19734 }, { "epoch": 4.02, "learning_rate": 2.817293651934876e-05, "loss": 0.0006, "step": 19735 }, { "epoch": 4.02, "learning_rate": 2.816162799041755e-05, "loss": 0.0005, "step": 19736 }, { "epoch": 4.02, "learning_rate": 2.8150321496417135e-05, "loss": 0.0016, "step": 19737 }, { "epoch": 4.02, "learning_rate": 2.8139017037536356e-05, "loss": 0.0015, "step": 19738 }, { "epoch": 4.02, "learning_rate": 2.8127714613964015e-05, "loss": 0.0015, "step": 19739 }, { "epoch": 4.02, "learning_rate": 2.8116414225888893e-05, "loss": 0.0016, "step": 19740 }, { "epoch": 4.02, "learning_rate": 2.810511587349973e-05, "loss": 0.0004, "step": 19741 }, { "epoch": 4.02, "learning_rate": 2.8093819556985214e-05, "loss": 0.0023, "step": 19742 }, { "epoch": 4.02, "learning_rate": 2.8082525276534034e-05, "loss": 0.0032, "step": 19743 }, { "epoch": 4.02, "learning_rate": 2.8071233032334822e-05, "loss": 0.0022, "step": 19744 }, { "epoch": 4.02, "learning_rate": 2.8059942824576176e-05, "loss": 0.0001, "step": 19745 }, { "epoch": 4.02, "learning_rate": 2.8048654653446697e-05, "loss": 0.0019, "step": 19746 }, { "epoch": 4.02, "learning_rate": 2.8037368519134794e-05, "loss": 0.0018, "step": 19747 }, { "epoch": 4.02, "learning_rate": 2.802608442182916e-05, "loss": 0.0003, "step": 19748 }, { "epoch": 4.02, "learning_rate": 2.8014802361718102e-05, "loss": 0.0043, "step": 19749 }, { "epoch": 4.02, "learning_rate": 2.8003522338990074e-05, "loss": 0.0108, "step": 19750 }, { "epoch": 4.02, "learning_rate": 2.7992244353833577e-05, "loss": 0.0018, "step": 19751 }, { "epoch": 4.02, "learning_rate": 2.7980968406436838e-05, "loss": 0.0004, "step": 19752 }, { "epoch": 4.02, "learning_rate": 2.7969694496988326e-05, "loss": 0.0001, "step": 19753 }, { "epoch": 4.02, "learning_rate": 2.795842262567624e-05, "loss": 0.0035, "step": 19754 }, { "epoch": 4.02, "learning_rate": 2.794715279268885e-05, "loss": 0.0051, "step": 19755 }, { "epoch": 4.02, "learning_rate": 2.7935884998214414e-05, "loss": 0.0028, "step": 19756 }, { "epoch": 4.02, "learning_rate": 2.7924619242441086e-05, "loss": 0.0095, "step": 19757 }, { "epoch": 4.02, "learning_rate": 2.791335552555707e-05, "loss": 0.0001, "step": 19758 }, { "epoch": 4.02, "learning_rate": 2.790209384775047e-05, "loss": 0.0048, "step": 19759 }, { "epoch": 4.02, "learning_rate": 2.7890834209209383e-05, "loss": 0.0015, "step": 19760 }, { "epoch": 4.02, "learning_rate": 2.787957661012185e-05, "loss": 0.0037, "step": 19761 }, { "epoch": 4.02, "learning_rate": 2.7868321050675907e-05, "loss": 0.0019, "step": 19762 }, { "epoch": 4.02, "learning_rate": 2.7857067531059552e-05, "loss": 0.0001, "step": 19763 }, { "epoch": 4.02, "learning_rate": 2.784581605146077e-05, "loss": 0.0007, "step": 19764 }, { "epoch": 4.02, "learning_rate": 2.7834566612067356e-05, "loss": 0.0065, "step": 19765 }, { "epoch": 4.02, "learning_rate": 2.7823319213067364e-05, "loss": 0.0013, "step": 19766 }, { "epoch": 4.02, "learning_rate": 2.7812073854648475e-05, "loss": 0.0033, "step": 19767 }, { "epoch": 4.03, "learning_rate": 2.780083053699869e-05, "loss": 0.0006, "step": 19768 }, { "epoch": 4.03, "learning_rate": 2.778958926030566e-05, "loss": 0.0017, "step": 19769 }, { "epoch": 4.03, "learning_rate": 2.7778350024757185e-05, "loss": 0.0014, "step": 19770 }, { "epoch": 4.03, "learning_rate": 2.776711283054098e-05, "loss": 0.0003, "step": 19771 }, { "epoch": 4.03, "learning_rate": 2.7755877677844706e-05, "loss": 0.0013, "step": 19772 }, { "epoch": 4.03, "learning_rate": 2.7744644566856023e-05, "loss": 0.0033, "step": 19773 }, { "epoch": 4.03, "learning_rate": 2.7733413497762557e-05, "loss": 0.0007, "step": 19774 }, { "epoch": 4.03, "learning_rate": 2.7722184470751896e-05, "loss": 0.0033, "step": 19775 }, { "epoch": 4.03, "learning_rate": 2.7710957486011552e-05, "loss": 0.0017, "step": 19776 }, { "epoch": 4.03, "learning_rate": 2.7699732543729096e-05, "loss": 0.0021, "step": 19777 }, { "epoch": 4.03, "learning_rate": 2.7688509644091895e-05, "loss": 0.0027, "step": 19778 }, { "epoch": 4.03, "learning_rate": 2.7677288787287526e-05, "loss": 0.0003, "step": 19779 }, { "epoch": 4.03, "learning_rate": 2.766606997350326e-05, "loss": 0.0004, "step": 19780 }, { "epoch": 4.03, "learning_rate": 2.7654853202926587e-05, "loss": 0.0006, "step": 19781 }, { "epoch": 4.03, "learning_rate": 2.7643638475744862e-05, "loss": 0.001, "step": 19782 }, { "epoch": 4.03, "learning_rate": 2.763242579214524e-05, "loss": 0.0021, "step": 19783 }, { "epoch": 4.03, "learning_rate": 2.762121515231519e-05, "loss": 0.0003, "step": 19784 }, { "epoch": 4.03, "learning_rate": 2.7610006556441762e-05, "loss": 0.0002, "step": 19785 }, { "epoch": 4.03, "learning_rate": 2.7598800004712336e-05, "loss": 0.0047, "step": 19786 }, { "epoch": 4.03, "learning_rate": 2.7587595497313948e-05, "loss": 0.0003, "step": 19787 }, { "epoch": 4.03, "learning_rate": 2.7576393034433797e-05, "loss": 0.0005, "step": 19788 }, { "epoch": 4.03, "learning_rate": 2.756519261625897e-05, "loss": 0.0001, "step": 19789 }, { "epoch": 4.03, "learning_rate": 2.7553994242976528e-05, "loss": 0.0018, "step": 19790 }, { "epoch": 4.03, "learning_rate": 2.7542797914773528e-05, "loss": 0.0018, "step": 19791 }, { "epoch": 4.03, "learning_rate": 2.753160363183695e-05, "loss": 0.0004, "step": 19792 }, { "epoch": 4.03, "learning_rate": 2.752041139435378e-05, "loss": 0.0001, "step": 19793 }, { "epoch": 4.03, "learning_rate": 2.7509221202510915e-05, "loss": 0.0001, "step": 19794 }, { "epoch": 4.03, "learning_rate": 2.749803305649533e-05, "loss": 0.0004, "step": 19795 }, { "epoch": 4.03, "learning_rate": 2.7486846956493746e-05, "loss": 0.0037, "step": 19796 }, { "epoch": 4.03, "learning_rate": 2.7475662902693174e-05, "loss": 0.0023, "step": 19797 }, { "epoch": 4.03, "learning_rate": 2.746448089528021e-05, "loss": 0.0006, "step": 19798 }, { "epoch": 4.03, "learning_rate": 2.7453300934441808e-05, "loss": 0.001, "step": 19799 }, { "epoch": 4.03, "learning_rate": 2.7442123020364565e-05, "loss": 0.0025, "step": 19800 }, { "epoch": 4.03, "learning_rate": 2.74309471532352e-05, "loss": 0.0005, "step": 19801 }, { "epoch": 4.03, "learning_rate": 2.7419773333240397e-05, "loss": 0.0029, "step": 19802 }, { "epoch": 4.03, "learning_rate": 2.7408601560566757e-05, "loss": 0.003, "step": 19803 }, { "epoch": 4.03, "learning_rate": 2.739743183540088e-05, "loss": 0.0003, "step": 19804 }, { "epoch": 4.03, "learning_rate": 2.7386264157929317e-05, "loss": 0.0056, "step": 19805 }, { "epoch": 4.03, "learning_rate": 2.7375098528338603e-05, "loss": 0.0058, "step": 19806 }, { "epoch": 4.03, "learning_rate": 2.73639349468152e-05, "loss": 0.0028, "step": 19807 }, { "epoch": 4.03, "learning_rate": 2.7352773413545588e-05, "loss": 0.0003, "step": 19808 }, { "epoch": 4.03, "learning_rate": 2.734161392871617e-05, "loss": 0.0016, "step": 19809 }, { "epoch": 4.03, "learning_rate": 2.7330456492513374e-05, "loss": 0.0027, "step": 19810 }, { "epoch": 4.03, "learning_rate": 2.731930110512343e-05, "loss": 0.0013, "step": 19811 }, { "epoch": 4.03, "learning_rate": 2.7308147766732773e-05, "loss": 0.0001, "step": 19812 }, { "epoch": 4.03, "learning_rate": 2.729699647752764e-05, "loss": 0.0054, "step": 19813 }, { "epoch": 4.03, "learning_rate": 2.728584723769429e-05, "loss": 0.0017, "step": 19814 }, { "epoch": 4.03, "learning_rate": 2.727470004741897e-05, "loss": 0.0001, "step": 19815 }, { "epoch": 4.03, "learning_rate": 2.7263554906887736e-05, "loss": 0.0028, "step": 19816 }, { "epoch": 4.04, "learning_rate": 2.7252411816286895e-05, "loss": 0.0008, "step": 19817 }, { "epoch": 4.04, "learning_rate": 2.7241270775802414e-05, "loss": 0.0038, "step": 19818 }, { "epoch": 4.04, "learning_rate": 2.7230131785620497e-05, "loss": 0.0046, "step": 19819 }, { "epoch": 4.04, "learning_rate": 2.721899484592709e-05, "loss": 0.0014, "step": 19820 }, { "epoch": 4.04, "learning_rate": 2.7207859956908247e-05, "loss": 0.0033, "step": 19821 }, { "epoch": 4.04, "learning_rate": 2.7196727118749917e-05, "loss": 0.002, "step": 19822 }, { "epoch": 4.04, "learning_rate": 2.7185596331638053e-05, "loss": 0.0005, "step": 19823 }, { "epoch": 4.04, "learning_rate": 2.717446759575856e-05, "loss": 0.0002, "step": 19824 }, { "epoch": 4.04, "learning_rate": 2.71633409112973e-05, "loss": 0.0034, "step": 19825 }, { "epoch": 4.04, "learning_rate": 2.7152216278440124e-05, "loss": 0.0084, "step": 19826 }, { "epoch": 4.04, "learning_rate": 2.7141093697372824e-05, "loss": 0.0007, "step": 19827 }, { "epoch": 4.04, "learning_rate": 2.712997316828121e-05, "loss": 0.0046, "step": 19828 }, { "epoch": 4.04, "learning_rate": 2.7118854691350907e-05, "loss": 0.0054, "step": 19829 }, { "epoch": 4.04, "learning_rate": 2.710773826676776e-05, "loss": 0.0061, "step": 19830 }, { "epoch": 4.04, "learning_rate": 2.709662389471729e-05, "loss": 0.0085, "step": 19831 }, { "epoch": 4.04, "learning_rate": 2.7085511575385266e-05, "loss": 0.006, "step": 19832 }, { "epoch": 4.04, "learning_rate": 2.707440130895717e-05, "loss": 0.0008, "step": 19833 }, { "epoch": 4.04, "learning_rate": 2.7063293095618578e-05, "loss": 0.0007, "step": 19834 }, { "epoch": 4.04, "learning_rate": 2.705218693555513e-05, "loss": 0.0023, "step": 19835 }, { "epoch": 4.04, "learning_rate": 2.704108282895217e-05, "loss": 0.0002, "step": 19836 }, { "epoch": 4.04, "learning_rate": 2.7029980775995298e-05, "loss": 0.0026, "step": 19837 }, { "epoch": 4.04, "learning_rate": 2.701888077686983e-05, "loss": 0.0017, "step": 19838 }, { "epoch": 4.04, "learning_rate": 2.7007782831761197e-05, "loss": 0.0023, "step": 19839 }, { "epoch": 4.04, "learning_rate": 2.6996686940854762e-05, "loss": 0.0002, "step": 19840 }, { "epoch": 4.04, "learning_rate": 2.6985593104335833e-05, "loss": 0.0014, "step": 19841 }, { "epoch": 4.04, "learning_rate": 2.69745013223897e-05, "loss": 0.0016, "step": 19842 }, { "epoch": 4.04, "learning_rate": 2.6963411595201633e-05, "loss": 0.0025, "step": 19843 }, { "epoch": 4.04, "learning_rate": 2.6952323922956846e-05, "loss": 0.0026, "step": 19844 }, { "epoch": 4.04, "learning_rate": 2.6941238305840496e-05, "loss": 0.003, "step": 19845 }, { "epoch": 4.04, "learning_rate": 2.6930154744037813e-05, "loss": 0.0089, "step": 19846 }, { "epoch": 4.04, "learning_rate": 2.6919073237733767e-05, "loss": 0.0006, "step": 19847 }, { "epoch": 4.04, "learning_rate": 2.6907993787113614e-05, "loss": 0.0001, "step": 19848 }, { "epoch": 4.04, "learning_rate": 2.689691639236225e-05, "loss": 0.0035, "step": 19849 }, { "epoch": 4.04, "learning_rate": 2.6885841053664814e-05, "loss": 0.0049, "step": 19850 }, { "epoch": 4.04, "learning_rate": 2.6874767771206207e-05, "loss": 0.0003, "step": 19851 }, { "epoch": 4.04, "learning_rate": 2.686369654517138e-05, "loss": 0.0015, "step": 19852 }, { "epoch": 4.04, "learning_rate": 2.6852627375745257e-05, "loss": 0.0008, "step": 19853 }, { "epoch": 4.04, "learning_rate": 2.6841560263112717e-05, "loss": 0.0002, "step": 19854 }, { "epoch": 4.04, "learning_rate": 2.6830495207458596e-05, "loss": 0.0016, "step": 19855 }, { "epoch": 4.04, "learning_rate": 2.6819432208967718e-05, "loss": 0.0014, "step": 19856 }, { "epoch": 4.04, "learning_rate": 2.680837126782483e-05, "loss": 0.0012, "step": 19857 }, { "epoch": 4.04, "learning_rate": 2.6797312384214685e-05, "loss": 0.0004, "step": 19858 }, { "epoch": 4.04, "learning_rate": 2.6786255558321972e-05, "loss": 0.0049, "step": 19859 }, { "epoch": 4.04, "learning_rate": 2.677520079033139e-05, "loss": 0.0029, "step": 19860 }, { "epoch": 4.04, "learning_rate": 2.6764148080427596e-05, "loss": 0.0016, "step": 19861 }, { "epoch": 4.04, "learning_rate": 2.6753097428795066e-05, "loss": 0.0025, "step": 19862 }, { "epoch": 4.04, "learning_rate": 2.6742048835618545e-05, "loss": 0.0015, "step": 19863 }, { "epoch": 4.04, "learning_rate": 2.6731002301082382e-05, "loss": 0.0003, "step": 19864 }, { "epoch": 4.04, "learning_rate": 2.6719957825371212e-05, "loss": 0.0036, "step": 19865 }, { "epoch": 4.05, "learning_rate": 2.670891540866949e-05, "loss": 0.0011, "step": 19866 }, { "epoch": 4.05, "learning_rate": 2.6697875051161548e-05, "loss": 0.0013, "step": 19867 }, { "epoch": 4.05, "learning_rate": 2.6686836753031892e-05, "loss": 0.0007, "step": 19868 }, { "epoch": 4.05, "learning_rate": 2.6675800514464806e-05, "loss": 0.0065, "step": 19869 }, { "epoch": 4.05, "learning_rate": 2.6664766335644662e-05, "loss": 0.0058, "step": 19870 }, { "epoch": 4.05, "learning_rate": 2.6653734216755706e-05, "loss": 0.002, "step": 19871 }, { "epoch": 4.05, "learning_rate": 2.6642704157982232e-05, "loss": 0.0006, "step": 19872 }, { "epoch": 4.05, "learning_rate": 2.6631676159508453e-05, "loss": 0.0018, "step": 19873 }, { "epoch": 4.05, "learning_rate": 2.662065022151854e-05, "loss": 0.0034, "step": 19874 }, { "epoch": 4.05, "learning_rate": 2.6609626344196684e-05, "loss": 0.0001, "step": 19875 }, { "epoch": 4.05, "learning_rate": 2.659860452772698e-05, "loss": 0.0017, "step": 19876 }, { "epoch": 4.05, "learning_rate": 2.6587584772293503e-05, "loss": 0.0057, "step": 19877 }, { "epoch": 4.05, "learning_rate": 2.6576567078080336e-05, "loss": 0.0022, "step": 19878 }, { "epoch": 4.05, "learning_rate": 2.65655514452715e-05, "loss": 0.0032, "step": 19879 }, { "epoch": 4.05, "learning_rate": 2.6554537874050878e-05, "loss": 0.0008, "step": 19880 }, { "epoch": 4.05, "learning_rate": 2.654352636460258e-05, "loss": 0.002, "step": 19881 }, { "epoch": 4.05, "learning_rate": 2.6532516917110352e-05, "loss": 0.0045, "step": 19882 }, { "epoch": 4.05, "learning_rate": 2.6521509531758233e-05, "loss": 0.0031, "step": 19883 }, { "epoch": 4.05, "learning_rate": 2.6510504208729942e-05, "loss": 0.0043, "step": 19884 }, { "epoch": 4.05, "learning_rate": 2.6499500948209335e-05, "loss": 0.0021, "step": 19885 }, { "epoch": 4.05, "learning_rate": 2.6488499750380192e-05, "loss": 0.0005, "step": 19886 }, { "epoch": 4.05, "learning_rate": 2.6477500615426206e-05, "loss": 0.0015, "step": 19887 }, { "epoch": 4.05, "learning_rate": 2.6466503543531193e-05, "loss": 0.0077, "step": 19888 }, { "epoch": 4.05, "learning_rate": 2.6455508534878737e-05, "loss": 0.001, "step": 19889 }, { "epoch": 4.05, "learning_rate": 2.644451558965248e-05, "loss": 0.0056, "step": 19890 }, { "epoch": 4.05, "learning_rate": 2.6433524708036043e-05, "loss": 0.0004, "step": 19891 }, { "epoch": 4.05, "learning_rate": 2.6422535890213002e-05, "loss": 0.0054, "step": 19892 }, { "epoch": 4.05, "learning_rate": 2.6411549136366874e-05, "loss": 0.0037, "step": 19893 }, { "epoch": 4.05, "learning_rate": 2.640056444668115e-05, "loss": 0.0009, "step": 19894 }, { "epoch": 4.05, "learning_rate": 2.6389581821339325e-05, "loss": 0.0086, "step": 19895 }, { "epoch": 4.05, "learning_rate": 2.637860126052481e-05, "loss": 0.0027, "step": 19896 }, { "epoch": 4.05, "learning_rate": 2.6367622764421053e-05, "loss": 0.0018, "step": 19897 }, { "epoch": 4.05, "learning_rate": 2.6356646333211283e-05, "loss": 0.0044, "step": 19898 }, { "epoch": 4.05, "learning_rate": 2.634567196707899e-05, "loss": 0.0053, "step": 19899 }, { "epoch": 4.05, "learning_rate": 2.6334699666207325e-05, "loss": 0.0004, "step": 19900 }, { "epoch": 4.05, "learning_rate": 2.6323729430779662e-05, "loss": 0.002, "step": 19901 }, { "epoch": 4.05, "learning_rate": 2.631276126097915e-05, "loss": 0.0038, "step": 19902 }, { "epoch": 4.05, "learning_rate": 2.6301795156989008e-05, "loss": 0.0103, "step": 19903 }, { "epoch": 4.05, "learning_rate": 2.6290831118992378e-05, "loss": 0.0006, "step": 19904 }, { "epoch": 4.05, "learning_rate": 2.627986914717238e-05, "loss": 0.0016, "step": 19905 }, { "epoch": 4.05, "learning_rate": 2.626890924171211e-05, "loss": 0.0047, "step": 19906 }, { "epoch": 4.05, "learning_rate": 2.6257951402794613e-05, "loss": 0.0018, "step": 19907 }, { "epoch": 4.05, "learning_rate": 2.6246995630602908e-05, "loss": 0.0013, "step": 19908 }, { "epoch": 4.05, "learning_rate": 2.6236041925319977e-05, "loss": 0.0058, "step": 19909 }, { "epoch": 4.05, "learning_rate": 2.6225090287128763e-05, "loss": 0.0027, "step": 19910 }, { "epoch": 4.05, "learning_rate": 2.62141407162122e-05, "loss": 0.0018, "step": 19911 }, { "epoch": 4.05, "learning_rate": 2.620319321275316e-05, "loss": 0.0001, "step": 19912 }, { "epoch": 4.05, "learning_rate": 2.6192247776934427e-05, "loss": 0.0021, "step": 19913 }, { "epoch": 4.05, "learning_rate": 2.6181304408938925e-05, "loss": 0.0018, "step": 19914 }, { "epoch": 4.06, "learning_rate": 2.6170363108949272e-05, "loss": 0.002, "step": 19915 }, { "epoch": 4.06, "learning_rate": 2.6159423877148406e-05, "loss": 0.0009, "step": 19916 }, { "epoch": 4.06, "learning_rate": 2.6148486713718862e-05, "loss": 0.0003, "step": 19917 }, { "epoch": 4.06, "learning_rate": 2.613755161884335e-05, "loss": 0.0014, "step": 19918 }, { "epoch": 4.06, "learning_rate": 2.6126618592704617e-05, "loss": 0.002, "step": 19919 }, { "epoch": 4.06, "learning_rate": 2.6115687635485123e-05, "loss": 0.0058, "step": 19920 }, { "epoch": 4.06, "learning_rate": 2.6104758747367516e-05, "loss": 0.0003, "step": 19921 }, { "epoch": 4.06, "learning_rate": 2.6093831928534287e-05, "loss": 0.0013, "step": 19922 }, { "epoch": 4.06, "learning_rate": 2.6082907179167973e-05, "loss": 0.003, "step": 19923 }, { "epoch": 4.06, "learning_rate": 2.6071984499450992e-05, "loss": 0.0006, "step": 19924 }, { "epoch": 4.06, "learning_rate": 2.6061063889565818e-05, "loss": 0.002, "step": 19925 }, { "epoch": 4.06, "learning_rate": 2.605014534969484e-05, "loss": 0.0002, "step": 19926 }, { "epoch": 4.06, "learning_rate": 2.603922888002039e-05, "loss": 0.0017, "step": 19927 }, { "epoch": 4.06, "learning_rate": 2.602831448072481e-05, "loss": 0.0003, "step": 19928 }, { "epoch": 4.06, "learning_rate": 2.60174021519904e-05, "loss": 0.0013, "step": 19929 }, { "epoch": 4.06, "learning_rate": 2.6006491893999438e-05, "loss": 0.0015, "step": 19930 }, { "epoch": 4.06, "learning_rate": 2.5995583706934053e-05, "loss": 0.0009, "step": 19931 }, { "epoch": 4.06, "learning_rate": 2.5984677590976553e-05, "loss": 0.0012, "step": 19932 }, { "epoch": 4.06, "learning_rate": 2.597377354630896e-05, "loss": 0.0, "step": 19933 }, { "epoch": 4.06, "learning_rate": 2.5962871573113564e-05, "loss": 0.0002, "step": 19934 }, { "epoch": 4.06, "learning_rate": 2.595197167157228e-05, "loss": 0.0088, "step": 19935 }, { "epoch": 4.06, "learning_rate": 2.594107384186725e-05, "loss": 0.0001, "step": 19936 }, { "epoch": 4.06, "learning_rate": 2.593017808418046e-05, "loss": 0.0024, "step": 19937 }, { "epoch": 4.06, "learning_rate": 2.591928439869388e-05, "loss": 0.0017, "step": 19938 }, { "epoch": 4.06, "learning_rate": 2.590839278558948e-05, "loss": 0.0048, "step": 19939 }, { "epoch": 4.06, "learning_rate": 2.5897503245049155e-05, "loss": 0.0004, "step": 19940 }, { "epoch": 4.06, "learning_rate": 2.5886615777254788e-05, "loss": 0.0005, "step": 19941 }, { "epoch": 4.06, "learning_rate": 2.5875730382388215e-05, "loss": 0.0025, "step": 19942 }, { "epoch": 4.06, "learning_rate": 2.5864847060631295e-05, "loss": 0.0008, "step": 19943 }, { "epoch": 4.06, "learning_rate": 2.585396581216566e-05, "loss": 0.0019, "step": 19944 }, { "epoch": 4.06, "learning_rate": 2.5843086637173238e-05, "loss": 0.0009, "step": 19945 }, { "epoch": 4.06, "learning_rate": 2.583220953583553e-05, "loss": 0.0022, "step": 19946 }, { "epoch": 4.06, "learning_rate": 2.5821334508334358e-05, "loss": 0.0028, "step": 19947 }, { "epoch": 4.06, "learning_rate": 2.581046155485134e-05, "loss": 0.0024, "step": 19948 }, { "epoch": 4.06, "learning_rate": 2.5799590675567955e-05, "loss": 0.0039, "step": 19949 }, { "epoch": 4.06, "learning_rate": 2.5788721870665936e-05, "loss": 0.0002, "step": 19950 }, { "epoch": 4.06, "learning_rate": 2.5777855140326654e-05, "loss": 0.0004, "step": 19951 }, { "epoch": 4.06, "learning_rate": 2.576699048473173e-05, "loss": 0.0012, "step": 19952 }, { "epoch": 4.06, "learning_rate": 2.5756127904062557e-05, "loss": 0.0002, "step": 19953 }, { "epoch": 4.06, "learning_rate": 2.5745267398500567e-05, "loss": 0.0042, "step": 19954 }, { "epoch": 4.06, "learning_rate": 2.5734408968227154e-05, "loss": 0.0049, "step": 19955 }, { "epoch": 4.06, "learning_rate": 2.5723552613423687e-05, "loss": 0.0002, "step": 19956 }, { "epoch": 4.06, "learning_rate": 2.5712698334271486e-05, "loss": 0.0002, "step": 19957 }, { "epoch": 4.06, "learning_rate": 2.570184613095181e-05, "loss": 0.002, "step": 19958 }, { "epoch": 4.06, "learning_rate": 2.569099600364596e-05, "loss": 0.002, "step": 19959 }, { "epoch": 4.06, "learning_rate": 2.5680147952535106e-05, "loss": 0.0002, "step": 19960 }, { "epoch": 4.06, "learning_rate": 2.566930197780046e-05, "loss": 0.0037, "step": 19961 }, { "epoch": 4.06, "learning_rate": 2.5658458079623157e-05, "loss": 0.0017, "step": 19962 }, { "epoch": 4.06, "learning_rate": 2.5647616258184352e-05, "loss": 0.0006, "step": 19963 }, { "epoch": 4.07, "learning_rate": 2.5636776513665014e-05, "loss": 0.0033, "step": 19964 }, { "epoch": 4.07, "learning_rate": 2.5625938846246337e-05, "loss": 0.0037, "step": 19965 }, { "epoch": 4.07, "learning_rate": 2.5615103256109186e-05, "loss": 0.0011, "step": 19966 }, { "epoch": 4.07, "learning_rate": 2.5604269743434675e-05, "loss": 0.0015, "step": 19967 }, { "epoch": 4.07, "learning_rate": 2.5593438308403617e-05, "loss": 0.0018, "step": 19968 }, { "epoch": 4.07, "learning_rate": 2.5582608951196993e-05, "loss": 0.0113, "step": 19969 }, { "epoch": 4.07, "learning_rate": 2.557178167199565e-05, "loss": 0.0031, "step": 19970 }, { "epoch": 4.07, "learning_rate": 2.556095647098043e-05, "loss": 0.0011, "step": 19971 }, { "epoch": 4.07, "learning_rate": 2.5550133348332123e-05, "loss": 0.0031, "step": 19972 }, { "epoch": 4.07, "learning_rate": 2.5539312304231518e-05, "loss": 0.0001, "step": 19973 }, { "epoch": 4.07, "learning_rate": 2.5528493338859334e-05, "loss": 0.0019, "step": 19974 }, { "epoch": 4.07, "learning_rate": 2.5517676452396264e-05, "loss": 0.0028, "step": 19975 }, { "epoch": 4.07, "learning_rate": 2.5506861645023007e-05, "loss": 0.0011, "step": 19976 }, { "epoch": 4.07, "learning_rate": 2.5496048916920076e-05, "loss": 0.0008, "step": 19977 }, { "epoch": 4.07, "learning_rate": 2.5485238268268204e-05, "loss": 0.0029, "step": 19978 }, { "epoch": 4.07, "learning_rate": 2.5474429699247867e-05, "loss": 0.0004, "step": 19979 }, { "epoch": 4.07, "learning_rate": 2.5463623210039635e-05, "loss": 0.0007, "step": 19980 }, { "epoch": 4.07, "learning_rate": 2.5452818800823997e-05, "loss": 0.0001, "step": 19981 }, { "epoch": 4.07, "learning_rate": 2.5442016471781314e-05, "loss": 0.0051, "step": 19982 }, { "epoch": 4.07, "learning_rate": 2.543121622309215e-05, "loss": 0.0019, "step": 19983 }, { "epoch": 4.07, "learning_rate": 2.542041805493675e-05, "loss": 0.0012, "step": 19984 }, { "epoch": 4.07, "learning_rate": 2.5409621967495597e-05, "loss": 0.0026, "step": 19985 }, { "epoch": 4.07, "learning_rate": 2.5398827960948886e-05, "loss": 0.0019, "step": 19986 }, { "epoch": 4.07, "learning_rate": 2.5388036035476972e-05, "loss": 0.0003, "step": 19987 }, { "epoch": 4.07, "learning_rate": 2.5377246191260074e-05, "loss": 0.0002, "step": 19988 }, { "epoch": 4.07, "learning_rate": 2.5366458428478403e-05, "loss": 0.0011, "step": 19989 }, { "epoch": 4.07, "learning_rate": 2.535567274731213e-05, "loss": 0.0013, "step": 19990 }, { "epoch": 4.07, "learning_rate": 2.5344889147941404e-05, "loss": 0.0005, "step": 19991 }, { "epoch": 4.07, "learning_rate": 2.5334107630546357e-05, "loss": 0.0001, "step": 19992 }, { "epoch": 4.07, "learning_rate": 2.532332819530701e-05, "loss": 0.002, "step": 19993 }, { "epoch": 4.07, "learning_rate": 2.5312550842403477e-05, "loss": 0.0001, "step": 19994 }, { "epoch": 4.07, "learning_rate": 2.5301775572015624e-05, "loss": 0.0059, "step": 19995 }, { "epoch": 4.07, "learning_rate": 2.529100238432359e-05, "loss": 0.0016, "step": 19996 }, { "epoch": 4.07, "learning_rate": 2.528023127950714e-05, "loss": 0.0003, "step": 19997 }, { "epoch": 4.07, "learning_rate": 2.5269462257746338e-05, "loss": 0.0003, "step": 19998 }, { "epoch": 4.07, "learning_rate": 2.52586953192209e-05, "loss": 0.0007, "step": 19999 }, { "epoch": 4.07, "learning_rate": 2.5247930464110705e-05, "loss": 0.0038, "step": 20000 }, { "epoch": 4.07, "learning_rate": 2.523716769259562e-05, "loss": 0.0011, "step": 20001 }, { "epoch": 4.07, "learning_rate": 2.522640700485526e-05, "loss": 0.0014, "step": 20002 }, { "epoch": 4.07, "learning_rate": 2.5215648401069522e-05, "loss": 0.0043, "step": 20003 }, { "epoch": 4.07, "learning_rate": 2.520489188141795e-05, "loss": 0.0063, "step": 20004 }, { "epoch": 4.07, "learning_rate": 2.5194137446080264e-05, "loss": 0.0016, "step": 20005 }, { "epoch": 4.07, "learning_rate": 2.5183385095236057e-05, "loss": 0.0003, "step": 20006 }, { "epoch": 4.07, "learning_rate": 2.5172634829064935e-05, "loss": 0.008, "step": 20007 }, { "epoch": 4.07, "learning_rate": 2.5161886647746436e-05, "loss": 0.0048, "step": 20008 }, { "epoch": 4.07, "learning_rate": 2.5151140551460085e-05, "loss": 0.0068, "step": 20009 }, { "epoch": 4.07, "learning_rate": 2.5140396540385353e-05, "loss": 0.0079, "step": 20010 }, { "epoch": 4.07, "learning_rate": 2.5129654614701685e-05, "loss": 0.0002, "step": 20011 }, { "epoch": 4.07, "learning_rate": 2.5118914774588495e-05, "loss": 0.0037, "step": 20012 }, { "epoch": 4.08, "learning_rate": 2.5108177020225163e-05, "loss": 0.0006, "step": 20013 }, { "epoch": 4.08, "learning_rate": 2.509744135179106e-05, "loss": 0.0065, "step": 20014 }, { "epoch": 4.08, "learning_rate": 2.5086707769465374e-05, "loss": 0.0001, "step": 20015 }, { "epoch": 4.08, "learning_rate": 2.5075976273427534e-05, "loss": 0.0001, "step": 20016 }, { "epoch": 4.08, "learning_rate": 2.5065246863856642e-05, "loss": 0.0026, "step": 20017 }, { "epoch": 4.08, "learning_rate": 2.5054519540932022e-05, "loss": 0.0004, "step": 20018 }, { "epoch": 4.08, "learning_rate": 2.504379430483273e-05, "loss": 0.0001, "step": 20019 }, { "epoch": 4.08, "learning_rate": 2.503307115573796e-05, "loss": 0.0001, "step": 20020 }, { "epoch": 4.08, "learning_rate": 2.502235009382678e-05, "loss": 0.0008, "step": 20021 }, { "epoch": 4.08, "learning_rate": 2.5011631119278286e-05, "loss": 0.002, "step": 20022 }, { "epoch": 4.08, "learning_rate": 2.5000914232271462e-05, "loss": 0.0026, "step": 20023 }, { "epoch": 4.08, "learning_rate": 2.4990199432985337e-05, "loss": 0.0015, "step": 20024 }, { "epoch": 4.08, "learning_rate": 2.4979486721598845e-05, "loss": 0.0023, "step": 20025 }, { "epoch": 4.08, "learning_rate": 2.496877609829093e-05, "loss": 0.0027, "step": 20026 }, { "epoch": 4.08, "learning_rate": 2.49580675632405e-05, "loss": 0.0038, "step": 20027 }, { "epoch": 4.08, "learning_rate": 2.4947361116626297e-05, "loss": 0.0032, "step": 20028 }, { "epoch": 4.08, "learning_rate": 2.493665675862729e-05, "loss": 0.0057, "step": 20029 }, { "epoch": 4.08, "learning_rate": 2.4925954489422117e-05, "loss": 0.0008, "step": 20030 }, { "epoch": 4.08, "learning_rate": 2.491525430918964e-05, "loss": 0.0007, "step": 20031 }, { "epoch": 4.08, "learning_rate": 2.4904556218108567e-05, "loss": 0.0002, "step": 20032 }, { "epoch": 4.08, "learning_rate": 2.4893860216357452e-05, "loss": 0.0034, "step": 20033 }, { "epoch": 4.08, "learning_rate": 2.488316630411512e-05, "loss": 0.0011, "step": 20034 }, { "epoch": 4.08, "learning_rate": 2.4872474481559994e-05, "loss": 0.0049, "step": 20035 }, { "epoch": 4.08, "learning_rate": 2.4861784748870817e-05, "loss": 0.0019, "step": 20036 }, { "epoch": 4.08, "learning_rate": 2.4851097106226024e-05, "loss": 0.0062, "step": 20037 }, { "epoch": 4.08, "learning_rate": 2.484041155380413e-05, "loss": 0.0002, "step": 20038 }, { "epoch": 4.08, "learning_rate": 2.482972809178362e-05, "loss": 0.0018, "step": 20039 }, { "epoch": 4.08, "learning_rate": 2.4819046720342934e-05, "loss": 0.0009, "step": 20040 }, { "epoch": 4.08, "learning_rate": 2.4808367439660465e-05, "loss": 0.0001, "step": 20041 }, { "epoch": 4.08, "learning_rate": 2.479769024991457e-05, "loss": 0.0005, "step": 20042 }, { "epoch": 4.08, "learning_rate": 2.478701515128359e-05, "loss": 0.0007, "step": 20043 }, { "epoch": 4.08, "learning_rate": 2.47763421439458e-05, "loss": 0.002, "step": 20044 }, { "epoch": 4.08, "learning_rate": 2.476567122807952e-05, "loss": 0.001, "step": 20045 }, { "epoch": 4.08, "learning_rate": 2.475500240386286e-05, "loss": 0.0003, "step": 20046 }, { "epoch": 4.08, "learning_rate": 2.474433567147413e-05, "loss": 0.0007, "step": 20047 }, { "epoch": 4.08, "learning_rate": 2.4733671031091368e-05, "loss": 0.0015, "step": 20048 }, { "epoch": 4.08, "learning_rate": 2.472300848289283e-05, "loss": 0.0002, "step": 20049 }, { "epoch": 4.08, "learning_rate": 2.4712348027056494e-05, "loss": 0.003, "step": 20050 }, { "epoch": 4.08, "learning_rate": 2.470168966376045e-05, "loss": 0.0024, "step": 20051 }, { "epoch": 4.08, "learning_rate": 2.46910333931827e-05, "loss": 0.009, "step": 20052 }, { "epoch": 4.08, "learning_rate": 2.4680379215501178e-05, "loss": 0.0001, "step": 20053 }, { "epoch": 4.08, "learning_rate": 2.466972713089397e-05, "loss": 0.0016, "step": 20054 }, { "epoch": 4.08, "learning_rate": 2.4659077139538862e-05, "loss": 0.0044, "step": 20055 }, { "epoch": 4.08, "learning_rate": 2.4648429241613755e-05, "loss": 0.0026, "step": 20056 }, { "epoch": 4.08, "learning_rate": 2.46377834372965e-05, "loss": 0.0007, "step": 20057 }, { "epoch": 4.08, "learning_rate": 2.4627139726764904e-05, "loss": 0.0024, "step": 20058 }, { "epoch": 4.08, "learning_rate": 2.4616498110196732e-05, "loss": 0.0054, "step": 20059 }, { "epoch": 4.08, "learning_rate": 2.4605858587769717e-05, "loss": 0.0005, "step": 20060 }, { "epoch": 4.08, "learning_rate": 2.4595221159661555e-05, "loss": 0.0008, "step": 20061 }, { "epoch": 4.09, "learning_rate": 2.458458582604992e-05, "loss": 0.0033, "step": 20062 }, { "epoch": 4.09, "learning_rate": 2.457395258711245e-05, "loss": 0.0012, "step": 20063 }, { "epoch": 4.09, "learning_rate": 2.4563321443026722e-05, "loss": 0.0024, "step": 20064 }, { "epoch": 4.09, "learning_rate": 2.4552692393970346e-05, "loss": 0.0015, "step": 20065 }, { "epoch": 4.09, "learning_rate": 2.454206544012073e-05, "loss": 0.0003, "step": 20066 }, { "epoch": 4.09, "learning_rate": 2.453144058165551e-05, "loss": 0.0009, "step": 20067 }, { "epoch": 4.09, "learning_rate": 2.4520817818752032e-05, "loss": 0.0073, "step": 20068 }, { "epoch": 4.09, "learning_rate": 2.4510197151587767e-05, "loss": 0.0019, "step": 20069 }, { "epoch": 4.09, "learning_rate": 2.449957858034008e-05, "loss": 0.0027, "step": 20070 }, { "epoch": 4.09, "learning_rate": 2.448896210518632e-05, "loss": 0.0061, "step": 20071 }, { "epoch": 4.09, "learning_rate": 2.4478347726303838e-05, "loss": 0.0015, "step": 20072 }, { "epoch": 4.09, "learning_rate": 2.4467735443869868e-05, "loss": 0.0041, "step": 20073 }, { "epoch": 4.09, "learning_rate": 2.445712525806167e-05, "loss": 0.0003, "step": 20074 }, { "epoch": 4.09, "learning_rate": 2.4446517169056474e-05, "loss": 0.0017, "step": 20075 }, { "epoch": 4.09, "learning_rate": 2.4435911177031432e-05, "loss": 0.0037, "step": 20076 }, { "epoch": 4.09, "learning_rate": 2.4425307282163704e-05, "loss": 0.0152, "step": 20077 }, { "epoch": 4.09, "learning_rate": 2.4414705484630398e-05, "loss": 0.0002, "step": 20078 }, { "epoch": 4.09, "learning_rate": 2.4404105784608523e-05, "loss": 0.0008, "step": 20079 }, { "epoch": 4.09, "learning_rate": 2.4393508182275207e-05, "loss": 0.0053, "step": 20080 }, { "epoch": 4.09, "learning_rate": 2.4382912677807355e-05, "loss": 0.0015, "step": 20081 }, { "epoch": 4.09, "learning_rate": 2.437231927138204e-05, "loss": 0.0005, "step": 20082 }, { "epoch": 4.09, "learning_rate": 2.436172796317609e-05, "loss": 0.0008, "step": 20083 }, { "epoch": 4.09, "learning_rate": 2.4351138753366416e-05, "loss": 0.0112, "step": 20084 }, { "epoch": 4.09, "learning_rate": 2.4340551642129973e-05, "loss": 0.002, "step": 20085 }, { "epoch": 4.09, "learning_rate": 2.4329966629643455e-05, "loss": 0.0022, "step": 20086 }, { "epoch": 4.09, "learning_rate": 2.4319383716083768e-05, "loss": 0.0009, "step": 20087 }, { "epoch": 4.09, "learning_rate": 2.4308802901627587e-05, "loss": 0.0037, "step": 20088 }, { "epoch": 4.09, "learning_rate": 2.4298224186451643e-05, "loss": 0.0019, "step": 20089 }, { "epoch": 4.09, "learning_rate": 2.4287647570732656e-05, "loss": 0.0006, "step": 20090 }, { "epoch": 4.09, "learning_rate": 2.4277073054647233e-05, "loss": 0.0002, "step": 20091 }, { "epoch": 4.09, "learning_rate": 2.426650063837202e-05, "loss": 0.0002, "step": 20092 }, { "epoch": 4.09, "learning_rate": 2.4255930322083578e-05, "loss": 0.0017, "step": 20093 }, { "epoch": 4.09, "learning_rate": 2.424536210595846e-05, "loss": 0.0026, "step": 20094 }, { "epoch": 4.09, "learning_rate": 2.4234795990173177e-05, "loss": 0.0094, "step": 20095 }, { "epoch": 4.09, "learning_rate": 2.4224231974904242e-05, "loss": 0.0003, "step": 20096 }, { "epoch": 4.09, "learning_rate": 2.4213670060327973e-05, "loss": 0.0001, "step": 20097 }, { "epoch": 4.09, "learning_rate": 2.4203110246620916e-05, "loss": 0.0035, "step": 20098 }, { "epoch": 4.09, "learning_rate": 2.4192552533959316e-05, "loss": 0.0041, "step": 20099 }, { "epoch": 4.09, "learning_rate": 2.418199692251964e-05, "loss": 0.0029, "step": 20100 }, { "epoch": 4.09, "learning_rate": 2.4171443412478074e-05, "loss": 0.0048, "step": 20101 }, { "epoch": 4.09, "learning_rate": 2.4160892004010924e-05, "loss": 0.002, "step": 20102 }, { "epoch": 4.09, "learning_rate": 2.4150342697294412e-05, "loss": 0.0007, "step": 20103 }, { "epoch": 4.09, "learning_rate": 2.413979549250473e-05, "loss": 0.0021, "step": 20104 }, { "epoch": 4.09, "learning_rate": 2.4129250389818043e-05, "loss": 0.0023, "step": 20105 }, { "epoch": 4.09, "learning_rate": 2.4118707389410474e-05, "loss": 0.0073, "step": 20106 }, { "epoch": 4.09, "learning_rate": 2.4108166491458116e-05, "loss": 0.0027, "step": 20107 }, { "epoch": 4.09, "learning_rate": 2.4097627696137008e-05, "loss": 0.0049, "step": 20108 }, { "epoch": 4.09, "learning_rate": 2.4087091003623177e-05, "loss": 0.0006, "step": 20109 }, { "epoch": 4.09, "learning_rate": 2.40765564140926e-05, "loss": 0.0065, "step": 20110 }, { "epoch": 4.09, "learning_rate": 2.4066023927721275e-05, "loss": 0.0038, "step": 20111 }, { "epoch": 4.1, "learning_rate": 2.4055493544684985e-05, "loss": 0.0042, "step": 20112 }, { "epoch": 4.1, "learning_rate": 2.4044965265159726e-05, "loss": 0.0002, "step": 20113 }, { "epoch": 4.1, "learning_rate": 2.403443908932131e-05, "loss": 0.0036, "step": 20114 }, { "epoch": 4.1, "learning_rate": 2.402391501734553e-05, "loss": 0.0003, "step": 20115 }, { "epoch": 4.1, "learning_rate": 2.4013393049408208e-05, "loss": 0.0005, "step": 20116 }, { "epoch": 4.1, "learning_rate": 2.4002873185684973e-05, "loss": 0.0019, "step": 20117 }, { "epoch": 4.1, "learning_rate": 2.399235542635165e-05, "loss": 0.0049, "step": 20118 }, { "epoch": 4.1, "learning_rate": 2.3981839771583834e-05, "loss": 0.0003, "step": 20119 }, { "epoch": 4.1, "learning_rate": 2.3971326221557147e-05, "loss": 0.0003, "step": 20120 }, { "epoch": 4.1, "learning_rate": 2.396081477644722e-05, "loss": 0.0009, "step": 20121 }, { "epoch": 4.1, "learning_rate": 2.395030543642959e-05, "loss": 0.0013, "step": 20122 }, { "epoch": 4.1, "learning_rate": 2.3939798201679804e-05, "loss": 0.0001, "step": 20123 }, { "epoch": 4.1, "learning_rate": 2.392929307237334e-05, "loss": 0.0015, "step": 20124 }, { "epoch": 4.1, "learning_rate": 2.391879004868567e-05, "loss": 0.0007, "step": 20125 }, { "epoch": 4.1, "learning_rate": 2.390828913079219e-05, "loss": 0.0029, "step": 20126 }, { "epoch": 4.1, "learning_rate": 2.3897790318868293e-05, "loss": 0.0011, "step": 20127 }, { "epoch": 4.1, "learning_rate": 2.3887293613089337e-05, "loss": 0.0, "step": 20128 }, { "epoch": 4.1, "learning_rate": 2.3876799013630666e-05, "loss": 0.0014, "step": 20129 }, { "epoch": 4.1, "learning_rate": 2.3866306520667455e-05, "loss": 0.0015, "step": 20130 }, { "epoch": 4.1, "learning_rate": 2.38558161343751e-05, "loss": 0.0001, "step": 20131 }, { "epoch": 4.1, "learning_rate": 2.3845327854928644e-05, "loss": 0.0015, "step": 20132 }, { "epoch": 4.1, "learning_rate": 2.3834841682503424e-05, "loss": 0.0004, "step": 20133 }, { "epoch": 4.1, "learning_rate": 2.3824357617274475e-05, "loss": 0.0002, "step": 20134 }, { "epoch": 4.1, "learning_rate": 2.381387565941692e-05, "loss": 0.0019, "step": 20135 }, { "epoch": 4.1, "learning_rate": 2.380339580910582e-05, "loss": 0.0001, "step": 20136 }, { "epoch": 4.1, "learning_rate": 2.37929180665162e-05, "loss": 0.0039, "step": 20137 }, { "epoch": 4.1, "learning_rate": 2.3782442431823152e-05, "loss": 0.0013, "step": 20138 }, { "epoch": 4.1, "learning_rate": 2.3771968905201537e-05, "loss": 0.0002, "step": 20139 }, { "epoch": 4.1, "learning_rate": 2.376149748682632e-05, "loss": 0.001, "step": 20140 }, { "epoch": 4.1, "learning_rate": 2.3751028176872372e-05, "loss": 0.001, "step": 20141 }, { "epoch": 4.1, "learning_rate": 2.3740560975514606e-05, "loss": 0.002, "step": 20142 }, { "epoch": 4.1, "learning_rate": 2.373009588292773e-05, "loss": 0.0004, "step": 20143 }, { "epoch": 4.1, "learning_rate": 2.371963289928664e-05, "loss": 0.0002, "step": 20144 }, { "epoch": 4.1, "learning_rate": 2.3709172024766044e-05, "loss": 0.0018, "step": 20145 }, { "epoch": 4.1, "learning_rate": 2.3698713259540686e-05, "loss": 0.0024, "step": 20146 }, { "epoch": 4.1, "learning_rate": 2.3688256603785245e-05, "loss": 0.0001, "step": 20147 }, { "epoch": 4.1, "learning_rate": 2.3677802057674295e-05, "loss": 0.0001, "step": 20148 }, { "epoch": 4.1, "learning_rate": 2.3667349621382547e-05, "loss": 0.0048, "step": 20149 }, { "epoch": 4.1, "learning_rate": 2.365689929508448e-05, "loss": 0.0045, "step": 20150 }, { "epoch": 4.1, "learning_rate": 2.3646451078954754e-05, "loss": 0.0007, "step": 20151 }, { "epoch": 4.1, "learning_rate": 2.363600497316776e-05, "loss": 0.0022, "step": 20152 }, { "epoch": 4.1, "learning_rate": 2.3625560977898013e-05, "loss": 0.0023, "step": 20153 }, { "epoch": 4.1, "learning_rate": 2.361511909331995e-05, "loss": 0.009, "step": 20154 }, { "epoch": 4.1, "learning_rate": 2.3604679319607954e-05, "loss": 0.0063, "step": 20155 }, { "epoch": 4.1, "learning_rate": 2.359424165693642e-05, "loss": 0.002, "step": 20156 }, { "epoch": 4.1, "learning_rate": 2.3583806105479653e-05, "loss": 0.0027, "step": 20157 }, { "epoch": 4.1, "learning_rate": 2.357337266541195e-05, "loss": 0.0032, "step": 20158 }, { "epoch": 4.1, "learning_rate": 2.356294133690757e-05, "loss": 0.0024, "step": 20159 }, { "epoch": 4.1, "learning_rate": 2.3552512120140725e-05, "loss": 0.0001, "step": 20160 }, { "epoch": 4.11, "learning_rate": 2.3542085015285626e-05, "loss": 0.0057, "step": 20161 }, { "epoch": 4.11, "learning_rate": 2.353166002251645e-05, "loss": 0.0048, "step": 20162 }, { "epoch": 4.11, "learning_rate": 2.352123714200721e-05, "loss": 0.0045, "step": 20163 }, { "epoch": 4.11, "learning_rate": 2.351081637393213e-05, "loss": 0.0036, "step": 20164 }, { "epoch": 4.11, "learning_rate": 2.3500397718465087e-05, "loss": 0.0049, "step": 20165 }, { "epoch": 4.11, "learning_rate": 2.3489981175780243e-05, "loss": 0.0002, "step": 20166 }, { "epoch": 4.11, "learning_rate": 2.347956674605154e-05, "loss": 0.0045, "step": 20167 }, { "epoch": 4.11, "learning_rate": 2.3469154429452846e-05, "loss": 0.0002, "step": 20168 }, { "epoch": 4.11, "learning_rate": 2.3458744226158166e-05, "loss": 0.0001, "step": 20169 }, { "epoch": 4.11, "learning_rate": 2.3448336136341295e-05, "loss": 0.0001, "step": 20170 }, { "epoch": 4.11, "learning_rate": 2.3437930160176095e-05, "loss": 0.0003, "step": 20171 }, { "epoch": 4.11, "learning_rate": 2.3427526297836374e-05, "loss": 0.0006, "step": 20172 }, { "epoch": 4.11, "learning_rate": 2.3417124549495862e-05, "loss": 0.0137, "step": 20173 }, { "epoch": 4.11, "learning_rate": 2.340672491532834e-05, "loss": 0.0035, "step": 20174 }, { "epoch": 4.11, "learning_rate": 2.3396327395507448e-05, "loss": 0.0016, "step": 20175 }, { "epoch": 4.11, "learning_rate": 2.338593199020688e-05, "loss": 0.0019, "step": 20176 }, { "epoch": 4.11, "learning_rate": 2.337553869960025e-05, "loss": 0.0021, "step": 20177 }, { "epoch": 4.11, "learning_rate": 2.336514752386115e-05, "loss": 0.0033, "step": 20178 }, { "epoch": 4.11, "learning_rate": 2.3354758463163108e-05, "loss": 0.0002, "step": 20179 }, { "epoch": 4.11, "learning_rate": 2.334437151767972e-05, "loss": 0.0044, "step": 20180 }, { "epoch": 4.11, "learning_rate": 2.3333986687584317e-05, "loss": 0.0063, "step": 20181 }, { "epoch": 4.11, "learning_rate": 2.332360397305052e-05, "loss": 0.0017, "step": 20182 }, { "epoch": 4.11, "learning_rate": 2.3313223374251576e-05, "loss": 0.0014, "step": 20183 }, { "epoch": 4.11, "learning_rate": 2.3302844891361018e-05, "loss": 0.0, "step": 20184 }, { "epoch": 4.11, "learning_rate": 2.3292468524552048e-05, "loss": 0.001, "step": 20185 }, { "epoch": 4.11, "learning_rate": 2.3282094273998054e-05, "loss": 0.0023, "step": 20186 }, { "epoch": 4.11, "learning_rate": 2.327172213987229e-05, "loss": 0.008, "step": 20187 }, { "epoch": 4.11, "learning_rate": 2.326135212234797e-05, "loss": 0.0015, "step": 20188 }, { "epoch": 4.11, "learning_rate": 2.3250984221598308e-05, "loss": 0.0013, "step": 20189 }, { "epoch": 4.11, "learning_rate": 2.324061843779646e-05, "loss": 0.0006, "step": 20190 }, { "epoch": 4.11, "learning_rate": 2.3230254771115557e-05, "loss": 0.0051, "step": 20191 }, { "epoch": 4.11, "learning_rate": 2.3219893221728697e-05, "loss": 0.0007, "step": 20192 }, { "epoch": 4.11, "learning_rate": 2.3209533789808986e-05, "loss": 0.0023, "step": 20193 }, { "epoch": 4.11, "learning_rate": 2.319917647552931e-05, "loss": 0.0006, "step": 20194 }, { "epoch": 4.11, "learning_rate": 2.3188821279062802e-05, "loss": 0.0017, "step": 20195 }, { "epoch": 4.11, "learning_rate": 2.3178468200582302e-05, "loss": 0.0018, "step": 20196 }, { "epoch": 4.11, "learning_rate": 2.3168117240260796e-05, "loss": 0.0055, "step": 20197 }, { "epoch": 4.11, "learning_rate": 2.3157768398271188e-05, "loss": 0.0002, "step": 20198 }, { "epoch": 4.11, "learning_rate": 2.3147421674786197e-05, "loss": 0.0005, "step": 20199 }, { "epoch": 4.11, "learning_rate": 2.3137077069978792e-05, "loss": 0.0001, "step": 20200 }, { "epoch": 4.11, "learning_rate": 2.3126734584021617e-05, "loss": 0.0045, "step": 20201 }, { "epoch": 4.11, "learning_rate": 2.3116394217087515e-05, "loss": 0.0049, "step": 20202 }, { "epoch": 4.11, "learning_rate": 2.3106055969349112e-05, "loss": 0.0018, "step": 20203 }, { "epoch": 4.11, "learning_rate": 2.3095719840979093e-05, "loss": 0.0007, "step": 20204 }, { "epoch": 4.11, "learning_rate": 2.3085385832150117e-05, "loss": 0.0012, "step": 20205 }, { "epoch": 4.11, "learning_rate": 2.307505394303476e-05, "loss": 0.0009, "step": 20206 }, { "epoch": 4.11, "learning_rate": 2.306472417380559e-05, "loss": 0.0005, "step": 20207 }, { "epoch": 4.11, "learning_rate": 2.3054396524635128e-05, "loss": 0.0003, "step": 20208 }, { "epoch": 4.11, "learning_rate": 2.3044070995695872e-05, "loss": 0.0002, "step": 20209 }, { "epoch": 4.12, "learning_rate": 2.3033747587160272e-05, "loss": 0.0054, "step": 20210 }, { "epoch": 4.12, "learning_rate": 2.302342629920077e-05, "loss": 0.0006, "step": 20211 }, { "epoch": 4.12, "learning_rate": 2.301310713198971e-05, "loss": 0.003, "step": 20212 }, { "epoch": 4.12, "learning_rate": 2.3002790085699523e-05, "loss": 0.0002, "step": 20213 }, { "epoch": 4.12, "learning_rate": 2.2992475160502388e-05, "loss": 0.003, "step": 20214 }, { "epoch": 4.12, "learning_rate": 2.298216235657073e-05, "loss": 0.0017, "step": 20215 }, { "epoch": 4.12, "learning_rate": 2.2971851674076685e-05, "loss": 0.0033, "step": 20216 }, { "epoch": 4.12, "learning_rate": 2.296154311319251e-05, "loss": 0.0006, "step": 20217 }, { "epoch": 4.12, "learning_rate": 2.2951236674090368e-05, "loss": 0.0004, "step": 20218 }, { "epoch": 4.12, "learning_rate": 2.2940932356942354e-05, "loss": 0.0008, "step": 20219 }, { "epoch": 4.12, "learning_rate": 2.293063016192068e-05, "loss": 0.0025, "step": 20220 }, { "epoch": 4.12, "learning_rate": 2.2920330089197296e-05, "loss": 0.0039, "step": 20221 }, { "epoch": 4.12, "learning_rate": 2.2910032138944296e-05, "loss": 0.0005, "step": 20222 }, { "epoch": 4.12, "learning_rate": 2.2899736311333653e-05, "loss": 0.0026, "step": 20223 }, { "epoch": 4.12, "learning_rate": 2.288944260653734e-05, "loss": 0.0002, "step": 20224 }, { "epoch": 4.12, "learning_rate": 2.287915102472726e-05, "loss": 0.002, "step": 20225 }, { "epoch": 4.12, "learning_rate": 2.2868861566075365e-05, "loss": 0.0013, "step": 20226 }, { "epoch": 4.12, "learning_rate": 2.2858574230753378e-05, "loss": 0.0026, "step": 20227 }, { "epoch": 4.12, "learning_rate": 2.2848289018933236e-05, "loss": 0.0017, "step": 20228 }, { "epoch": 4.12, "learning_rate": 2.2838005930786678e-05, "loss": 0.0012, "step": 20229 }, { "epoch": 4.12, "learning_rate": 2.282772496648547e-05, "loss": 0.0003, "step": 20230 }, { "epoch": 4.12, "learning_rate": 2.2817446126201345e-05, "loss": 0.0004, "step": 20231 }, { "epoch": 4.12, "learning_rate": 2.2807169410105858e-05, "loss": 0.003, "step": 20232 }, { "epoch": 4.12, "learning_rate": 2.2796894818370808e-05, "loss": 0.0001, "step": 20233 }, { "epoch": 4.12, "learning_rate": 2.278662235116766e-05, "loss": 0.01, "step": 20234 }, { "epoch": 4.12, "learning_rate": 2.2776352008668125e-05, "loss": 0.0023, "step": 20235 }, { "epoch": 4.12, "learning_rate": 2.276608379104363e-05, "loss": 0.0007, "step": 20236 }, { "epoch": 4.12, "learning_rate": 2.2755817698465713e-05, "loss": 0.0031, "step": 20237 }, { "epoch": 4.12, "learning_rate": 2.274555373110581e-05, "loss": 0.0024, "step": 20238 }, { "epoch": 4.12, "learning_rate": 2.273529188913539e-05, "loss": 0.0015, "step": 20239 }, { "epoch": 4.12, "learning_rate": 2.272503217272581e-05, "loss": 0.002, "step": 20240 }, { "epoch": 4.12, "learning_rate": 2.271477458204844e-05, "loss": 0.0025, "step": 20241 }, { "epoch": 4.12, "learning_rate": 2.2704519117274606e-05, "loss": 0.0005, "step": 20242 }, { "epoch": 4.12, "learning_rate": 2.2694265778575604e-05, "loss": 0.0026, "step": 20243 }, { "epoch": 4.12, "learning_rate": 2.2684014566122683e-05, "loss": 0.0001, "step": 20244 }, { "epoch": 4.12, "learning_rate": 2.2673765480086986e-05, "loss": 0.0005, "step": 20245 }, { "epoch": 4.12, "learning_rate": 2.266351852063983e-05, "loss": 0.0058, "step": 20246 }, { "epoch": 4.12, "learning_rate": 2.265327368795219e-05, "loss": 0.0012, "step": 20247 }, { "epoch": 4.12, "learning_rate": 2.264303098219535e-05, "loss": 0.0006, "step": 20248 }, { "epoch": 4.12, "learning_rate": 2.2632790403540252e-05, "loss": 0.0011, "step": 20249 }, { "epoch": 4.12, "learning_rate": 2.2622551952157947e-05, "loss": 0.0005, "step": 20250 }, { "epoch": 4.12, "learning_rate": 2.261231562821953e-05, "loss": 0.0002, "step": 20251 }, { "epoch": 4.12, "learning_rate": 2.260208143189583e-05, "loss": 0.0009, "step": 20252 }, { "epoch": 4.12, "learning_rate": 2.2591849363357927e-05, "loss": 0.0001, "step": 20253 }, { "epoch": 4.12, "learning_rate": 2.2581619422776603e-05, "loss": 0.0003, "step": 20254 }, { "epoch": 4.12, "learning_rate": 2.257139161032277e-05, "loss": 0.0037, "step": 20255 }, { "epoch": 4.12, "learning_rate": 2.2561165926167208e-05, "loss": 0.001, "step": 20256 }, { "epoch": 4.12, "learning_rate": 2.2550942370480745e-05, "loss": 0.0044, "step": 20257 }, { "epoch": 4.12, "learning_rate": 2.2540720943434133e-05, "loss": 0.0014, "step": 20258 }, { "epoch": 4.13, "learning_rate": 2.2530501645198064e-05, "loss": 0.0027, "step": 20259 }, { "epoch": 4.13, "learning_rate": 2.2520284475943234e-05, "loss": 0.0014, "step": 20260 }, { "epoch": 4.13, "learning_rate": 2.2510069435840293e-05, "loss": 0.0005, "step": 20261 }, { "epoch": 4.13, "learning_rate": 2.2499856525059838e-05, "loss": 0.0004, "step": 20262 }, { "epoch": 4.13, "learning_rate": 2.2489645743772467e-05, "loss": 0.0005, "step": 20263 }, { "epoch": 4.13, "learning_rate": 2.2479437092148723e-05, "loss": 0.0007, "step": 20264 }, { "epoch": 4.13, "learning_rate": 2.2469230570359037e-05, "loss": 0.0014, "step": 20265 }, { "epoch": 4.13, "learning_rate": 2.245902617857399e-05, "loss": 0.0062, "step": 20266 }, { "epoch": 4.13, "learning_rate": 2.244882391696393e-05, "loss": 0.0013, "step": 20267 }, { "epoch": 4.13, "learning_rate": 2.2438623785699273e-05, "loss": 0.001, "step": 20268 }, { "epoch": 4.13, "learning_rate": 2.2428425784950394e-05, "loss": 0.0031, "step": 20269 }, { "epoch": 4.13, "learning_rate": 2.241822991488761e-05, "loss": 0.0002, "step": 20270 }, { "epoch": 4.13, "learning_rate": 2.2408036175681214e-05, "loss": 0.0002, "step": 20271 }, { "epoch": 4.13, "learning_rate": 2.2397844567501478e-05, "loss": 0.0053, "step": 20272 }, { "epoch": 4.13, "learning_rate": 2.2387655090518575e-05, "loss": 0.0006, "step": 20273 }, { "epoch": 4.13, "learning_rate": 2.237746774490274e-05, "loss": 0.0013, "step": 20274 }, { "epoch": 4.13, "learning_rate": 2.2367282530824082e-05, "loss": 0.0075, "step": 20275 }, { "epoch": 4.13, "learning_rate": 2.2357099448452738e-05, "loss": 0.0022, "step": 20276 }, { "epoch": 4.13, "learning_rate": 2.2346918497958815e-05, "loss": 0.0042, "step": 20277 }, { "epoch": 4.13, "learning_rate": 2.2336739679512232e-05, "loss": 0.0007, "step": 20278 }, { "epoch": 4.13, "learning_rate": 2.2326562993283154e-05, "loss": 0.0005, "step": 20279 }, { "epoch": 4.13, "learning_rate": 2.2316388439441407e-05, "loss": 0.0001, "step": 20280 }, { "epoch": 4.13, "learning_rate": 2.2306216018157026e-05, "loss": 0.0021, "step": 20281 }, { "epoch": 4.13, "learning_rate": 2.229604572959992e-05, "loss": 0.0032, "step": 20282 }, { "epoch": 4.13, "learning_rate": 2.2285877573939825e-05, "loss": 0.0015, "step": 20283 }, { "epoch": 4.13, "learning_rate": 2.2275711551346736e-05, "loss": 0.0007, "step": 20284 }, { "epoch": 4.13, "learning_rate": 2.2265547661990286e-05, "loss": 0.004, "step": 20285 }, { "epoch": 4.13, "learning_rate": 2.225538590604037e-05, "loss": 0.0018, "step": 20286 }, { "epoch": 4.13, "learning_rate": 2.22452262836666e-05, "loss": 0.003, "step": 20287 }, { "epoch": 4.13, "learning_rate": 2.223506879503873e-05, "loss": 0.0004, "step": 20288 }, { "epoch": 4.13, "learning_rate": 2.222491344032637e-05, "loss": 0.002, "step": 20289 }, { "epoch": 4.13, "learning_rate": 2.221476021969915e-05, "loss": 0.0037, "step": 20290 }, { "epoch": 4.13, "learning_rate": 2.220460913332664e-05, "loss": 0.0002, "step": 20291 }, { "epoch": 4.13, "learning_rate": 2.2194460181378397e-05, "loss": 0.0003, "step": 20292 }, { "epoch": 4.13, "learning_rate": 2.2184313364023925e-05, "loss": 0.0002, "step": 20293 }, { "epoch": 4.13, "learning_rate": 2.217416868143267e-05, "loss": 0.0013, "step": 20294 }, { "epoch": 4.13, "learning_rate": 2.2164026133774144e-05, "loss": 0.0004, "step": 20295 }, { "epoch": 4.13, "learning_rate": 2.2153885721217594e-05, "loss": 0.0007, "step": 20296 }, { "epoch": 4.13, "learning_rate": 2.2143747443932574e-05, "loss": 0.0016, "step": 20297 }, { "epoch": 4.13, "learning_rate": 2.2133611302088227e-05, "loss": 0.0015, "step": 20298 }, { "epoch": 4.13, "learning_rate": 2.212347729585402e-05, "loss": 0.0013, "step": 20299 }, { "epoch": 4.13, "learning_rate": 2.2113345425399083e-05, "loss": 0.0011, "step": 20300 }, { "epoch": 4.13, "learning_rate": 2.210321569089268e-05, "loss": 0.0001, "step": 20301 }, { "epoch": 4.13, "learning_rate": 2.2093088092504008e-05, "loss": 0.0149, "step": 20302 }, { "epoch": 4.13, "learning_rate": 2.2082962630402168e-05, "loss": 0.0085, "step": 20303 }, { "epoch": 4.13, "learning_rate": 2.2072839304756373e-05, "loss": 0.0016, "step": 20304 }, { "epoch": 4.13, "learning_rate": 2.2062718115735604e-05, "loss": 0.0038, "step": 20305 }, { "epoch": 4.13, "learning_rate": 2.2052599063508962e-05, "loss": 0.0003, "step": 20306 }, { "epoch": 4.13, "learning_rate": 2.204248214824541e-05, "loss": 0.0003, "step": 20307 }, { "epoch": 4.14, "learning_rate": 2.2032367370113963e-05, "loss": 0.0003, "step": 20308 }, { "epoch": 4.14, "learning_rate": 2.2022254729283518e-05, "loss": 0.0028, "step": 20309 }, { "epoch": 4.14, "learning_rate": 2.2012144225923005e-05, "loss": 0.0021, "step": 20310 }, { "epoch": 4.14, "learning_rate": 2.2002035860201277e-05, "loss": 0.0008, "step": 20311 }, { "epoch": 4.14, "learning_rate": 2.1991929632287166e-05, "loss": 0.0006, "step": 20312 }, { "epoch": 4.14, "learning_rate": 2.1981825542349462e-05, "loss": 0.0014, "step": 20313 }, { "epoch": 4.14, "learning_rate": 2.1971723590556922e-05, "loss": 0.0027, "step": 20314 }, { "epoch": 4.14, "learning_rate": 2.196162377707829e-05, "loss": 0.001, "step": 20315 }, { "epoch": 4.14, "learning_rate": 2.1951526102082184e-05, "loss": 0.0038, "step": 20316 }, { "epoch": 4.14, "learning_rate": 2.194143056573735e-05, "loss": 0.0089, "step": 20317 }, { "epoch": 4.14, "learning_rate": 2.1931337168212336e-05, "loss": 0.001, "step": 20318 }, { "epoch": 4.14, "learning_rate": 2.192124590967573e-05, "loss": 0.0002, "step": 20319 }, { "epoch": 4.14, "learning_rate": 2.1911156790296086e-05, "loss": 0.003, "step": 20320 }, { "epoch": 4.14, "learning_rate": 2.1901069810241896e-05, "loss": 0.0051, "step": 20321 }, { "epoch": 4.14, "learning_rate": 2.189098496968165e-05, "loss": 0.0028, "step": 20322 }, { "epoch": 4.14, "learning_rate": 2.188090226878379e-05, "loss": 0.0004, "step": 20323 }, { "epoch": 4.14, "learning_rate": 2.187082170771669e-05, "loss": 0.0001, "step": 20324 }, { "epoch": 4.14, "learning_rate": 2.1860743286648736e-05, "loss": 0.0013, "step": 20325 }, { "epoch": 4.14, "learning_rate": 2.185066700574824e-05, "loss": 0.0007, "step": 20326 }, { "epoch": 4.14, "learning_rate": 2.1840592865183522e-05, "loss": 0.0011, "step": 20327 }, { "epoch": 4.14, "learning_rate": 2.1830520865122842e-05, "loss": 0.0019, "step": 20328 }, { "epoch": 4.14, "learning_rate": 2.1820451005734337e-05, "loss": 0.0043, "step": 20329 }, { "epoch": 4.14, "learning_rate": 2.1810383287186318e-05, "loss": 0.0005, "step": 20330 }, { "epoch": 4.14, "learning_rate": 2.1800317709646804e-05, "loss": 0.0004, "step": 20331 }, { "epoch": 4.14, "learning_rate": 2.179025427328406e-05, "loss": 0.0001, "step": 20332 }, { "epoch": 4.14, "learning_rate": 2.1780192978266032e-05, "loss": 0.0043, "step": 20333 }, { "epoch": 4.14, "learning_rate": 2.177013382476079e-05, "loss": 0.0041, "step": 20334 }, { "epoch": 4.14, "learning_rate": 2.176007681293643e-05, "loss": 0.0019, "step": 20335 }, { "epoch": 4.14, "learning_rate": 2.175002194296078e-05, "loss": 0.0003, "step": 20336 }, { "epoch": 4.14, "learning_rate": 2.1739969215001933e-05, "loss": 0.0026, "step": 20337 }, { "epoch": 4.14, "learning_rate": 2.1729918629227667e-05, "loss": 0.0013, "step": 20338 }, { "epoch": 4.14, "learning_rate": 2.1719870185805892e-05, "loss": 0.0113, "step": 20339 }, { "epoch": 4.14, "learning_rate": 2.170982388490443e-05, "loss": 0.0007, "step": 20340 }, { "epoch": 4.14, "learning_rate": 2.1699779726691064e-05, "loss": 0.0001, "step": 20341 }, { "epoch": 4.14, "learning_rate": 2.168973771133357e-05, "loss": 0.0028, "step": 20342 }, { "epoch": 4.14, "learning_rate": 2.1679697838999653e-05, "loss": 0.0002, "step": 20343 }, { "epoch": 4.14, "learning_rate": 2.1669660109857013e-05, "loss": 0.0002, "step": 20344 }, { "epoch": 4.14, "learning_rate": 2.1659624524073295e-05, "loss": 0.0002, "step": 20345 }, { "epoch": 4.14, "learning_rate": 2.164959108181613e-05, "loss": 0.0035, "step": 20346 }, { "epoch": 4.14, "learning_rate": 2.1639559783253006e-05, "loss": 0.0003, "step": 20347 }, { "epoch": 4.14, "learning_rate": 2.162953062855159e-05, "loss": 0.0001, "step": 20348 }, { "epoch": 4.14, "learning_rate": 2.1619503617879276e-05, "loss": 0.0002, "step": 20349 }, { "epoch": 4.14, "learning_rate": 2.1609478751403646e-05, "loss": 0.0035, "step": 20350 }, { "epoch": 4.14, "learning_rate": 2.159945602929204e-05, "loss": 0.0017, "step": 20351 }, { "epoch": 4.14, "learning_rate": 2.15894354517119e-05, "loss": 0.0019, "step": 20352 }, { "epoch": 4.14, "learning_rate": 2.157941701883058e-05, "loss": 0.0039, "step": 20353 }, { "epoch": 4.14, "learning_rate": 2.1569400730815396e-05, "loss": 0.0015, "step": 20354 }, { "epoch": 4.14, "learning_rate": 2.155938658783366e-05, "loss": 0.0072, "step": 20355 }, { "epoch": 4.14, "learning_rate": 2.154937459005261e-05, "loss": 0.0014, "step": 20356 }, { "epoch": 4.15, "learning_rate": 2.1539364737639476e-05, "loss": 0.0006, "step": 20357 }, { "epoch": 4.15, "learning_rate": 2.152935703076144e-05, "loss": 0.0007, "step": 20358 }, { "epoch": 4.15, "learning_rate": 2.151935146958564e-05, "loss": 0.0011, "step": 20359 }, { "epoch": 4.15, "learning_rate": 2.15093480542792e-05, "loss": 0.0028, "step": 20360 }, { "epoch": 4.15, "learning_rate": 2.149934678500923e-05, "loss": 0.0017, "step": 20361 }, { "epoch": 4.15, "learning_rate": 2.1489347661942658e-05, "loss": 0.0001, "step": 20362 }, { "epoch": 4.15, "learning_rate": 2.147935068524658e-05, "loss": 0.0011, "step": 20363 }, { "epoch": 4.15, "learning_rate": 2.1469355855088005e-05, "loss": 0.0003, "step": 20364 }, { "epoch": 4.15, "learning_rate": 2.1459363171633726e-05, "loss": 0.0012, "step": 20365 }, { "epoch": 4.15, "learning_rate": 2.1449372635050777e-05, "loss": 0.0012, "step": 20366 }, { "epoch": 4.15, "learning_rate": 2.143938424550591e-05, "loss": 0.0024, "step": 20367 }, { "epoch": 4.15, "learning_rate": 2.1429398003166053e-05, "loss": 0.0002, "step": 20368 }, { "epoch": 4.15, "learning_rate": 2.141941390819793e-05, "loss": 0.002, "step": 20369 }, { "epoch": 4.15, "learning_rate": 2.1409431960768303e-05, "loss": 0.0004, "step": 20370 }, { "epoch": 4.15, "learning_rate": 2.1399452161043873e-05, "loss": 0.0008, "step": 20371 }, { "epoch": 4.15, "learning_rate": 2.1389474509191374e-05, "loss": 0.0084, "step": 20372 }, { "epoch": 4.15, "learning_rate": 2.1379499005377404e-05, "loss": 0.0018, "step": 20373 }, { "epoch": 4.15, "learning_rate": 2.136952564976858e-05, "loss": 0.002, "step": 20374 }, { "epoch": 4.15, "learning_rate": 2.135955444253149e-05, "loss": 0.0005, "step": 20375 }, { "epoch": 4.15, "learning_rate": 2.134958538383268e-05, "loss": 0.0002, "step": 20376 }, { "epoch": 4.15, "learning_rate": 2.133961847383863e-05, "loss": 0.009, "step": 20377 }, { "epoch": 4.15, "learning_rate": 2.1329653712715817e-05, "loss": 0.0025, "step": 20378 }, { "epoch": 4.15, "learning_rate": 2.13196911006307e-05, "loss": 0.0021, "step": 20379 }, { "epoch": 4.15, "learning_rate": 2.1309730637749577e-05, "loss": 0.0032, "step": 20380 }, { "epoch": 4.15, "learning_rate": 2.129977232423894e-05, "loss": 0.0009, "step": 20381 }, { "epoch": 4.15, "learning_rate": 2.1289816160264984e-05, "loss": 0.0001, "step": 20382 }, { "epoch": 4.15, "learning_rate": 2.127986214599411e-05, "loss": 0.0002, "step": 20383 }, { "epoch": 4.15, "learning_rate": 2.1269910281592483e-05, "loss": 0.0068, "step": 20384 }, { "epoch": 4.15, "learning_rate": 2.1259960567226357e-05, "loss": 0.0036, "step": 20385 }, { "epoch": 4.15, "learning_rate": 2.12500130030619e-05, "loss": 0.0007, "step": 20386 }, { "epoch": 4.15, "learning_rate": 2.1240067589265226e-05, "loss": 0.0038, "step": 20387 }, { "epoch": 4.15, "learning_rate": 2.1230124326002535e-05, "loss": 0.0023, "step": 20388 }, { "epoch": 4.15, "learning_rate": 2.122018321343981e-05, "loss": 0.0008, "step": 20389 }, { "epoch": 4.15, "learning_rate": 2.1210244251743124e-05, "loss": 0.0028, "step": 20390 }, { "epoch": 4.15, "learning_rate": 2.120030744107846e-05, "loss": 0.0014, "step": 20391 }, { "epoch": 4.15, "learning_rate": 2.1190372781611825e-05, "loss": 0.0075, "step": 20392 }, { "epoch": 4.15, "learning_rate": 2.118044027350903e-05, "loss": 0.0004, "step": 20393 }, { "epoch": 4.15, "learning_rate": 2.117050991693609e-05, "loss": 0.0001, "step": 20394 }, { "epoch": 4.15, "learning_rate": 2.1160581712058823e-05, "loss": 0.0079, "step": 20395 }, { "epoch": 4.15, "learning_rate": 2.1150655659043025e-05, "loss": 0.0046, "step": 20396 }, { "epoch": 4.15, "learning_rate": 2.1140731758054552e-05, "loss": 0.0002, "step": 20397 }, { "epoch": 4.15, "learning_rate": 2.113081000925902e-05, "loss": 0.0002, "step": 20398 }, { "epoch": 4.15, "learning_rate": 2.112089041282228e-05, "loss": 0.0023, "step": 20399 }, { "epoch": 4.15, "learning_rate": 2.1110972968909877e-05, "loss": 0.0042, "step": 20400 }, { "epoch": 4.15, "learning_rate": 2.1101057677687604e-05, "loss": 0.0002, "step": 20401 }, { "epoch": 4.15, "learning_rate": 2.1091144539320944e-05, "loss": 0.0005, "step": 20402 }, { "epoch": 4.15, "learning_rate": 2.108123355397549e-05, "loss": 0.005, "step": 20403 }, { "epoch": 4.15, "learning_rate": 2.10713247218168e-05, "loss": 0.0024, "step": 20404 }, { "epoch": 4.15, "learning_rate": 2.106141804301036e-05, "loss": 0.0009, "step": 20405 }, { "epoch": 4.16, "learning_rate": 2.1051513517721613e-05, "loss": 0.0026, "step": 20406 }, { "epoch": 4.16, "learning_rate": 2.1041611146116018e-05, "loss": 0.0009, "step": 20407 }, { "epoch": 4.16, "learning_rate": 2.103171092835892e-05, "loss": 0.0005, "step": 20408 }, { "epoch": 4.16, "learning_rate": 2.1021812864615707e-05, "loss": 0.0025, "step": 20409 }, { "epoch": 4.16, "learning_rate": 2.1011916955051693e-05, "loss": 0.0057, "step": 20410 }, { "epoch": 4.16, "learning_rate": 2.1002023199832134e-05, "loss": 0.0007, "step": 20411 }, { "epoch": 4.16, "learning_rate": 2.0992131599122314e-05, "loss": 0.003, "step": 20412 }, { "epoch": 4.16, "learning_rate": 2.0982242153087363e-05, "loss": 0.0005, "step": 20413 }, { "epoch": 4.16, "learning_rate": 2.0972354861892572e-05, "loss": 0.0035, "step": 20414 }, { "epoch": 4.16, "learning_rate": 2.0962469725702985e-05, "loss": 0.0035, "step": 20415 }, { "epoch": 4.16, "learning_rate": 2.0952586744683674e-05, "loss": 0.0047, "step": 20416 }, { "epoch": 4.16, "learning_rate": 2.094270591899984e-05, "loss": 0.0002, "step": 20417 }, { "epoch": 4.16, "learning_rate": 2.093282724881637e-05, "loss": 0.0023, "step": 20418 }, { "epoch": 4.16, "learning_rate": 2.0922950734298377e-05, "loss": 0.0008, "step": 20419 }, { "epoch": 4.16, "learning_rate": 2.0913076375610715e-05, "loss": 0.001, "step": 20420 }, { "epoch": 4.16, "learning_rate": 2.0903204172918352e-05, "loss": 0.003, "step": 20421 }, { "epoch": 4.16, "learning_rate": 2.0893334126386174e-05, "loss": 0.0023, "step": 20422 }, { "epoch": 4.16, "learning_rate": 2.0883466236179014e-05, "loss": 0.0003, "step": 20423 }, { "epoch": 4.16, "learning_rate": 2.087360050246169e-05, "loss": 0.0004, "step": 20424 }, { "epoch": 4.16, "learning_rate": 2.086373692539899e-05, "loss": 0.0016, "step": 20425 }, { "epoch": 4.16, "learning_rate": 2.0853875505155642e-05, "loss": 0.0022, "step": 20426 }, { "epoch": 4.16, "learning_rate": 2.084401624189634e-05, "loss": 0.0041, "step": 20427 }, { "epoch": 4.16, "learning_rate": 2.0834159135785777e-05, "loss": 0.0053, "step": 20428 }, { "epoch": 4.16, "learning_rate": 2.082430418698858e-05, "loss": 0.0001, "step": 20429 }, { "epoch": 4.16, "learning_rate": 2.0814451395669372e-05, "loss": 0.0016, "step": 20430 }, { "epoch": 4.16, "learning_rate": 2.0804600761992602e-05, "loss": 0.0018, "step": 20431 }, { "epoch": 4.16, "learning_rate": 2.079475228612296e-05, "loss": 0.0002, "step": 20432 }, { "epoch": 4.16, "learning_rate": 2.0784905968224756e-05, "loss": 0.0005, "step": 20433 }, { "epoch": 4.16, "learning_rate": 2.077506180846262e-05, "loss": 0.0007, "step": 20434 }, { "epoch": 4.16, "learning_rate": 2.0765219807000843e-05, "loss": 0.0001, "step": 20435 }, { "epoch": 4.16, "learning_rate": 2.0755379964003837e-05, "loss": 0.0027, "step": 20436 }, { "epoch": 4.16, "learning_rate": 2.074554227963596e-05, "loss": 0.0037, "step": 20437 }, { "epoch": 4.16, "learning_rate": 2.0735706754061505e-05, "loss": 0.0054, "step": 20438 }, { "epoch": 4.16, "learning_rate": 2.0725873387444746e-05, "loss": 0.0103, "step": 20439 }, { "epoch": 4.16, "learning_rate": 2.0716042179949938e-05, "loss": 0.0003, "step": 20440 }, { "epoch": 4.16, "learning_rate": 2.0706213131741244e-05, "loss": 0.0003, "step": 20441 }, { "epoch": 4.16, "learning_rate": 2.0696386242982872e-05, "loss": 0.002, "step": 20442 }, { "epoch": 4.16, "learning_rate": 2.068656151383895e-05, "loss": 0.0002, "step": 20443 }, { "epoch": 4.16, "learning_rate": 2.0676738944473485e-05, "loss": 0.0059, "step": 20444 }, { "epoch": 4.16, "learning_rate": 2.0666918535050665e-05, "loss": 0.0012, "step": 20445 }, { "epoch": 4.16, "learning_rate": 2.0657100285734367e-05, "loss": 0.0026, "step": 20446 }, { "epoch": 4.16, "learning_rate": 2.0647284196688685e-05, "loss": 0.004, "step": 20447 }, { "epoch": 4.16, "learning_rate": 2.063747026807755e-05, "loss": 0.0014, "step": 20448 }, { "epoch": 4.16, "learning_rate": 2.0627658500064797e-05, "loss": 0.0005, "step": 20449 }, { "epoch": 4.16, "learning_rate": 2.0617848892814416e-05, "loss": 0.0001, "step": 20450 }, { "epoch": 4.16, "learning_rate": 2.0608041446490103e-05, "loss": 0.0035, "step": 20451 }, { "epoch": 4.16, "learning_rate": 2.0598236161255833e-05, "loss": 0.0007, "step": 20452 }, { "epoch": 4.16, "learning_rate": 2.0588433037275238e-05, "loss": 0.0035, "step": 20453 }, { "epoch": 4.16, "learning_rate": 2.0578632074712088e-05, "loss": 0.0033, "step": 20454 }, { "epoch": 4.17, "learning_rate": 2.0568833273730083e-05, "loss": 0.0029, "step": 20455 }, { "epoch": 4.17, "learning_rate": 2.05590366344929e-05, "loss": 0.0001, "step": 20456 }, { "epoch": 4.17, "learning_rate": 2.0549242157164115e-05, "loss": 0.002, "step": 20457 }, { "epoch": 4.17, "learning_rate": 2.0539449841907367e-05, "loss": 0.0037, "step": 20458 }, { "epoch": 4.17, "learning_rate": 2.0529659688886162e-05, "loss": 0.0009, "step": 20459 }, { "epoch": 4.17, "learning_rate": 2.0519871698264035e-05, "loss": 0.0022, "step": 20460 }, { "epoch": 4.17, "learning_rate": 2.0510085870204466e-05, "loss": 0.0027, "step": 20461 }, { "epoch": 4.17, "learning_rate": 2.05003022048709e-05, "loss": 0.0006, "step": 20462 }, { "epoch": 4.17, "learning_rate": 2.049052070242675e-05, "loss": 0.0024, "step": 20463 }, { "epoch": 4.17, "learning_rate": 2.048074136303532e-05, "loss": 0.0015, "step": 20464 }, { "epoch": 4.17, "learning_rate": 2.047096418686006e-05, "loss": 0.0016, "step": 20465 }, { "epoch": 4.17, "learning_rate": 2.0461189174064163e-05, "loss": 0.0042, "step": 20466 }, { "epoch": 4.17, "learning_rate": 2.0451416324810927e-05, "loss": 0.001, "step": 20467 }, { "epoch": 4.17, "learning_rate": 2.0441645639263586e-05, "loss": 0.0003, "step": 20468 }, { "epoch": 4.17, "learning_rate": 2.0431877117585284e-05, "loss": 0.0005, "step": 20469 }, { "epoch": 4.17, "learning_rate": 2.042211075993928e-05, "loss": 0.0001, "step": 20470 }, { "epoch": 4.17, "learning_rate": 2.0412346566488585e-05, "loss": 0.0086, "step": 20471 }, { "epoch": 4.17, "learning_rate": 2.0402584537396316e-05, "loss": 0.001, "step": 20472 }, { "epoch": 4.17, "learning_rate": 2.039282467282551e-05, "loss": 0.0019, "step": 20473 }, { "epoch": 4.17, "learning_rate": 2.03830669729392e-05, "loss": 0.0019, "step": 20474 }, { "epoch": 4.17, "learning_rate": 2.0373311437900323e-05, "loss": 0.0022, "step": 20475 }, { "epoch": 4.17, "learning_rate": 2.0363558067871853e-05, "loss": 0.0003, "step": 20476 }, { "epoch": 4.17, "learning_rate": 2.0353806863016657e-05, "loss": 0.0026, "step": 20477 }, { "epoch": 4.17, "learning_rate": 2.0344057823497604e-05, "loss": 0.0004, "step": 20478 }, { "epoch": 4.17, "learning_rate": 2.033431094947755e-05, "loss": 0.0031, "step": 20479 }, { "epoch": 4.17, "learning_rate": 2.0324566241119244e-05, "loss": 0.0047, "step": 20480 }, { "epoch": 4.17, "learning_rate": 2.0314823698585507e-05, "loss": 0.0001, "step": 20481 }, { "epoch": 4.17, "learning_rate": 2.0305083322038928e-05, "loss": 0.0006, "step": 20482 }, { "epoch": 4.17, "learning_rate": 2.029534511164236e-05, "loss": 0.0035, "step": 20483 }, { "epoch": 4.17, "learning_rate": 2.02856090675583e-05, "loss": 0.0068, "step": 20484 }, { "epoch": 4.17, "learning_rate": 2.0275875189949475e-05, "loss": 0.0001, "step": 20485 }, { "epoch": 4.17, "learning_rate": 2.0266143478978368e-05, "loss": 0.0018, "step": 20486 }, { "epoch": 4.17, "learning_rate": 2.025641393480757e-05, "loss": 0.0035, "step": 20487 }, { "epoch": 4.17, "learning_rate": 2.0246686557599562e-05, "loss": 0.0019, "step": 20488 }, { "epoch": 4.17, "learning_rate": 2.0236961347516818e-05, "loss": 0.0004, "step": 20489 }, { "epoch": 4.17, "learning_rate": 2.0227238304721755e-05, "loss": 0.0014, "step": 20490 }, { "epoch": 4.17, "learning_rate": 2.0217517429376777e-05, "loss": 0.0011, "step": 20491 }, { "epoch": 4.17, "learning_rate": 2.0207798721644242e-05, "loss": 0.0004, "step": 20492 }, { "epoch": 4.17, "learning_rate": 2.019808218168648e-05, "loss": 0.0002, "step": 20493 }, { "epoch": 4.17, "learning_rate": 2.0188367809665785e-05, "loss": 0.0012, "step": 20494 }, { "epoch": 4.17, "learning_rate": 2.017865560574432e-05, "loss": 0.0006, "step": 20495 }, { "epoch": 4.17, "learning_rate": 2.0168945570084428e-05, "loss": 0.0009, "step": 20496 }, { "epoch": 4.17, "learning_rate": 2.015923770284816e-05, "loss": 0.0013, "step": 20497 }, { "epoch": 4.17, "learning_rate": 2.0149532004197765e-05, "loss": 0.0004, "step": 20498 }, { "epoch": 4.17, "learning_rate": 2.0139828474295272e-05, "loss": 0.0005, "step": 20499 }, { "epoch": 4.17, "learning_rate": 2.0130127113302745e-05, "loss": 0.0015, "step": 20500 }, { "epoch": 4.17, "learning_rate": 2.0120427921382293e-05, "loss": 0.0002, "step": 20501 }, { "epoch": 4.17, "learning_rate": 2.0110730898695813e-05, "loss": 0.0002, "step": 20502 }, { "epoch": 4.17, "learning_rate": 2.0101036045405365e-05, "loss": 0.002, "step": 20503 }, { "epoch": 4.18, "learning_rate": 2.0091343361672785e-05, "loss": 0.0062, "step": 20504 }, { "epoch": 4.18, "learning_rate": 2.008165284765999e-05, "loss": 0.0014, "step": 20505 }, { "epoch": 4.18, "learning_rate": 2.007196450352882e-05, "loss": 0.0007, "step": 20506 }, { "epoch": 4.18, "learning_rate": 2.006227832944111e-05, "loss": 0.0028, "step": 20507 }, { "epoch": 4.18, "learning_rate": 2.0052594325558637e-05, "loss": 0.0017, "step": 20508 }, { "epoch": 4.18, "learning_rate": 2.0042912492043113e-05, "loss": 0.0016, "step": 20509 }, { "epoch": 4.18, "learning_rate": 2.003323282905628e-05, "loss": 0.0009, "step": 20510 }, { "epoch": 4.18, "learning_rate": 2.0023555336759774e-05, "loss": 0.0008, "step": 20511 }, { "epoch": 4.18, "learning_rate": 2.001388001531528e-05, "loss": 0.0031, "step": 20512 }, { "epoch": 4.18, "learning_rate": 2.0004206864884292e-05, "loss": 0.0001, "step": 20513 }, { "epoch": 4.18, "learning_rate": 1.9994535885628494e-05, "loss": 0.0016, "step": 20514 }, { "epoch": 4.18, "learning_rate": 1.9984867077709288e-05, "loss": 0.0031, "step": 20515 }, { "epoch": 4.18, "learning_rate": 1.997520044128828e-05, "loss": 0.0002, "step": 20516 }, { "epoch": 4.18, "learning_rate": 1.9965535976526842e-05, "loss": 0.0001, "step": 20517 }, { "epoch": 4.18, "learning_rate": 1.995587368358641e-05, "loss": 0.0005, "step": 20518 }, { "epoch": 4.18, "learning_rate": 1.9946213562628355e-05, "loss": 0.0041, "step": 20519 }, { "epoch": 4.18, "learning_rate": 1.993655561381403e-05, "loss": 0.0025, "step": 20520 }, { "epoch": 4.18, "learning_rate": 1.9926899837304745e-05, "loss": 0.0004, "step": 20521 }, { "epoch": 4.18, "learning_rate": 1.9917246233261763e-05, "loss": 0.0002, "step": 20522 }, { "epoch": 4.18, "learning_rate": 1.990759480184631e-05, "loss": 0.0014, "step": 20523 }, { "epoch": 4.18, "learning_rate": 1.989794554321959e-05, "loss": 0.0003, "step": 20524 }, { "epoch": 4.18, "learning_rate": 1.988829845754277e-05, "loss": 0.0014, "step": 20525 }, { "epoch": 4.18, "learning_rate": 1.9878653544976964e-05, "loss": 0.0062, "step": 20526 }, { "epoch": 4.18, "learning_rate": 1.98690108056833e-05, "loss": 0.0032, "step": 20527 }, { "epoch": 4.18, "learning_rate": 1.9859370239822735e-05, "loss": 0.002, "step": 20528 }, { "epoch": 4.18, "learning_rate": 1.984973184755638e-05, "loss": 0.0003, "step": 20529 }, { "epoch": 4.18, "learning_rate": 1.9840095629045162e-05, "loss": 0.0019, "step": 20530 }, { "epoch": 4.18, "learning_rate": 1.983046158445006e-05, "loss": 0.0004, "step": 20531 }, { "epoch": 4.18, "learning_rate": 1.982082971393199e-05, "loss": 0.0002, "step": 20532 }, { "epoch": 4.18, "learning_rate": 1.9811200017651714e-05, "loss": 0.0029, "step": 20533 }, { "epoch": 4.18, "learning_rate": 1.980157249577023e-05, "loss": 0.0064, "step": 20534 }, { "epoch": 4.18, "learning_rate": 1.979194714844818e-05, "loss": 0.0007, "step": 20535 }, { "epoch": 4.18, "learning_rate": 1.9782323975846463e-05, "loss": 0.0003, "step": 20536 }, { "epoch": 4.18, "learning_rate": 1.977270297812571e-05, "loss": 0.0025, "step": 20537 }, { "epoch": 4.18, "learning_rate": 1.9763084155446636e-05, "loss": 0.0004, "step": 20538 }, { "epoch": 4.18, "learning_rate": 1.9753467507969893e-05, "loss": 0.0048, "step": 20539 }, { "epoch": 4.18, "learning_rate": 1.974385303585611e-05, "loss": 0.0001, "step": 20540 }, { "epoch": 4.18, "learning_rate": 1.9734240739265837e-05, "loss": 0.0003, "step": 20541 }, { "epoch": 4.18, "learning_rate": 1.9724630618359665e-05, "loss": 0.0015, "step": 20542 }, { "epoch": 4.18, "learning_rate": 1.9715022673298047e-05, "loss": 0.0001, "step": 20543 }, { "epoch": 4.18, "learning_rate": 1.9705416904241505e-05, "loss": 0.0025, "step": 20544 }, { "epoch": 4.18, "learning_rate": 1.969581331135046e-05, "loss": 0.0015, "step": 20545 }, { "epoch": 4.18, "learning_rate": 1.9686211894785254e-05, "loss": 0.0006, "step": 20546 }, { "epoch": 4.18, "learning_rate": 1.9676612654706354e-05, "loss": 0.0008, "step": 20547 }, { "epoch": 4.18, "learning_rate": 1.966701559127395e-05, "loss": 0.0022, "step": 20548 }, { "epoch": 4.18, "learning_rate": 1.965742070464848e-05, "loss": 0.0007, "step": 20549 }, { "epoch": 4.18, "learning_rate": 1.9647827994990083e-05, "loss": 0.0017, "step": 20550 }, { "epoch": 4.18, "learning_rate": 1.9638237462459016e-05, "loss": 0.0011, "step": 20551 }, { "epoch": 4.18, "learning_rate": 1.9628649107215466e-05, "loss": 0.0011, "step": 20552 }, { "epoch": 4.18, "learning_rate": 1.961906292941954e-05, "loss": 0.0019, "step": 20553 }, { "epoch": 4.19, "learning_rate": 1.9609478929231436e-05, "loss": 0.0002, "step": 20554 }, { "epoch": 4.19, "learning_rate": 1.959989710681112e-05, "loss": 0.0038, "step": 20555 }, { "epoch": 4.19, "learning_rate": 1.9590317462318688e-05, "loss": 0.0019, "step": 20556 }, { "epoch": 4.19, "learning_rate": 1.9580739995914103e-05, "loss": 0.0004, "step": 20557 }, { "epoch": 4.19, "learning_rate": 1.9571164707757347e-05, "loss": 0.0024, "step": 20558 }, { "epoch": 4.19, "learning_rate": 1.956159159800835e-05, "loss": 0.0013, "step": 20559 }, { "epoch": 4.19, "learning_rate": 1.955202066682699e-05, "loss": 0.0, "step": 20560 }, { "epoch": 4.19, "learning_rate": 1.954245191437313e-05, "loss": 0.0003, "step": 20561 }, { "epoch": 4.19, "learning_rate": 1.9532885340806576e-05, "loss": 0.0014, "step": 20562 }, { "epoch": 4.19, "learning_rate": 1.952332094628713e-05, "loss": 0.001, "step": 20563 }, { "epoch": 4.19, "learning_rate": 1.9513758730974466e-05, "loss": 0.0001, "step": 20564 }, { "epoch": 4.19, "learning_rate": 1.9504198695028406e-05, "loss": 0.0022, "step": 20565 }, { "epoch": 4.19, "learning_rate": 1.949464083860847e-05, "loss": 0.01, "step": 20566 }, { "epoch": 4.19, "learning_rate": 1.948508516187447e-05, "loss": 0.0013, "step": 20567 }, { "epoch": 4.19, "learning_rate": 1.9475531664985873e-05, "loss": 0.0006, "step": 20568 }, { "epoch": 4.19, "learning_rate": 1.9465980348102266e-05, "loss": 0.0026, "step": 20569 }, { "epoch": 4.19, "learning_rate": 1.945643121138321e-05, "loss": 0.0061, "step": 20570 }, { "epoch": 4.19, "learning_rate": 1.944688425498816e-05, "loss": 0.0001, "step": 20571 }, { "epoch": 4.19, "learning_rate": 1.9437339479076568e-05, "loss": 0.0002, "step": 20572 }, { "epoch": 4.19, "learning_rate": 1.942779688380788e-05, "loss": 0.0002, "step": 20573 }, { "epoch": 4.19, "learning_rate": 1.9418256469341444e-05, "loss": 0.0001, "step": 20574 }, { "epoch": 4.19, "learning_rate": 1.9408718235836617e-05, "loss": 0.0001, "step": 20575 }, { "epoch": 4.19, "learning_rate": 1.939918218345271e-05, "loss": 0.003, "step": 20576 }, { "epoch": 4.19, "learning_rate": 1.9389648312348976e-05, "loss": 0.0001, "step": 20577 }, { "epoch": 4.19, "learning_rate": 1.9380116622684706e-05, "loss": 0.0006, "step": 20578 }, { "epoch": 4.19, "learning_rate": 1.9370587114618986e-05, "loss": 0.0218, "step": 20579 }, { "epoch": 4.19, "learning_rate": 1.936105978831109e-05, "loss": 0.0002, "step": 20580 }, { "epoch": 4.19, "learning_rate": 1.9351534643920043e-05, "loss": 0.0006, "step": 20581 }, { "epoch": 4.19, "learning_rate": 1.9342011681605013e-05, "loss": 0.0021, "step": 20582 }, { "epoch": 4.19, "learning_rate": 1.933249090152506e-05, "loss": 0.0024, "step": 20583 }, { "epoch": 4.19, "learning_rate": 1.932297230383909e-05, "loss": 0.0005, "step": 20584 }, { "epoch": 4.19, "learning_rate": 1.9313455888706207e-05, "loss": 0.004, "step": 20585 }, { "epoch": 4.19, "learning_rate": 1.9303941656285287e-05, "loss": 0.0033, "step": 20586 }, { "epoch": 4.19, "learning_rate": 1.9294429606735235e-05, "loss": 0.0022, "step": 20587 }, { "epoch": 4.19, "learning_rate": 1.9284919740214938e-05, "loss": 0.0044, "step": 20588 }, { "epoch": 4.19, "learning_rate": 1.927541205688322e-05, "loss": 0.003, "step": 20589 }, { "epoch": 4.19, "learning_rate": 1.9265906556898892e-05, "loss": 0.0018, "step": 20590 }, { "epoch": 4.19, "learning_rate": 1.9256403240420686e-05, "loss": 0.0016, "step": 20591 }, { "epoch": 4.19, "learning_rate": 1.924690210760735e-05, "loss": 0.0007, "step": 20592 }, { "epoch": 4.19, "learning_rate": 1.9237403158617566e-05, "loss": 0.0024, "step": 20593 }, { "epoch": 4.19, "learning_rate": 1.9227906393609975e-05, "loss": 0.0018, "step": 20594 }, { "epoch": 4.19, "learning_rate": 1.9218411812743206e-05, "loss": 0.0043, "step": 20595 }, { "epoch": 4.19, "learning_rate": 1.9208919416175846e-05, "loss": 0.0005, "step": 20596 }, { "epoch": 4.19, "learning_rate": 1.919942920406636e-05, "loss": 0.0013, "step": 20597 }, { "epoch": 4.19, "learning_rate": 1.918994117657337e-05, "loss": 0.0014, "step": 20598 }, { "epoch": 4.19, "learning_rate": 1.918045533385522e-05, "loss": 0.0008, "step": 20599 }, { "epoch": 4.19, "learning_rate": 1.917097167607049e-05, "loss": 0.0004, "step": 20600 }, { "epoch": 4.19, "learning_rate": 1.9161490203377434e-05, "loss": 0.0012, "step": 20601 }, { "epoch": 4.19, "learning_rate": 1.9152010915934473e-05, "loss": 0.0009, "step": 20602 }, { "epoch": 4.2, "learning_rate": 1.9142533813899917e-05, "loss": 0.0075, "step": 20603 }, { "epoch": 4.2, "learning_rate": 1.9133058897432075e-05, "loss": 0.001, "step": 20604 }, { "epoch": 4.2, "learning_rate": 1.9123586166689165e-05, "loss": 0.002, "step": 20605 }, { "epoch": 4.2, "learning_rate": 1.9114115621829412e-05, "loss": 0.0018, "step": 20606 }, { "epoch": 4.2, "learning_rate": 1.910464726301101e-05, "loss": 0.0001, "step": 20607 }, { "epoch": 4.2, "learning_rate": 1.9095181090392057e-05, "loss": 0.0025, "step": 20608 }, { "epoch": 4.2, "learning_rate": 1.908571710413069e-05, "loss": 0.0002, "step": 20609 }, { "epoch": 4.2, "learning_rate": 1.9076255304384968e-05, "loss": 0.0014, "step": 20610 }, { "epoch": 4.2, "learning_rate": 1.906679569131294e-05, "loss": 0.0061, "step": 20611 }, { "epoch": 4.2, "learning_rate": 1.905733826507253e-05, "loss": 0.0065, "step": 20612 }, { "epoch": 4.2, "learning_rate": 1.9047883025821774e-05, "loss": 0.0017, "step": 20613 }, { "epoch": 4.2, "learning_rate": 1.9038429973718583e-05, "loss": 0.0002, "step": 20614 }, { "epoch": 4.2, "learning_rate": 1.9028979108920762e-05, "loss": 0.0007, "step": 20615 }, { "epoch": 4.2, "learning_rate": 1.9019530431586267e-05, "loss": 0.0012, "step": 20616 }, { "epoch": 4.2, "learning_rate": 1.9010083941872807e-05, "loss": 0.0001, "step": 20617 }, { "epoch": 4.2, "learning_rate": 1.900063963993827e-05, "loss": 0.0013, "step": 20618 }, { "epoch": 4.2, "learning_rate": 1.8991197525940284e-05, "loss": 0.0003, "step": 20619 }, { "epoch": 4.2, "learning_rate": 1.8981757600036602e-05, "loss": 0.0009, "step": 20620 }, { "epoch": 4.2, "learning_rate": 1.8972319862384884e-05, "loss": 0.0016, "step": 20621 }, { "epoch": 4.2, "learning_rate": 1.896288431314277e-05, "loss": 0.0001, "step": 20622 }, { "epoch": 4.2, "learning_rate": 1.8953450952467814e-05, "loss": 0.0002, "step": 20623 }, { "epoch": 4.2, "learning_rate": 1.894401978051761e-05, "loss": 0.0075, "step": 20624 }, { "epoch": 4.2, "learning_rate": 1.893459079744965e-05, "loss": 0.0052, "step": 20625 }, { "epoch": 4.2, "learning_rate": 1.892516400342144e-05, "loss": 0.004, "step": 20626 }, { "epoch": 4.2, "learning_rate": 1.8915739398590418e-05, "loss": 0.0003, "step": 20627 }, { "epoch": 4.2, "learning_rate": 1.8906316983113963e-05, "loss": 0.0053, "step": 20628 }, { "epoch": 4.2, "learning_rate": 1.8896896757149525e-05, "loss": 0.0002, "step": 20629 }, { "epoch": 4.2, "learning_rate": 1.8887478720854303e-05, "loss": 0.0058, "step": 20630 }, { "epoch": 4.2, "learning_rate": 1.887806287438577e-05, "loss": 0.0024, "step": 20631 }, { "epoch": 4.2, "learning_rate": 1.886864921790101e-05, "loss": 0.0004, "step": 20632 }, { "epoch": 4.2, "learning_rate": 1.8859237751557404e-05, "loss": 0.0003, "step": 20633 }, { "epoch": 4.2, "learning_rate": 1.8849828475512042e-05, "loss": 0.0001, "step": 20634 }, { "epoch": 4.2, "learning_rate": 1.8840421389922077e-05, "loss": 0.0006, "step": 20635 }, { "epoch": 4.2, "learning_rate": 1.8831016494944723e-05, "loss": 0.0001, "step": 20636 }, { "epoch": 4.2, "learning_rate": 1.8821613790736968e-05, "loss": 0.0011, "step": 20637 }, { "epoch": 4.2, "learning_rate": 1.881221327745587e-05, "loss": 0.0073, "step": 20638 }, { "epoch": 4.2, "learning_rate": 1.8802814955258432e-05, "loss": 0.0004, "step": 20639 }, { "epoch": 4.2, "learning_rate": 1.8793418824301654e-05, "loss": 0.002, "step": 20640 }, { "epoch": 4.2, "learning_rate": 1.8784024884742455e-05, "loss": 0.0016, "step": 20641 }, { "epoch": 4.2, "learning_rate": 1.877463313673771e-05, "loss": 0.0056, "step": 20642 }, { "epoch": 4.2, "learning_rate": 1.876524358044431e-05, "loss": 0.0012, "step": 20643 }, { "epoch": 4.2, "learning_rate": 1.8755856216019067e-05, "loss": 0.0015, "step": 20644 }, { "epoch": 4.2, "learning_rate": 1.874647104361875e-05, "loss": 0.0009, "step": 20645 }, { "epoch": 4.2, "learning_rate": 1.8737088063400136e-05, "loss": 0.0001, "step": 20646 }, { "epoch": 4.2, "learning_rate": 1.8727707275519966e-05, "loss": 0.0001, "step": 20647 }, { "epoch": 4.2, "learning_rate": 1.8718328680134815e-05, "loss": 0.0046, "step": 20648 }, { "epoch": 4.2, "learning_rate": 1.870895227740144e-05, "loss": 0.0009, "step": 20649 }, { "epoch": 4.2, "learning_rate": 1.8699578067476335e-05, "loss": 0.001, "step": 20650 }, { "epoch": 4.2, "learning_rate": 1.8690206050516187e-05, "loss": 0.0024, "step": 20651 }, { "epoch": 4.21, "learning_rate": 1.8680836226677425e-05, "loss": 0.0008, "step": 20652 }, { "epoch": 4.21, "learning_rate": 1.8671468596116572e-05, "loss": 0.0009, "step": 20653 }, { "epoch": 4.21, "learning_rate": 1.8662103158990104e-05, "loss": 0.0007, "step": 20654 }, { "epoch": 4.21, "learning_rate": 1.8652739915454444e-05, "loss": 0.0005, "step": 20655 }, { "epoch": 4.21, "learning_rate": 1.8643378865665953e-05, "loss": 0.0002, "step": 20656 }, { "epoch": 4.21, "learning_rate": 1.8634020009780987e-05, "loss": 0.0024, "step": 20657 }, { "epoch": 4.21, "learning_rate": 1.8624663347955853e-05, "loss": 0.003, "step": 20658 }, { "epoch": 4.21, "learning_rate": 1.861530888034683e-05, "loss": 0.0075, "step": 20659 }, { "epoch": 4.21, "learning_rate": 1.8605956607110158e-05, "loss": 0.0018, "step": 20660 }, { "epoch": 4.21, "learning_rate": 1.859660652840204e-05, "loss": 0.0009, "step": 20661 }, { "epoch": 4.21, "learning_rate": 1.858725864437866e-05, "loss": 0.0018, "step": 20662 }, { "epoch": 4.21, "learning_rate": 1.8577912955196056e-05, "loss": 0.0001, "step": 20663 }, { "epoch": 4.21, "learning_rate": 1.856856946101045e-05, "loss": 0.0011, "step": 20664 }, { "epoch": 4.21, "learning_rate": 1.8559228161977792e-05, "loss": 0.0004, "step": 20665 }, { "epoch": 4.21, "learning_rate": 1.8549889058254098e-05, "loss": 0.0018, "step": 20666 }, { "epoch": 4.21, "learning_rate": 1.8540552149995463e-05, "loss": 0.0067, "step": 20667 }, { "epoch": 4.21, "learning_rate": 1.8531217437357683e-05, "loss": 0.0024, "step": 20668 }, { "epoch": 4.21, "learning_rate": 1.852188492049681e-05, "loss": 0.0007, "step": 20669 }, { "epoch": 4.21, "learning_rate": 1.8512554599568606e-05, "loss": 0.0052, "step": 20670 }, { "epoch": 4.21, "learning_rate": 1.8503226474728933e-05, "loss": 0.0019, "step": 20671 }, { "epoch": 4.21, "learning_rate": 1.8493900546133596e-05, "loss": 0.0029, "step": 20672 }, { "epoch": 4.21, "learning_rate": 1.8484576813938367e-05, "loss": 0.0012, "step": 20673 }, { "epoch": 4.21, "learning_rate": 1.8475255278298946e-05, "loss": 0.0003, "step": 20674 }, { "epoch": 4.21, "learning_rate": 1.8465935939371036e-05, "loss": 0.0005, "step": 20675 }, { "epoch": 4.21, "learning_rate": 1.8456618797310278e-05, "loss": 0.0019, "step": 20676 }, { "epoch": 4.21, "learning_rate": 1.8447303852272304e-05, "loss": 0.0001, "step": 20677 }, { "epoch": 4.21, "learning_rate": 1.8437991104412668e-05, "loss": 0.0019, "step": 20678 }, { "epoch": 4.21, "learning_rate": 1.8428680553886934e-05, "loss": 0.0021, "step": 20679 }, { "epoch": 4.21, "learning_rate": 1.841937220085062e-05, "loss": 0.0018, "step": 20680 }, { "epoch": 4.21, "learning_rate": 1.8410066045459088e-05, "loss": 0.0034, "step": 20681 }, { "epoch": 4.21, "learning_rate": 1.8400762087867933e-05, "loss": 0.0005, "step": 20682 }, { "epoch": 4.21, "learning_rate": 1.8391460328232378e-05, "loss": 0.0014, "step": 20683 }, { "epoch": 4.21, "learning_rate": 1.8382160766707948e-05, "loss": 0.0001, "step": 20684 }, { "epoch": 4.21, "learning_rate": 1.8372863403449823e-05, "loss": 0.0007, "step": 20685 }, { "epoch": 4.21, "learning_rate": 1.8363568238613356e-05, "loss": 0.0035, "step": 20686 }, { "epoch": 4.21, "learning_rate": 1.8354275272353798e-05, "loss": 0.0028, "step": 20687 }, { "epoch": 4.21, "learning_rate": 1.8344984504826315e-05, "loss": 0.0011, "step": 20688 }, { "epoch": 4.21, "learning_rate": 1.8335695936186124e-05, "loss": 0.0022, "step": 20689 }, { "epoch": 4.21, "learning_rate": 1.8326409566588347e-05, "loss": 0.003, "step": 20690 }, { "epoch": 4.21, "learning_rate": 1.831712539618806e-05, "loss": 0.0002, "step": 20691 }, { "epoch": 4.21, "learning_rate": 1.8307843425140373e-05, "loss": 0.0013, "step": 20692 }, { "epoch": 4.21, "learning_rate": 1.8298563653600295e-05, "loss": 0.0003, "step": 20693 }, { "epoch": 4.21, "learning_rate": 1.8289286081722772e-05, "loss": 0.0007, "step": 20694 }, { "epoch": 4.21, "learning_rate": 1.8280010709662806e-05, "loss": 0.0001, "step": 20695 }, { "epoch": 4.21, "learning_rate": 1.8270737537575297e-05, "loss": 0.0015, "step": 20696 }, { "epoch": 4.21, "learning_rate": 1.8261466565615136e-05, "loss": 0.0013, "step": 20697 }, { "epoch": 4.21, "learning_rate": 1.8252197793937195e-05, "loss": 0.0002, "step": 20698 }, { "epoch": 4.21, "learning_rate": 1.8242931222696172e-05, "loss": 0.0005, "step": 20699 }, { "epoch": 4.21, "learning_rate": 1.8233666852046974e-05, "loss": 0.0001, "step": 20700 }, { "epoch": 4.22, "learning_rate": 1.8224404682144193e-05, "loss": 0.0002, "step": 20701 }, { "epoch": 4.22, "learning_rate": 1.8215144713142678e-05, "loss": 0.0003, "step": 20702 }, { "epoch": 4.22, "learning_rate": 1.8205886945196964e-05, "loss": 0.0006, "step": 20703 }, { "epoch": 4.22, "learning_rate": 1.8196631378461713e-05, "loss": 0.0061, "step": 20704 }, { "epoch": 4.22, "learning_rate": 1.818737801309152e-05, "loss": 0.0001, "step": 20705 }, { "epoch": 4.22, "learning_rate": 1.8178126849240927e-05, "loss": 0.0007, "step": 20706 }, { "epoch": 4.22, "learning_rate": 1.816887788706444e-05, "loss": 0.0042, "step": 20707 }, { "epoch": 4.22, "learning_rate": 1.8159631126716562e-05, "loss": 0.0022, "step": 20708 }, { "epoch": 4.22, "learning_rate": 1.8150386568351694e-05, "loss": 0.0015, "step": 20709 }, { "epoch": 4.22, "learning_rate": 1.8141144212124265e-05, "loss": 0.0011, "step": 20710 }, { "epoch": 4.22, "learning_rate": 1.8131904058188652e-05, "loss": 0.0002, "step": 20711 }, { "epoch": 4.22, "learning_rate": 1.8122666106699096e-05, "loss": 0.0002, "step": 20712 }, { "epoch": 4.22, "learning_rate": 1.811343035781001e-05, "loss": 0.0012, "step": 20713 }, { "epoch": 4.22, "learning_rate": 1.8104196811675537e-05, "loss": 0.0033, "step": 20714 }, { "epoch": 4.22, "learning_rate": 1.809496546845002e-05, "loss": 0.0018, "step": 20715 }, { "epoch": 4.22, "learning_rate": 1.8085736328287514e-05, "loss": 0.0008, "step": 20716 }, { "epoch": 4.22, "learning_rate": 1.8076509391342236e-05, "loss": 0.0038, "step": 20717 }, { "epoch": 4.22, "learning_rate": 1.8067284657768262e-05, "loss": 0.0018, "step": 20718 }, { "epoch": 4.22, "learning_rate": 1.8058062127719648e-05, "loss": 0.0041, "step": 20719 }, { "epoch": 4.22, "learning_rate": 1.8048841801350524e-05, "loss": 0.0024, "step": 20720 }, { "epoch": 4.22, "learning_rate": 1.803962367881478e-05, "loss": 0.0007, "step": 20721 }, { "epoch": 4.22, "learning_rate": 1.8030407760266414e-05, "loss": 0.0035, "step": 20722 }, { "epoch": 4.22, "learning_rate": 1.802119404585935e-05, "loss": 0.0004, "step": 20723 }, { "epoch": 4.22, "learning_rate": 1.8011982535747465e-05, "loss": 0.0006, "step": 20724 }, { "epoch": 4.22, "learning_rate": 1.800277323008462e-05, "loss": 0.0001, "step": 20725 }, { "epoch": 4.22, "learning_rate": 1.799356612902463e-05, "loss": 0.0016, "step": 20726 }, { "epoch": 4.22, "learning_rate": 1.7984361232721262e-05, "loss": 0.0026, "step": 20727 }, { "epoch": 4.22, "learning_rate": 1.7975158541328266e-05, "loss": 0.0025, "step": 20728 }, { "epoch": 4.22, "learning_rate": 1.7965958054999336e-05, "loss": 0.0025, "step": 20729 }, { "epoch": 4.22, "learning_rate": 1.795675977388813e-05, "loss": 0.0002, "step": 20730 }, { "epoch": 4.22, "learning_rate": 1.794756369814831e-05, "loss": 0.0015, "step": 20731 }, { "epoch": 4.22, "learning_rate": 1.79383698279334e-05, "loss": 0.0001, "step": 20732 }, { "epoch": 4.22, "learning_rate": 1.792917816339705e-05, "loss": 0.0012, "step": 20733 }, { "epoch": 4.22, "learning_rate": 1.791998870469265e-05, "loss": 0.0017, "step": 20734 }, { "epoch": 4.22, "learning_rate": 1.7910801451973844e-05, "loss": 0.0007, "step": 20735 }, { "epoch": 4.22, "learning_rate": 1.790161640539394e-05, "loss": 0.0013, "step": 20736 }, { "epoch": 4.22, "learning_rate": 1.7892433565106408e-05, "loss": 0.0003, "step": 20737 }, { "epoch": 4.22, "learning_rate": 1.7883252931264598e-05, "loss": 0.0002, "step": 20738 }, { "epoch": 4.22, "learning_rate": 1.7874074504021857e-05, "loss": 0.0005, "step": 20739 }, { "epoch": 4.22, "learning_rate": 1.7864898283531482e-05, "loss": 0.0047, "step": 20740 }, { "epoch": 4.22, "learning_rate": 1.7855724269946715e-05, "loss": 0.0003, "step": 20741 }, { "epoch": 4.22, "learning_rate": 1.78465524634208e-05, "loss": 0.0018, "step": 20742 }, { "epoch": 4.22, "learning_rate": 1.7837382864106913e-05, "loss": 0.0017, "step": 20743 }, { "epoch": 4.22, "learning_rate": 1.7828215472158253e-05, "loss": 0.0079, "step": 20744 }, { "epoch": 4.22, "learning_rate": 1.781905028772781e-05, "loss": 0.0053, "step": 20745 }, { "epoch": 4.22, "learning_rate": 1.7809887310968795e-05, "loss": 0.0112, "step": 20746 }, { "epoch": 4.22, "learning_rate": 1.780072654203414e-05, "loss": 0.0006, "step": 20747 }, { "epoch": 4.22, "learning_rate": 1.7791567981076915e-05, "loss": 0.0011, "step": 20748 }, { "epoch": 4.22, "learning_rate": 1.7782411628250088e-05, "loss": 0.0037, "step": 20749 }, { "epoch": 4.23, "learning_rate": 1.7773257483706517e-05, "loss": 0.0004, "step": 20750 }, { "epoch": 4.23, "learning_rate": 1.776410554759921e-05, "loss": 0.0003, "step": 20751 }, { "epoch": 4.23, "learning_rate": 1.7754955820080886e-05, "loss": 0.0016, "step": 20752 }, { "epoch": 4.23, "learning_rate": 1.774580830130448e-05, "loss": 0.0018, "step": 20753 }, { "epoch": 4.23, "learning_rate": 1.7736662991422712e-05, "loss": 0.0005, "step": 20754 }, { "epoch": 4.23, "learning_rate": 1.772751989058832e-05, "loss": 0.0011, "step": 20755 }, { "epoch": 4.23, "learning_rate": 1.7718378998954035e-05, "loss": 0.0012, "step": 20756 }, { "epoch": 4.23, "learning_rate": 1.770924031667252e-05, "loss": 0.0005, "step": 20757 }, { "epoch": 4.23, "learning_rate": 1.7700103843896413e-05, "loss": 0.0001, "step": 20758 }, { "epoch": 4.23, "learning_rate": 1.7690969580778297e-05, "loss": 0.0022, "step": 20759 }, { "epoch": 4.23, "learning_rate": 1.7681837527470732e-05, "loss": 0.0037, "step": 20760 }, { "epoch": 4.23, "learning_rate": 1.7672707684126265e-05, "loss": 0.0097, "step": 20761 }, { "epoch": 4.23, "learning_rate": 1.7663580050897387e-05, "loss": 0.0002, "step": 20762 }, { "epoch": 4.23, "learning_rate": 1.7654454627936477e-05, "loss": 0.0031, "step": 20763 }, { "epoch": 4.23, "learning_rate": 1.764533141539603e-05, "loss": 0.0104, "step": 20764 }, { "epoch": 4.23, "learning_rate": 1.763621041342834e-05, "loss": 0.0011, "step": 20765 }, { "epoch": 4.23, "learning_rate": 1.7627091622185857e-05, "loss": 0.0001, "step": 20766 }, { "epoch": 4.23, "learning_rate": 1.7617975041820786e-05, "loss": 0.0002, "step": 20767 }, { "epoch": 4.23, "learning_rate": 1.7608860672485407e-05, "loss": 0.0014, "step": 20768 }, { "epoch": 4.23, "learning_rate": 1.759974851433197e-05, "loss": 0.0029, "step": 20769 }, { "epoch": 4.23, "learning_rate": 1.7590638567512662e-05, "loss": 0.0023, "step": 20770 }, { "epoch": 4.23, "learning_rate": 1.7581530832179614e-05, "loss": 0.0043, "step": 20771 }, { "epoch": 4.23, "learning_rate": 1.757242530848497e-05, "loss": 0.0024, "step": 20772 }, { "epoch": 4.23, "learning_rate": 1.7563321996580798e-05, "loss": 0.0026, "step": 20773 }, { "epoch": 4.23, "learning_rate": 1.7554220896619137e-05, "loss": 0.0055, "step": 20774 }, { "epoch": 4.23, "learning_rate": 1.7545122008751984e-05, "loss": 0.0043, "step": 20775 }, { "epoch": 4.23, "learning_rate": 1.753602533313133e-05, "loss": 0.0011, "step": 20776 }, { "epoch": 4.23, "learning_rate": 1.7526930869909144e-05, "loss": 0.0042, "step": 20777 }, { "epoch": 4.23, "learning_rate": 1.7517838619237186e-05, "loss": 0.0007, "step": 20778 }, { "epoch": 4.23, "learning_rate": 1.7508748581267444e-05, "loss": 0.0005, "step": 20779 }, { "epoch": 4.23, "learning_rate": 1.749966075615169e-05, "loss": 0.0039, "step": 20780 }, { "epoch": 4.23, "learning_rate": 1.749057514404173e-05, "loss": 0.0057, "step": 20781 }, { "epoch": 4.23, "learning_rate": 1.748149174508931e-05, "loss": 0.0032, "step": 20782 }, { "epoch": 4.23, "learning_rate": 1.747241055944606e-05, "loss": 0.0012, "step": 20783 }, { "epoch": 4.23, "learning_rate": 1.746333158726379e-05, "loss": 0.0004, "step": 20784 }, { "epoch": 4.23, "learning_rate": 1.745425482869403e-05, "loss": 0.0024, "step": 20785 }, { "epoch": 4.23, "learning_rate": 1.7445180283888394e-05, "loss": 0.0014, "step": 20786 }, { "epoch": 4.23, "learning_rate": 1.743610795299849e-05, "loss": 0.0001, "step": 20787 }, { "epoch": 4.23, "learning_rate": 1.74270378361758e-05, "loss": 0.0036, "step": 20788 }, { "epoch": 4.23, "learning_rate": 1.7417969933571834e-05, "loss": 0.0035, "step": 20789 }, { "epoch": 4.23, "learning_rate": 1.7408904245338024e-05, "loss": 0.0034, "step": 20790 }, { "epoch": 4.23, "learning_rate": 1.739984077162581e-05, "loss": 0.0033, "step": 20791 }, { "epoch": 4.23, "learning_rate": 1.7390779512586544e-05, "loss": 0.0007, "step": 20792 }, { "epoch": 4.23, "learning_rate": 1.7381720468371586e-05, "loss": 0.0004, "step": 20793 }, { "epoch": 4.23, "learning_rate": 1.737266363913223e-05, "loss": 0.0026, "step": 20794 }, { "epoch": 4.23, "learning_rate": 1.736360902501977e-05, "loss": 0.0015, "step": 20795 }, { "epoch": 4.23, "learning_rate": 1.7354556626185357e-05, "loss": 0.0, "step": 20796 }, { "epoch": 4.23, "learning_rate": 1.734550644278028e-05, "loss": 0.0022, "step": 20797 }, { "epoch": 4.23, "learning_rate": 1.7336458474955596e-05, "loss": 0.0024, "step": 20798 }, { "epoch": 4.24, "learning_rate": 1.7327412722862538e-05, "loss": 0.0021, "step": 20799 }, { "epoch": 4.24, "learning_rate": 1.731836918665209e-05, "loss": 0.0004, "step": 20800 }, { "epoch": 4.24, "learning_rate": 1.7309327866475336e-05, "loss": 0.0026, "step": 20801 }, { "epoch": 4.24, "learning_rate": 1.7300288762483282e-05, "loss": 0.0015, "step": 20802 }, { "epoch": 4.24, "learning_rate": 1.7291251874826844e-05, "loss": 0.0054, "step": 20803 }, { "epoch": 4.24, "learning_rate": 1.7282217203657083e-05, "loss": 0.0047, "step": 20804 }, { "epoch": 4.24, "learning_rate": 1.727318474912478e-05, "loss": 0.0003, "step": 20805 }, { "epoch": 4.24, "learning_rate": 1.7264154511380845e-05, "loss": 0.0015, "step": 20806 }, { "epoch": 4.24, "learning_rate": 1.7255126490576077e-05, "loss": 0.0031, "step": 20807 }, { "epoch": 4.24, "learning_rate": 1.724610068686127e-05, "loss": 0.0001, "step": 20808 }, { "epoch": 4.24, "learning_rate": 1.723707710038717e-05, "loss": 0.0004, "step": 20809 }, { "epoch": 4.24, "learning_rate": 1.722805573130449e-05, "loss": 0.0001, "step": 20810 }, { "epoch": 4.24, "learning_rate": 1.7219036579763895e-05, "loss": 0.0016, "step": 20811 }, { "epoch": 4.24, "learning_rate": 1.7210019645916045e-05, "loss": 0.001, "step": 20812 }, { "epoch": 4.24, "learning_rate": 1.7201004929911555e-05, "loss": 0.0006, "step": 20813 }, { "epoch": 4.24, "learning_rate": 1.7191992431900903e-05, "loss": 0.0003, "step": 20814 }, { "epoch": 4.24, "learning_rate": 1.7182982152034718e-05, "loss": 0.0004, "step": 20815 }, { "epoch": 4.24, "learning_rate": 1.7173974090463384e-05, "loss": 0.0007, "step": 20816 }, { "epoch": 4.24, "learning_rate": 1.7164968247337475e-05, "loss": 0.0013, "step": 20817 }, { "epoch": 4.24, "learning_rate": 1.7155964622807305e-05, "loss": 0.0004, "step": 20818 }, { "epoch": 4.24, "learning_rate": 1.714696321702329e-05, "loss": 0.0069, "step": 20819 }, { "epoch": 4.24, "learning_rate": 1.7137964030135758e-05, "loss": 0.0007, "step": 20820 }, { "epoch": 4.24, "learning_rate": 1.712896706229504e-05, "loss": 0.0009, "step": 20821 }, { "epoch": 4.24, "learning_rate": 1.7119972313651366e-05, "loss": 0.0008, "step": 20822 }, { "epoch": 4.24, "learning_rate": 1.7110979784354995e-05, "loss": 0.005, "step": 20823 }, { "epoch": 4.24, "learning_rate": 1.7101989474556094e-05, "loss": 0.0001, "step": 20824 }, { "epoch": 4.24, "learning_rate": 1.7093001384404842e-05, "loss": 0.0008, "step": 20825 }, { "epoch": 4.24, "learning_rate": 1.7084015514051352e-05, "loss": 0.0012, "step": 20826 }, { "epoch": 4.24, "learning_rate": 1.707503186364569e-05, "loss": 0.0, "step": 20827 }, { "epoch": 4.24, "learning_rate": 1.7066050433337945e-05, "loss": 0.0002, "step": 20828 }, { "epoch": 4.24, "learning_rate": 1.7057071223278024e-05, "loss": 0.0001, "step": 20829 }, { "epoch": 4.24, "learning_rate": 1.7048094233616017e-05, "loss": 0.0003, "step": 20830 }, { "epoch": 4.24, "learning_rate": 1.7039119464501738e-05, "loss": 0.0023, "step": 20831 }, { "epoch": 4.24, "learning_rate": 1.7030146916085185e-05, "loss": 0.0025, "step": 20832 }, { "epoch": 4.24, "learning_rate": 1.7021176588516205e-05, "loss": 0.0024, "step": 20833 }, { "epoch": 4.24, "learning_rate": 1.7012208481944543e-05, "loss": 0.0032, "step": 20834 }, { "epoch": 4.24, "learning_rate": 1.7003242596520085e-05, "loss": 0.0015, "step": 20835 }, { "epoch": 4.24, "learning_rate": 1.6994278932392487e-05, "loss": 0.001, "step": 20836 }, { "epoch": 4.24, "learning_rate": 1.6985317489711497e-05, "loss": 0.0014, "step": 20837 }, { "epoch": 4.24, "learning_rate": 1.6976358268626783e-05, "loss": 0.0011, "step": 20838 }, { "epoch": 4.24, "learning_rate": 1.6967401269288005e-05, "loss": 0.0006, "step": 20839 }, { "epoch": 4.24, "learning_rate": 1.695844649184473e-05, "loss": 0.0004, "step": 20840 }, { "epoch": 4.24, "learning_rate": 1.6949493936446533e-05, "loss": 0.0007, "step": 20841 }, { "epoch": 4.24, "learning_rate": 1.6940543603242936e-05, "loss": 0.0009, "step": 20842 }, { "epoch": 4.24, "learning_rate": 1.6931595492383426e-05, "loss": 0.0105, "step": 20843 }, { "epoch": 4.24, "learning_rate": 1.6922649604017457e-05, "loss": 0.0007, "step": 20844 }, { "epoch": 4.24, "learning_rate": 1.691370593829446e-05, "loss": 0.0001, "step": 20845 }, { "epoch": 4.24, "learning_rate": 1.6904764495363793e-05, "loss": 0.0007, "step": 20846 }, { "epoch": 4.24, "learning_rate": 1.6895825275374758e-05, "loss": 0.0052, "step": 20847 }, { "epoch": 4.25, "learning_rate": 1.6886888278476735e-05, "loss": 0.0015, "step": 20848 }, { "epoch": 4.25, "learning_rate": 1.6877953504818902e-05, "loss": 0.0022, "step": 20849 }, { "epoch": 4.25, "learning_rate": 1.686902095455058e-05, "loss": 0.0031, "step": 20850 }, { "epoch": 4.25, "learning_rate": 1.686009062782089e-05, "loss": 0.0001, "step": 20851 }, { "epoch": 4.25, "learning_rate": 1.6851162524779e-05, "loss": 0.001, "step": 20852 }, { "epoch": 4.25, "learning_rate": 1.6842236645574026e-05, "loss": 0.0002, "step": 20853 }, { "epoch": 4.25, "learning_rate": 1.6833312990355062e-05, "loss": 0.0001, "step": 20854 }, { "epoch": 4.25, "learning_rate": 1.6824391559271128e-05, "loss": 0.0031, "step": 20855 }, { "epoch": 4.25, "learning_rate": 1.681547235247125e-05, "loss": 0.0031, "step": 20856 }, { "epoch": 4.25, "learning_rate": 1.680655537010439e-05, "loss": 0.0003, "step": 20857 }, { "epoch": 4.25, "learning_rate": 1.6797640612319487e-05, "loss": 0.0043, "step": 20858 }, { "epoch": 4.25, "learning_rate": 1.678872807926543e-05, "loss": 0.0009, "step": 20859 }, { "epoch": 4.25, "learning_rate": 1.677981777109102e-05, "loss": 0.0004, "step": 20860 }, { "epoch": 4.25, "learning_rate": 1.6770909687945188e-05, "loss": 0.0002, "step": 20861 }, { "epoch": 4.25, "learning_rate": 1.6762003829976585e-05, "loss": 0.0013, "step": 20862 }, { "epoch": 4.25, "learning_rate": 1.6753100197334052e-05, "loss": 0.0002, "step": 20863 }, { "epoch": 4.25, "learning_rate": 1.674419879016631e-05, "loss": 0.0003, "step": 20864 }, { "epoch": 4.25, "learning_rate": 1.67352996086219e-05, "loss": 0.0004, "step": 20865 }, { "epoch": 4.25, "learning_rate": 1.6726402652849623e-05, "loss": 0.0031, "step": 20866 }, { "epoch": 4.25, "learning_rate": 1.671750792299793e-05, "loss": 0.0034, "step": 20867 }, { "epoch": 4.25, "learning_rate": 1.67086154192155e-05, "loss": 0.0006, "step": 20868 }, { "epoch": 4.25, "learning_rate": 1.669972514165076e-05, "loss": 0.0008, "step": 20869 }, { "epoch": 4.25, "learning_rate": 1.6690837090452247e-05, "loss": 0.001, "step": 20870 }, { "epoch": 4.25, "learning_rate": 1.668195126576839e-05, "loss": 0.0001, "step": 20871 }, { "epoch": 4.25, "learning_rate": 1.6673067667747603e-05, "loss": 0.0004, "step": 20872 }, { "epoch": 4.25, "learning_rate": 1.666418629653825e-05, "loss": 0.0003, "step": 20873 }, { "epoch": 4.25, "learning_rate": 1.6655307152288683e-05, "loss": 0.0001, "step": 20874 }, { "epoch": 4.25, "learning_rate": 1.6646430235147194e-05, "loss": 0.0003, "step": 20875 }, { "epoch": 4.25, "learning_rate": 1.663755554526204e-05, "loss": 0.0019, "step": 20876 }, { "epoch": 4.25, "learning_rate": 1.662868308278144e-05, "loss": 0.0022, "step": 20877 }, { "epoch": 4.25, "learning_rate": 1.6619812847853603e-05, "loss": 0.0023, "step": 20878 }, { "epoch": 4.25, "learning_rate": 1.6610944840626672e-05, "loss": 0.0002, "step": 20879 }, { "epoch": 4.25, "learning_rate": 1.6602079061248713e-05, "loss": 0.0011, "step": 20880 }, { "epoch": 4.25, "learning_rate": 1.659321550986789e-05, "loss": 0.0008, "step": 20881 }, { "epoch": 4.25, "learning_rate": 1.6584354186632137e-05, "loss": 0.0023, "step": 20882 }, { "epoch": 4.25, "learning_rate": 1.6575495091689565e-05, "loss": 0.0001, "step": 20883 }, { "epoch": 4.25, "learning_rate": 1.656663822518806e-05, "loss": 0.0001, "step": 20884 }, { "epoch": 4.25, "learning_rate": 1.6557783587275535e-05, "loss": 0.0003, "step": 20885 }, { "epoch": 4.25, "learning_rate": 1.654893117809997e-05, "loss": 0.0025, "step": 20886 }, { "epoch": 4.25, "learning_rate": 1.6540080997809135e-05, "loss": 0.0016, "step": 20887 }, { "epoch": 4.25, "learning_rate": 1.6531233046550873e-05, "loss": 0.0005, "step": 20888 }, { "epoch": 4.25, "learning_rate": 1.6522387324472952e-05, "loss": 0.0013, "step": 20889 }, { "epoch": 4.25, "learning_rate": 1.651354383172312e-05, "loss": 0.0106, "step": 20890 }, { "epoch": 4.25, "learning_rate": 1.6504702568449073e-05, "loss": 0.0032, "step": 20891 }, { "epoch": 4.25, "learning_rate": 1.6495863534798498e-05, "loss": 0.0009, "step": 20892 }, { "epoch": 4.25, "learning_rate": 1.6487026730919005e-05, "loss": 0.0001, "step": 20893 }, { "epoch": 4.25, "learning_rate": 1.64781921569582e-05, "loss": 0.008, "step": 20894 }, { "epoch": 4.25, "learning_rate": 1.6469359813063605e-05, "loss": 0.0002, "step": 20895 }, { "epoch": 4.25, "learning_rate": 1.6460529699382757e-05, "loss": 0.0001, "step": 20896 }, { "epoch": 4.26, "learning_rate": 1.645170181606319e-05, "loss": 0.0003, "step": 20897 }, { "epoch": 4.26, "learning_rate": 1.6442876163252217e-05, "loss": 0.0005, "step": 20898 }, { "epoch": 4.26, "learning_rate": 1.6434052741097387e-05, "loss": 0.0024, "step": 20899 }, { "epoch": 4.26, "learning_rate": 1.6425231549745933e-05, "loss": 0.0005, "step": 20900 }, { "epoch": 4.26, "learning_rate": 1.64164125893453e-05, "loss": 0.0003, "step": 20901 }, { "epoch": 4.26, "learning_rate": 1.6407595860042728e-05, "loss": 0.0001, "step": 20902 }, { "epoch": 4.26, "learning_rate": 1.6398781361985474e-05, "loss": 0.0009, "step": 20903 }, { "epoch": 4.26, "learning_rate": 1.6389969095320743e-05, "loss": 0.0005, "step": 20904 }, { "epoch": 4.26, "learning_rate": 1.6381159060195748e-05, "loss": 0.0002, "step": 20905 }, { "epoch": 4.26, "learning_rate": 1.637235125675762e-05, "loss": 0.0007, "step": 20906 }, { "epoch": 4.26, "learning_rate": 1.636354568515348e-05, "loss": 0.0028, "step": 20907 }, { "epoch": 4.26, "learning_rate": 1.6354742345530353e-05, "loss": 0.0001, "step": 20908 }, { "epoch": 4.26, "learning_rate": 1.6345941238035328e-05, "loss": 0.0006, "step": 20909 }, { "epoch": 4.26, "learning_rate": 1.6337142362815397e-05, "loss": 0.0072, "step": 20910 }, { "epoch": 4.26, "learning_rate": 1.6328345720017433e-05, "loss": 0.0007, "step": 20911 }, { "epoch": 4.26, "learning_rate": 1.631955130978848e-05, "loss": 0.0001, "step": 20912 }, { "epoch": 4.26, "learning_rate": 1.6310759132275292e-05, "loss": 0.0005, "step": 20913 }, { "epoch": 4.26, "learning_rate": 1.6301969187624848e-05, "loss": 0.0007, "step": 20914 }, { "epoch": 4.26, "learning_rate": 1.6293181475983863e-05, "loss": 0.0011, "step": 20915 }, { "epoch": 4.26, "learning_rate": 1.6284395997499107e-05, "loss": 0.0006, "step": 20916 }, { "epoch": 4.26, "learning_rate": 1.6275612752317408e-05, "loss": 0.0052, "step": 20917 }, { "epoch": 4.26, "learning_rate": 1.6266831740585334e-05, "loss": 0.0069, "step": 20918 }, { "epoch": 4.26, "learning_rate": 1.6258052962449668e-05, "loss": 0.0001, "step": 20919 }, { "epoch": 4.26, "learning_rate": 1.6249276418056945e-05, "loss": 0.0042, "step": 20920 }, { "epoch": 4.26, "learning_rate": 1.6240502107553777e-05, "loss": 0.0006, "step": 20921 }, { "epoch": 4.26, "learning_rate": 1.6231730031086713e-05, "loss": 0.0007, "step": 20922 }, { "epoch": 4.26, "learning_rate": 1.622296018880226e-05, "loss": 0.0009, "step": 20923 }, { "epoch": 4.26, "learning_rate": 1.6214192580846907e-05, "loss": 0.0001, "step": 20924 }, { "epoch": 4.26, "learning_rate": 1.6205427207367062e-05, "loss": 0.0007, "step": 20925 }, { "epoch": 4.26, "learning_rate": 1.6196664068509135e-05, "loss": 0.0013, "step": 20926 }, { "epoch": 4.26, "learning_rate": 1.6187903164419496e-05, "loss": 0.0002, "step": 20927 }, { "epoch": 4.26, "learning_rate": 1.6179144495244477e-05, "loss": 0.0019, "step": 20928 }, { "epoch": 4.26, "learning_rate": 1.6170388061130328e-05, "loss": 0.0029, "step": 20929 }, { "epoch": 4.26, "learning_rate": 1.6161633862223367e-05, "loss": 0.003, "step": 20930 }, { "epoch": 4.26, "learning_rate": 1.615288189866969e-05, "loss": 0.0016, "step": 20931 }, { "epoch": 4.26, "learning_rate": 1.6144132170615598e-05, "loss": 0.0018, "step": 20932 }, { "epoch": 4.26, "learning_rate": 1.6135384678207142e-05, "loss": 0.0008, "step": 20933 }, { "epoch": 4.26, "learning_rate": 1.612663942159044e-05, "loss": 0.0001, "step": 20934 }, { "epoch": 4.26, "learning_rate": 1.6117896400911566e-05, "loss": 0.0025, "step": 20935 }, { "epoch": 4.26, "learning_rate": 1.610915561631655e-05, "loss": 0.0001, "step": 20936 }, { "epoch": 4.26, "learning_rate": 1.610041706795138e-05, "loss": 0.0006, "step": 20937 }, { "epoch": 4.26, "learning_rate": 1.6091680755961983e-05, "loss": 0.0001, "step": 20938 }, { "epoch": 4.26, "learning_rate": 1.6082946680494304e-05, "loss": 0.0015, "step": 20939 }, { "epoch": 4.26, "learning_rate": 1.6074214841694188e-05, "loss": 0.0085, "step": 20940 }, { "epoch": 4.26, "learning_rate": 1.6065485239707478e-05, "loss": 0.0024, "step": 20941 }, { "epoch": 4.26, "learning_rate": 1.605675787468e-05, "loss": 0.0023, "step": 20942 }, { "epoch": 4.26, "learning_rate": 1.604803274675752e-05, "loss": 0.0005, "step": 20943 }, { "epoch": 4.26, "learning_rate": 1.60393098560857e-05, "loss": 0.0043, "step": 20944 }, { "epoch": 4.26, "learning_rate": 1.603058920281029e-05, "loss": 0.0034, "step": 20945 }, { "epoch": 4.27, "learning_rate": 1.6021870787076934e-05, "loss": 0.0016, "step": 20946 }, { "epoch": 4.27, "learning_rate": 1.6013154609031233e-05, "loss": 0.0017, "step": 20947 }, { "epoch": 4.27, "learning_rate": 1.6004440668818813e-05, "loss": 0.0002, "step": 20948 }, { "epoch": 4.27, "learning_rate": 1.599572896658508e-05, "loss": 0.0006, "step": 20949 }, { "epoch": 4.27, "learning_rate": 1.5987019502475702e-05, "loss": 0.0026, "step": 20950 }, { "epoch": 4.27, "learning_rate": 1.5978312276636006e-05, "loss": 0.0001, "step": 20951 }, { "epoch": 4.27, "learning_rate": 1.5969607289211532e-05, "loss": 0.0005, "step": 20952 }, { "epoch": 4.27, "learning_rate": 1.5960904540347595e-05, "loss": 0.0053, "step": 20953 }, { "epoch": 4.27, "learning_rate": 1.5952204030189563e-05, "loss": 0.0074, "step": 20954 }, { "epoch": 4.27, "learning_rate": 1.5943505758882768e-05, "loss": 0.0029, "step": 20955 }, { "epoch": 4.27, "learning_rate": 1.593480972657246e-05, "loss": 0.0007, "step": 20956 }, { "epoch": 4.27, "learning_rate": 1.592611593340391e-05, "loss": 0.0003, "step": 20957 }, { "epoch": 4.27, "learning_rate": 1.5917424379522297e-05, "loss": 0.0001, "step": 20958 }, { "epoch": 4.27, "learning_rate": 1.5908735065072793e-05, "loss": 0.0002, "step": 20959 }, { "epoch": 4.27, "learning_rate": 1.5900047990200542e-05, "loss": 0.0007, "step": 20960 }, { "epoch": 4.27, "learning_rate": 1.5891363155050635e-05, "loss": 0.0023, "step": 20961 }, { "epoch": 4.27, "learning_rate": 1.588268055976805e-05, "loss": 0.0002, "step": 20962 }, { "epoch": 4.27, "learning_rate": 1.5874000204497946e-05, "loss": 0.0055, "step": 20963 }, { "epoch": 4.27, "learning_rate": 1.5865322089385146e-05, "loss": 0.0001, "step": 20964 }, { "epoch": 4.27, "learning_rate": 1.5856646214574725e-05, "loss": 0.0058, "step": 20965 }, { "epoch": 4.27, "learning_rate": 1.5847972580211482e-05, "loss": 0.0009, "step": 20966 }, { "epoch": 4.27, "learning_rate": 1.583930118644035e-05, "loss": 0.0001, "step": 20967 }, { "epoch": 4.27, "learning_rate": 1.5830632033406117e-05, "loss": 0.0045, "step": 20968 }, { "epoch": 4.27, "learning_rate": 1.5821965121253576e-05, "loss": 0.0012, "step": 20969 }, { "epoch": 4.27, "learning_rate": 1.5813300450127552e-05, "loss": 0.0002, "step": 20970 }, { "epoch": 4.27, "learning_rate": 1.580463802017266e-05, "loss": 0.0035, "step": 20971 }, { "epoch": 4.27, "learning_rate": 1.579597783153365e-05, "loss": 0.0006, "step": 20972 }, { "epoch": 4.27, "learning_rate": 1.5787319884355125e-05, "loss": 0.0001, "step": 20973 }, { "epoch": 4.27, "learning_rate": 1.5778664178781703e-05, "loss": 0.0026, "step": 20974 }, { "epoch": 4.27, "learning_rate": 1.5770010714957946e-05, "loss": 0.0024, "step": 20975 }, { "epoch": 4.27, "learning_rate": 1.5761359493028398e-05, "loss": 0.0003, "step": 20976 }, { "epoch": 4.27, "learning_rate": 1.5752710513137533e-05, "loss": 0.0002, "step": 20977 }, { "epoch": 4.27, "learning_rate": 1.574406377542981e-05, "loss": 0.0008, "step": 20978 }, { "epoch": 4.27, "learning_rate": 1.5735419280049645e-05, "loss": 0.0024, "step": 20979 }, { "epoch": 4.27, "learning_rate": 1.5726777027141436e-05, "loss": 0.0041, "step": 20980 }, { "epoch": 4.27, "learning_rate": 1.571813701684952e-05, "loss": 0.0011, "step": 20981 }, { "epoch": 4.27, "learning_rate": 1.5709499249318148e-05, "loss": 0.0013, "step": 20982 }, { "epoch": 4.27, "learning_rate": 1.5700863724691685e-05, "loss": 0.0025, "step": 20983 }, { "epoch": 4.27, "learning_rate": 1.5692230443114272e-05, "loss": 0.0044, "step": 20984 }, { "epoch": 4.27, "learning_rate": 1.5683599404730124e-05, "loss": 0.0002, "step": 20985 }, { "epoch": 4.27, "learning_rate": 1.5674970609683425e-05, "loss": 0.0029, "step": 20986 }, { "epoch": 4.27, "learning_rate": 1.5666344058118257e-05, "loss": 0.0009, "step": 20987 }, { "epoch": 4.27, "learning_rate": 1.5657719750178727e-05, "loss": 0.0024, "step": 20988 }, { "epoch": 4.27, "learning_rate": 1.5649097686008864e-05, "loss": 0.0151, "step": 20989 }, { "epoch": 4.27, "learning_rate": 1.5640477865752678e-05, "loss": 0.0015, "step": 20990 }, { "epoch": 4.27, "learning_rate": 1.5631860289554126e-05, "loss": 0.002, "step": 20991 }, { "epoch": 4.27, "learning_rate": 1.562324495755715e-05, "loss": 0.0013, "step": 20992 }, { "epoch": 4.27, "learning_rate": 1.5614631869905635e-05, "loss": 0.0031, "step": 20993 }, { "epoch": 4.27, "learning_rate": 1.5606021026743466e-05, "loss": 0.0011, "step": 20994 }, { "epoch": 4.27, "learning_rate": 1.5597412428214373e-05, "loss": 0.0013, "step": 20995 }, { "epoch": 4.28, "learning_rate": 1.5588806074462262e-05, "loss": 0.0018, "step": 20996 }, { "epoch": 4.28, "learning_rate": 1.558020196563075e-05, "loss": 0.0004, "step": 20997 }, { "epoch": 4.28, "learning_rate": 1.5571600101863625e-05, "loss": 0.0031, "step": 20998 }, { "epoch": 4.28, "learning_rate": 1.5563000483304548e-05, "loss": 0.0001, "step": 20999 }, { "epoch": 4.28, "learning_rate": 1.5554403110097098e-05, "loss": 0.0042, "step": 21000 }, { "epoch": 4.28, "learning_rate": 1.5545807982384935e-05, "loss": 0.0004, "step": 21001 }, { "epoch": 4.28, "learning_rate": 1.553721510031153e-05, "loss": 0.0005, "step": 21002 }, { "epoch": 4.28, "learning_rate": 1.55286244640205e-05, "loss": 0.0025, "step": 21003 }, { "epoch": 4.28, "learning_rate": 1.5520036073655267e-05, "loss": 0.0025, "step": 21004 }, { "epoch": 4.28, "learning_rate": 1.5511449929359267e-05, "loss": 0.0002, "step": 21005 }, { "epoch": 4.28, "learning_rate": 1.5502866031275913e-05, "loss": 0.0011, "step": 21006 }, { "epoch": 4.28, "learning_rate": 1.5494284379548577e-05, "loss": 0.0051, "step": 21007 }, { "epoch": 4.28, "learning_rate": 1.5485704974320594e-05, "loss": 0.0009, "step": 21008 }, { "epoch": 4.28, "learning_rate": 1.547712781573525e-05, "loss": 0.0103, "step": 21009 }, { "epoch": 4.28, "learning_rate": 1.54685529039358e-05, "loss": 0.0009, "step": 21010 }, { "epoch": 4.28, "learning_rate": 1.5459980239065474e-05, "loss": 0.0014, "step": 21011 }, { "epoch": 4.28, "learning_rate": 1.545140982126746e-05, "loss": 0.0013, "step": 21012 }, { "epoch": 4.28, "learning_rate": 1.5442841650684824e-05, "loss": 0.0008, "step": 21013 }, { "epoch": 4.28, "learning_rate": 1.5434275727460786e-05, "loss": 0.0005, "step": 21014 }, { "epoch": 4.28, "learning_rate": 1.5425712051738287e-05, "loss": 0.001, "step": 21015 }, { "epoch": 4.28, "learning_rate": 1.541715062366049e-05, "loss": 0.0009, "step": 21016 }, { "epoch": 4.28, "learning_rate": 1.5408591443370284e-05, "loss": 0.0029, "step": 21017 }, { "epoch": 4.28, "learning_rate": 1.540003451101067e-05, "loss": 0.0009, "step": 21018 }, { "epoch": 4.28, "learning_rate": 1.5391479826724562e-05, "loss": 0.0031, "step": 21019 }, { "epoch": 4.28, "learning_rate": 1.538292739065482e-05, "loss": 0.001, "step": 21020 }, { "epoch": 4.28, "learning_rate": 1.5374377202944293e-05, "loss": 0.0006, "step": 21021 }, { "epoch": 4.28, "learning_rate": 1.53658292637358e-05, "loss": 0.0026, "step": 21022 }, { "epoch": 4.28, "learning_rate": 1.5357283573172098e-05, "loss": 0.0017, "step": 21023 }, { "epoch": 4.28, "learning_rate": 1.5348740131395915e-05, "loss": 0.0057, "step": 21024 }, { "epoch": 4.28, "learning_rate": 1.534019893854994e-05, "loss": 0.0017, "step": 21025 }, { "epoch": 4.28, "learning_rate": 1.5331659994776847e-05, "loss": 0.0004, "step": 21026 }, { "epoch": 4.28, "learning_rate": 1.5323123300219246e-05, "loss": 0.0002, "step": 21027 }, { "epoch": 4.28, "learning_rate": 1.5314588855019666e-05, "loss": 0.0005, "step": 21028 }, { "epoch": 4.28, "learning_rate": 1.5306056659320704e-05, "loss": 0.0027, "step": 21029 }, { "epoch": 4.28, "learning_rate": 1.5297526713264847e-05, "loss": 0.0054, "step": 21030 }, { "epoch": 4.28, "learning_rate": 1.528899901699458e-05, "loss": 0.0022, "step": 21031 }, { "epoch": 4.28, "learning_rate": 1.5280473570652324e-05, "loss": 0.0003, "step": 21032 }, { "epoch": 4.28, "learning_rate": 1.5271950374380416e-05, "loss": 0.0032, "step": 21033 }, { "epoch": 4.28, "learning_rate": 1.5263429428321305e-05, "loss": 0.0008, "step": 21034 }, { "epoch": 4.28, "learning_rate": 1.5254910732617232e-05, "loss": 0.0029, "step": 21035 }, { "epoch": 4.28, "learning_rate": 1.5246394287410495e-05, "loss": 0.0027, "step": 21036 }, { "epoch": 4.28, "learning_rate": 1.5237880092843336e-05, "loss": 0.0025, "step": 21037 }, { "epoch": 4.28, "learning_rate": 1.5229368149057969e-05, "loss": 0.0022, "step": 21038 }, { "epoch": 4.28, "learning_rate": 1.5220858456196533e-05, "loss": 0.0019, "step": 21039 }, { "epoch": 4.28, "learning_rate": 1.5212351014401198e-05, "loss": 0.0013, "step": 21040 }, { "epoch": 4.28, "learning_rate": 1.5203845823814016e-05, "loss": 0.0051, "step": 21041 }, { "epoch": 4.28, "learning_rate": 1.5195342884577056e-05, "loss": 0.0045, "step": 21042 }, { "epoch": 4.28, "learning_rate": 1.5186842196832339e-05, "loss": 0.0057, "step": 21043 }, { "epoch": 4.28, "learning_rate": 1.5178343760721834e-05, "loss": 0.0046, "step": 21044 }, { "epoch": 4.29, "learning_rate": 1.5169847576387511e-05, "loss": 0.003, "step": 21045 }, { "epoch": 4.29, "learning_rate": 1.5161353643971174e-05, "loss": 0.0047, "step": 21046 }, { "epoch": 4.29, "learning_rate": 1.5152861963614827e-05, "loss": 0.0002, "step": 21047 }, { "epoch": 4.29, "learning_rate": 1.514437253546017e-05, "loss": 0.0031, "step": 21048 }, { "epoch": 4.29, "learning_rate": 1.5135885359649108e-05, "loss": 0.0006, "step": 21049 }, { "epoch": 4.29, "learning_rate": 1.5127400436323295e-05, "loss": 0.0013, "step": 21050 }, { "epoch": 4.29, "learning_rate": 1.5118917765624467e-05, "loss": 0.0021, "step": 21051 }, { "epoch": 4.29, "learning_rate": 1.5110437347694377e-05, "loss": 0.0067, "step": 21052 }, { "epoch": 4.29, "learning_rate": 1.5101959182674544e-05, "loss": 0.0005, "step": 21053 }, { "epoch": 4.29, "learning_rate": 1.5093483270706674e-05, "loss": 0.0002, "step": 21054 }, { "epoch": 4.29, "learning_rate": 1.5085009611932287e-05, "loss": 0.0006, "step": 21055 }, { "epoch": 4.29, "learning_rate": 1.5076538206492883e-05, "loss": 0.0019, "step": 21056 }, { "epoch": 4.29, "learning_rate": 1.5068069054529985e-05, "loss": 0.0058, "step": 21057 }, { "epoch": 4.29, "learning_rate": 1.5059602156185047e-05, "loss": 0.0008, "step": 21058 }, { "epoch": 4.29, "learning_rate": 1.5051137511599454e-05, "loss": 0.0046, "step": 21059 }, { "epoch": 4.29, "learning_rate": 1.504267512091461e-05, "loss": 0.0001, "step": 21060 }, { "epoch": 4.29, "learning_rate": 1.5034214984271837e-05, "loss": 0.0009, "step": 21061 }, { "epoch": 4.29, "learning_rate": 1.5025757101812452e-05, "loss": 0.0003, "step": 21062 }, { "epoch": 4.29, "learning_rate": 1.5017301473677713e-05, "loss": 0.0021, "step": 21063 }, { "epoch": 4.29, "learning_rate": 1.5008848100008803e-05, "loss": 0.0011, "step": 21064 }, { "epoch": 4.29, "learning_rate": 1.5000396980946978e-05, "loss": 0.0053, "step": 21065 }, { "epoch": 4.29, "learning_rate": 1.4991948116633307e-05, "loss": 0.0011, "step": 21066 }, { "epoch": 4.29, "learning_rate": 1.4983501507209012e-05, "loss": 0.0002, "step": 21067 }, { "epoch": 4.29, "learning_rate": 1.4975057152815061e-05, "loss": 0.0047, "step": 21068 }, { "epoch": 4.29, "learning_rate": 1.4966615053592545e-05, "loss": 0.0002, "step": 21069 }, { "epoch": 4.29, "learning_rate": 1.4958175209682449e-05, "loss": 0.001, "step": 21070 }, { "epoch": 4.29, "learning_rate": 1.4949737621225727e-05, "loss": 0.0007, "step": 21071 }, { "epoch": 4.29, "learning_rate": 1.4941302288363316e-05, "loss": 0.0008, "step": 21072 }, { "epoch": 4.29, "learning_rate": 1.4932869211236105e-05, "loss": 0.0017, "step": 21073 }, { "epoch": 4.29, "learning_rate": 1.4924438389984927e-05, "loss": 0.0025, "step": 21074 }, { "epoch": 4.29, "learning_rate": 1.4916009824750608e-05, "loss": 0.0012, "step": 21075 }, { "epoch": 4.29, "learning_rate": 1.4907583515673915e-05, "loss": 0.0001, "step": 21076 }, { "epoch": 4.29, "learning_rate": 1.4899159462895588e-05, "loss": 0.0024, "step": 21077 }, { "epoch": 4.29, "learning_rate": 1.489073766655633e-05, "loss": 0.0003, "step": 21078 }, { "epoch": 4.29, "learning_rate": 1.4882318126796743e-05, "loss": 0.0003, "step": 21079 }, { "epoch": 4.29, "learning_rate": 1.4873900843757552e-05, "loss": 0.0002, "step": 21080 }, { "epoch": 4.29, "learning_rate": 1.486548581757926e-05, "loss": 0.002, "step": 21081 }, { "epoch": 4.29, "learning_rate": 1.4857073048402402e-05, "loss": 0.0038, "step": 21082 }, { "epoch": 4.29, "learning_rate": 1.4848662536367583e-05, "loss": 0.0004, "step": 21083 }, { "epoch": 4.29, "learning_rate": 1.484025428161516e-05, "loss": 0.0008, "step": 21084 }, { "epoch": 4.29, "learning_rate": 1.4831848284285686e-05, "loss": 0.0001, "step": 21085 }, { "epoch": 4.29, "learning_rate": 1.4823444544519463e-05, "loss": 0.0059, "step": 21086 }, { "epoch": 4.29, "learning_rate": 1.4815043062456883e-05, "loss": 0.0018, "step": 21087 }, { "epoch": 4.29, "learning_rate": 1.4806643838238247e-05, "loss": 0.0002, "step": 21088 }, { "epoch": 4.29, "learning_rate": 1.4798246872003878e-05, "loss": 0.0, "step": 21089 }, { "epoch": 4.29, "learning_rate": 1.4789852163893978e-05, "loss": 0.0005, "step": 21090 }, { "epoch": 4.29, "learning_rate": 1.4781459714048788e-05, "loss": 0.0001, "step": 21091 }, { "epoch": 4.29, "learning_rate": 1.4773069522608444e-05, "loss": 0.0044, "step": 21092 }, { "epoch": 4.29, "learning_rate": 1.4764681589713117e-05, "loss": 0.005, "step": 21093 }, { "epoch": 4.3, "learning_rate": 1.475629591550288e-05, "loss": 0.0027, "step": 21094 }, { "epoch": 4.3, "learning_rate": 1.4747912500117787e-05, "loss": 0.0014, "step": 21095 }, { "epoch": 4.3, "learning_rate": 1.473953134369789e-05, "loss": 0.0003, "step": 21096 }, { "epoch": 4.3, "learning_rate": 1.4731152446383083e-05, "loss": 0.0007, "step": 21097 }, { "epoch": 4.3, "learning_rate": 1.472277580831343e-05, "loss": 0.0004, "step": 21098 }, { "epoch": 4.3, "learning_rate": 1.4714401429628725e-05, "loss": 0.0001, "step": 21099 }, { "epoch": 4.3, "learning_rate": 1.470602931046892e-05, "loss": 0.0002, "step": 21100 }, { "epoch": 4.3, "learning_rate": 1.4697659450973803e-05, "loss": 0.0001, "step": 21101 }, { "epoch": 4.3, "learning_rate": 1.4689291851283164e-05, "loss": 0.0008, "step": 21102 }, { "epoch": 4.3, "learning_rate": 1.4680926511536773e-05, "loss": 0.0012, "step": 21103 }, { "epoch": 4.3, "learning_rate": 1.4672563431874318e-05, "loss": 0.0018, "step": 21104 }, { "epoch": 4.3, "learning_rate": 1.4664202612435554e-05, "loss": 0.0009, "step": 21105 }, { "epoch": 4.3, "learning_rate": 1.4655844053360038e-05, "loss": 0.0011, "step": 21106 }, { "epoch": 4.3, "learning_rate": 1.4647487754787406e-05, "loss": 0.0005, "step": 21107 }, { "epoch": 4.3, "learning_rate": 1.4639133716857231e-05, "loss": 0.0028, "step": 21108 }, { "epoch": 4.3, "learning_rate": 1.4630781939709069e-05, "loss": 0.0003, "step": 21109 }, { "epoch": 4.3, "learning_rate": 1.4622432423482306e-05, "loss": 0.0065, "step": 21110 }, { "epoch": 4.3, "learning_rate": 1.4614085168316497e-05, "loss": 0.0065, "step": 21111 }, { "epoch": 4.3, "learning_rate": 1.4605740174351033e-05, "loss": 0.0008, "step": 21112 }, { "epoch": 4.3, "learning_rate": 1.4597397441725284e-05, "loss": 0.0003, "step": 21113 }, { "epoch": 4.3, "learning_rate": 1.4589056970578605e-05, "loss": 0.0001, "step": 21114 }, { "epoch": 4.3, "learning_rate": 1.458071876105022e-05, "loss": 0.0002, "step": 21115 }, { "epoch": 4.3, "learning_rate": 1.4572382813279532e-05, "loss": 0.0001, "step": 21116 }, { "epoch": 4.3, "learning_rate": 1.4564049127405614e-05, "loss": 0.0005, "step": 21117 }, { "epoch": 4.3, "learning_rate": 1.4555717703567787e-05, "loss": 0.0003, "step": 21118 }, { "epoch": 4.3, "learning_rate": 1.4547388541905125e-05, "loss": 0.0006, "step": 21119 }, { "epoch": 4.3, "learning_rate": 1.4539061642556749e-05, "loss": 0.0013, "step": 21120 }, { "epoch": 4.3, "learning_rate": 1.4530737005661747e-05, "loss": 0.0011, "step": 21121 }, { "epoch": 4.3, "learning_rate": 1.4522414631359158e-05, "loss": 0.0018, "step": 21122 }, { "epoch": 4.3, "learning_rate": 1.4514094519787973e-05, "loss": 0.0018, "step": 21123 }, { "epoch": 4.3, "learning_rate": 1.450577667108716e-05, "loss": 0.0006, "step": 21124 }, { "epoch": 4.3, "learning_rate": 1.4497461085395629e-05, "loss": 0.0032, "step": 21125 }, { "epoch": 4.3, "learning_rate": 1.4489147762852282e-05, "loss": 0.0009, "step": 21126 }, { "epoch": 4.3, "learning_rate": 1.4480836703595977e-05, "loss": 0.0054, "step": 21127 }, { "epoch": 4.3, "learning_rate": 1.4472527907765485e-05, "loss": 0.0017, "step": 21128 }, { "epoch": 4.3, "learning_rate": 1.4464221375499647e-05, "loss": 0.0015, "step": 21129 }, { "epoch": 4.3, "learning_rate": 1.4455917106937098e-05, "loss": 0.0001, "step": 21130 }, { "epoch": 4.3, "learning_rate": 1.4447615102216648e-05, "loss": 0.0017, "step": 21131 }, { "epoch": 4.3, "learning_rate": 1.4439315361476867e-05, "loss": 0.0009, "step": 21132 }, { "epoch": 4.3, "learning_rate": 1.443101788485641e-05, "loss": 0.0002, "step": 21133 }, { "epoch": 4.3, "learning_rate": 1.4422722672493853e-05, "loss": 0.0008, "step": 21134 }, { "epoch": 4.3, "learning_rate": 1.4414429724527732e-05, "loss": 0.0005, "step": 21135 }, { "epoch": 4.3, "learning_rate": 1.440613904109662e-05, "loss": 0.0015, "step": 21136 }, { "epoch": 4.3, "learning_rate": 1.4397850622338908e-05, "loss": 0.0109, "step": 21137 }, { "epoch": 4.3, "learning_rate": 1.438956446839305e-05, "loss": 0.0027, "step": 21138 }, { "epoch": 4.3, "learning_rate": 1.4381280579397452e-05, "loss": 0.0026, "step": 21139 }, { "epoch": 4.3, "learning_rate": 1.4372998955490472e-05, "loss": 0.003, "step": 21140 }, { "epoch": 4.3, "learning_rate": 1.4364719596810431e-05, "loss": 0.0011, "step": 21141 }, { "epoch": 4.3, "learning_rate": 1.4356442503495586e-05, "loss": 0.0069, "step": 21142 }, { "epoch": 4.31, "learning_rate": 1.4348167675684209e-05, "loss": 0.0064, "step": 21143 }, { "epoch": 4.31, "learning_rate": 1.4339895113514488e-05, "loss": 0.0002, "step": 21144 }, { "epoch": 4.31, "learning_rate": 1.43316248171246e-05, "loss": 0.0009, "step": 21145 }, { "epoch": 4.31, "learning_rate": 1.4323356786652661e-05, "loss": 0.0005, "step": 21146 }, { "epoch": 4.31, "learning_rate": 1.4315091022236802e-05, "loss": 0.0002, "step": 21147 }, { "epoch": 4.31, "learning_rate": 1.430682752401499e-05, "loss": 0.0118, "step": 21148 }, { "epoch": 4.31, "learning_rate": 1.429856629212537e-05, "loss": 0.0004, "step": 21149 }, { "epoch": 4.31, "learning_rate": 1.4290307326705775e-05, "loss": 0.0002, "step": 21150 }, { "epoch": 4.31, "learning_rate": 1.4282050627894265e-05, "loss": 0.0001, "step": 21151 }, { "epoch": 4.31, "learning_rate": 1.4273796195828679e-05, "loss": 0.0002, "step": 21152 }, { "epoch": 4.31, "learning_rate": 1.4265544030646909e-05, "loss": 0.0054, "step": 21153 }, { "epoch": 4.31, "learning_rate": 1.4257294132486758e-05, "loss": 0.0039, "step": 21154 }, { "epoch": 4.31, "learning_rate": 1.4249046501486017e-05, "loss": 0.0024, "step": 21155 }, { "epoch": 4.31, "learning_rate": 1.4240801137782459e-05, "loss": 0.0038, "step": 21156 }, { "epoch": 4.31, "learning_rate": 1.4232558041513791e-05, "loss": 0.0051, "step": 21157 }, { "epoch": 4.31, "learning_rate": 1.422431721281767e-05, "loss": 0.0003, "step": 21158 }, { "epoch": 4.31, "learning_rate": 1.4216078651831752e-05, "loss": 0.0036, "step": 21159 }, { "epoch": 4.31, "learning_rate": 1.4207842358693677e-05, "loss": 0.0001, "step": 21160 }, { "epoch": 4.31, "learning_rate": 1.4199608333540886e-05, "loss": 0.0039, "step": 21161 }, { "epoch": 4.31, "learning_rate": 1.4191376576511033e-05, "loss": 0.0005, "step": 21162 }, { "epoch": 4.31, "learning_rate": 1.4183147087741492e-05, "loss": 0.0004, "step": 21163 }, { "epoch": 4.31, "learning_rate": 1.4174919867369789e-05, "loss": 0.0036, "step": 21164 }, { "epoch": 4.31, "learning_rate": 1.416669491553336e-05, "loss": 0.0042, "step": 21165 }, { "epoch": 4.31, "learning_rate": 1.415847223236945e-05, "loss": 0.0003, "step": 21166 }, { "epoch": 4.31, "learning_rate": 1.4150251818015545e-05, "loss": 0.0003, "step": 21167 }, { "epoch": 4.31, "learning_rate": 1.4142033672608805e-05, "loss": 0.0015, "step": 21168 }, { "epoch": 4.31, "learning_rate": 1.4133817796286617e-05, "loss": 0.001, "step": 21169 }, { "epoch": 4.31, "learning_rate": 1.4125604189186106e-05, "loss": 0.0018, "step": 21170 }, { "epoch": 4.31, "learning_rate": 1.411739285144448e-05, "loss": 0.0094, "step": 21171 }, { "epoch": 4.31, "learning_rate": 1.4109183783198897e-05, "loss": 0.0021, "step": 21172 }, { "epoch": 4.31, "learning_rate": 1.410097698458646e-05, "loss": 0.001, "step": 21173 }, { "epoch": 4.31, "learning_rate": 1.4092772455744227e-05, "loss": 0.0003, "step": 21174 }, { "epoch": 4.31, "learning_rate": 1.4084570196809242e-05, "loss": 0.0044, "step": 21175 }, { "epoch": 4.31, "learning_rate": 1.4076370207918492e-05, "loss": 0.0057, "step": 21176 }, { "epoch": 4.31, "learning_rate": 1.4068172489208934e-05, "loss": 0.0003, "step": 21177 }, { "epoch": 4.31, "learning_rate": 1.4059977040817494e-05, "loss": 0.0012, "step": 21178 }, { "epoch": 4.31, "learning_rate": 1.4051783862881027e-05, "loss": 0.0056, "step": 21179 }, { "epoch": 4.31, "learning_rate": 1.4043592955536426e-05, "loss": 0.002, "step": 21180 }, { "epoch": 4.31, "learning_rate": 1.4035404318920395e-05, "loss": 0.0009, "step": 21181 }, { "epoch": 4.31, "learning_rate": 1.4027217953169828e-05, "loss": 0.0001, "step": 21182 }, { "epoch": 4.31, "learning_rate": 1.4019033858421347e-05, "loss": 0.0006, "step": 21183 }, { "epoch": 4.31, "learning_rate": 1.4010852034811692e-05, "loss": 0.0002, "step": 21184 }, { "epoch": 4.31, "learning_rate": 1.4002672482477506e-05, "loss": 0.0004, "step": 21185 }, { "epoch": 4.31, "learning_rate": 1.399449520155541e-05, "loss": 0.0, "step": 21186 }, { "epoch": 4.31, "learning_rate": 1.3986320192181965e-05, "loss": 0.0028, "step": 21187 }, { "epoch": 4.31, "learning_rate": 1.397814745449371e-05, "loss": 0.0043, "step": 21188 }, { "epoch": 4.31, "learning_rate": 1.3969976988627169e-05, "loss": 0.0064, "step": 21189 }, { "epoch": 4.31, "learning_rate": 1.3961808794718765e-05, "loss": 0.007, "step": 21190 }, { "epoch": 4.31, "learning_rate": 1.3953642872904958e-05, "loss": 0.0016, "step": 21191 }, { "epoch": 4.32, "learning_rate": 1.394547922332212e-05, "loss": 0.0003, "step": 21192 }, { "epoch": 4.32, "learning_rate": 1.3937317846106626e-05, "loss": 0.0002, "step": 21193 }, { "epoch": 4.32, "learning_rate": 1.3929158741394702e-05, "loss": 0.0006, "step": 21194 }, { "epoch": 4.32, "learning_rate": 1.392100190932272e-05, "loss": 0.0005, "step": 21195 }, { "epoch": 4.32, "learning_rate": 1.3912847350026857e-05, "loss": 0.0, "step": 21196 }, { "epoch": 4.32, "learning_rate": 1.3904695063643334e-05, "loss": 0.0037, "step": 21197 }, { "epoch": 4.32, "learning_rate": 1.3896545050308327e-05, "loss": 0.0007, "step": 21198 }, { "epoch": 4.32, "learning_rate": 1.3888397310157879e-05, "loss": 0.0009, "step": 21199 }, { "epoch": 4.32, "learning_rate": 1.3880251843328177e-05, "loss": 0.0003, "step": 21200 }, { "epoch": 4.32, "learning_rate": 1.3872108649955166e-05, "loss": 0.0021, "step": 21201 }, { "epoch": 4.32, "learning_rate": 1.3863967730174951e-05, "loss": 0.0021, "step": 21202 }, { "epoch": 4.32, "learning_rate": 1.385582908412341e-05, "loss": 0.0015, "step": 21203 }, { "epoch": 4.32, "learning_rate": 1.3847692711936531e-05, "loss": 0.0045, "step": 21204 }, { "epoch": 4.32, "learning_rate": 1.3839558613750174e-05, "loss": 0.0043, "step": 21205 }, { "epoch": 4.32, "learning_rate": 1.3831426789700228e-05, "loss": 0.001, "step": 21206 }, { "epoch": 4.32, "learning_rate": 1.382329723992247e-05, "loss": 0.0005, "step": 21207 }, { "epoch": 4.32, "learning_rate": 1.3815169964552709e-05, "loss": 0.001, "step": 21208 }, { "epoch": 4.32, "learning_rate": 1.3807044963726683e-05, "loss": 0.0001, "step": 21209 }, { "epoch": 4.32, "learning_rate": 1.3798922237580085e-05, "loss": 0.0004, "step": 21210 }, { "epoch": 4.32, "learning_rate": 1.3790801786248607e-05, "loss": 0.0006, "step": 21211 }, { "epoch": 4.32, "learning_rate": 1.3782683609867806e-05, "loss": 0.0024, "step": 21212 }, { "epoch": 4.32, "learning_rate": 1.3774567708573359e-05, "loss": 0.0024, "step": 21213 }, { "epoch": 4.32, "learning_rate": 1.3766454082500721e-05, "loss": 0.0007, "step": 21214 }, { "epoch": 4.32, "learning_rate": 1.375834273178552e-05, "loss": 0.0013, "step": 21215 }, { "epoch": 4.32, "learning_rate": 1.3750233656563148e-05, "loss": 0.0015, "step": 21216 }, { "epoch": 4.32, "learning_rate": 1.3742126856969026e-05, "loss": 0.003, "step": 21217 }, { "epoch": 4.32, "learning_rate": 1.373402233313865e-05, "loss": 0.0007, "step": 21218 }, { "epoch": 4.32, "learning_rate": 1.3725920085207259e-05, "loss": 0.0037, "step": 21219 }, { "epoch": 4.32, "learning_rate": 1.3717820113310312e-05, "loss": 0.0027, "step": 21220 }, { "epoch": 4.32, "learning_rate": 1.370972241758297e-05, "loss": 0.0007, "step": 21221 }, { "epoch": 4.32, "learning_rate": 1.3701626998160553e-05, "loss": 0.0024, "step": 21222 }, { "epoch": 4.32, "learning_rate": 1.3693533855178223e-05, "loss": 0.0001, "step": 21223 }, { "epoch": 4.32, "learning_rate": 1.368544298877119e-05, "loss": 0.0021, "step": 21224 }, { "epoch": 4.32, "learning_rate": 1.3677354399074558e-05, "loss": 0.0005, "step": 21225 }, { "epoch": 4.32, "learning_rate": 1.366926808622344e-05, "loss": 0.0023, "step": 21226 }, { "epoch": 4.32, "learning_rate": 1.3661184050352892e-05, "loss": 0.0005, "step": 21227 }, { "epoch": 4.32, "learning_rate": 1.3653102291597923e-05, "loss": 0.0025, "step": 21228 }, { "epoch": 4.32, "learning_rate": 1.3645022810093558e-05, "loss": 0.0003, "step": 21229 }, { "epoch": 4.32, "learning_rate": 1.3636945605974641e-05, "loss": 0.0014, "step": 21230 }, { "epoch": 4.32, "learning_rate": 1.3628870679376181e-05, "loss": 0.0003, "step": 21231 }, { "epoch": 4.32, "learning_rate": 1.362079803043295e-05, "loss": 0.0021, "step": 21232 }, { "epoch": 4.32, "learning_rate": 1.3612727659279876e-05, "loss": 0.0016, "step": 21233 }, { "epoch": 4.32, "learning_rate": 1.3604659566051685e-05, "loss": 0.0004, "step": 21234 }, { "epoch": 4.32, "learning_rate": 1.3596593750883134e-05, "loss": 0.0197, "step": 21235 }, { "epoch": 4.32, "learning_rate": 1.358853021390895e-05, "loss": 0.0007, "step": 21236 }, { "epoch": 4.32, "learning_rate": 1.358046895526379e-05, "loss": 0.0007, "step": 21237 }, { "epoch": 4.32, "learning_rate": 1.3572409975082332e-05, "loss": 0.0007, "step": 21238 }, { "epoch": 4.32, "learning_rate": 1.3564353273499151e-05, "loss": 0.0006, "step": 21239 }, { "epoch": 4.32, "learning_rate": 1.3556298850648789e-05, "loss": 0.0026, "step": 21240 }, { "epoch": 4.33, "learning_rate": 1.3548246706665806e-05, "loss": 0.0002, "step": 21241 }, { "epoch": 4.33, "learning_rate": 1.3540196841684675e-05, "loss": 0.0009, "step": 21242 }, { "epoch": 4.33, "learning_rate": 1.3532149255839842e-05, "loss": 0.0001, "step": 21243 }, { "epoch": 4.33, "learning_rate": 1.3524103949265746e-05, "loss": 0.0001, "step": 21244 }, { "epoch": 4.33, "learning_rate": 1.3516060922096683e-05, "loss": 0.0019, "step": 21245 }, { "epoch": 4.33, "learning_rate": 1.3508020174467077e-05, "loss": 0.0004, "step": 21246 }, { "epoch": 4.33, "learning_rate": 1.3499981706511138e-05, "loss": 0.0011, "step": 21247 }, { "epoch": 4.33, "learning_rate": 1.349194551836319e-05, "loss": 0.001, "step": 21248 }, { "epoch": 4.33, "learning_rate": 1.3483911610157444e-05, "loss": 0.0002, "step": 21249 }, { "epoch": 4.33, "learning_rate": 1.3475879982028025e-05, "loss": 0.0002, "step": 21250 }, { "epoch": 4.33, "learning_rate": 1.3467850634109161e-05, "loss": 0.0069, "step": 21251 }, { "epoch": 4.33, "learning_rate": 1.3459823566534877e-05, "loss": 0.0002, "step": 21252 }, { "epoch": 4.33, "learning_rate": 1.3451798779439315e-05, "loss": 0.0022, "step": 21253 }, { "epoch": 4.33, "learning_rate": 1.3443776272956453e-05, "loss": 0.0001, "step": 21254 }, { "epoch": 4.33, "learning_rate": 1.3435756047220282e-05, "loss": 0.0027, "step": 21255 }, { "epoch": 4.33, "learning_rate": 1.3427738102364776e-05, "loss": 0.0002, "step": 21256 }, { "epoch": 4.33, "learning_rate": 1.3419722438523834e-05, "loss": 0.0017, "step": 21257 }, { "epoch": 4.33, "learning_rate": 1.3411709055831344e-05, "loss": 0.0046, "step": 21258 }, { "epoch": 4.33, "learning_rate": 1.340369795442115e-05, "loss": 0.0021, "step": 21259 }, { "epoch": 4.33, "learning_rate": 1.3395689134427045e-05, "loss": 0.0, "step": 21260 }, { "epoch": 4.33, "learning_rate": 1.3387682595982774e-05, "loss": 0.0013, "step": 21261 }, { "epoch": 4.33, "learning_rate": 1.3379678339222111e-05, "loss": 0.0029, "step": 21262 }, { "epoch": 4.33, "learning_rate": 1.3371676364278666e-05, "loss": 0.0044, "step": 21263 }, { "epoch": 4.33, "learning_rate": 1.3363676671286184e-05, "loss": 0.0062, "step": 21264 }, { "epoch": 4.33, "learning_rate": 1.3355679260378154e-05, "loss": 0.0004, "step": 21265 }, { "epoch": 4.33, "learning_rate": 1.3347684131688274e-05, "loss": 0.0005, "step": 21266 }, { "epoch": 4.33, "learning_rate": 1.3339691285349985e-05, "loss": 0.0018, "step": 21267 }, { "epoch": 4.33, "learning_rate": 1.333170072149683e-05, "loss": 0.0023, "step": 21268 }, { "epoch": 4.33, "learning_rate": 1.3323712440262236e-05, "loss": 0.0001, "step": 21269 }, { "epoch": 4.33, "learning_rate": 1.3315726441779629e-05, "loss": 0.001, "step": 21270 }, { "epoch": 4.33, "learning_rate": 1.3307742726182452e-05, "loss": 0.0005, "step": 21271 }, { "epoch": 4.33, "learning_rate": 1.329976129360395e-05, "loss": 0.0033, "step": 21272 }, { "epoch": 4.33, "learning_rate": 1.3291782144177499e-05, "loss": 0.0002, "step": 21273 }, { "epoch": 4.33, "learning_rate": 1.3283805278036326e-05, "loss": 0.0015, "step": 21274 }, { "epoch": 4.33, "learning_rate": 1.3275830695313688e-05, "loss": 0.0034, "step": 21275 }, { "epoch": 4.33, "learning_rate": 1.326785839614275e-05, "loss": 0.0071, "step": 21276 }, { "epoch": 4.33, "learning_rate": 1.3259888380656702e-05, "loss": 0.0007, "step": 21277 }, { "epoch": 4.33, "learning_rate": 1.325192064898859e-05, "loss": 0.0001, "step": 21278 }, { "epoch": 4.33, "learning_rate": 1.3243955201271555e-05, "loss": 0.0017, "step": 21279 }, { "epoch": 4.33, "learning_rate": 1.3235992037638642e-05, "loss": 0.0001, "step": 21280 }, { "epoch": 4.33, "learning_rate": 1.3228031158222762e-05, "loss": 0.0016, "step": 21281 }, { "epoch": 4.33, "learning_rate": 1.3220072563157008e-05, "loss": 0.0035, "step": 21282 }, { "epoch": 4.33, "learning_rate": 1.3212116252574156e-05, "loss": 0.0016, "step": 21283 }, { "epoch": 4.33, "learning_rate": 1.3204162226607235e-05, "loss": 0.0012, "step": 21284 }, { "epoch": 4.33, "learning_rate": 1.3196210485389003e-05, "loss": 0.0032, "step": 21285 }, { "epoch": 4.33, "learning_rate": 1.3188261029052289e-05, "loss": 0.0011, "step": 21286 }, { "epoch": 4.33, "learning_rate": 1.3180313857729852e-05, "loss": 0.0036, "step": 21287 }, { "epoch": 4.33, "learning_rate": 1.3172368971554453e-05, "loss": 0.0005, "step": 21288 }, { "epoch": 4.33, "learning_rate": 1.316442637065877e-05, "loss": 0.0012, "step": 21289 }, { "epoch": 4.34, "learning_rate": 1.3156486055175464e-05, "loss": 0.0004, "step": 21290 }, { "epoch": 4.34, "learning_rate": 1.3148548025237143e-05, "loss": 0.0001, "step": 21291 }, { "epoch": 4.34, "learning_rate": 1.3140612280976404e-05, "loss": 0.0034, "step": 21292 }, { "epoch": 4.34, "learning_rate": 1.3132678822525772e-05, "loss": 0.0003, "step": 21293 }, { "epoch": 4.34, "learning_rate": 1.3124747650017758e-05, "loss": 0.002, "step": 21294 }, { "epoch": 4.34, "learning_rate": 1.3116818763584874e-05, "loss": 0.0007, "step": 21295 }, { "epoch": 4.34, "learning_rate": 1.310889216335943e-05, "loss": 0.0005, "step": 21296 }, { "epoch": 4.34, "learning_rate": 1.3100967849473954e-05, "loss": 0.0086, "step": 21297 }, { "epoch": 4.34, "learning_rate": 1.3093045822060655e-05, "loss": 0.0002, "step": 21298 }, { "epoch": 4.34, "learning_rate": 1.3085126081251995e-05, "loss": 0.0023, "step": 21299 }, { "epoch": 4.34, "learning_rate": 1.3077208627180136e-05, "loss": 0.0008, "step": 21300 }, { "epoch": 4.34, "learning_rate": 1.3069293459977337e-05, "loss": 0.0005, "step": 21301 }, { "epoch": 4.34, "learning_rate": 1.306138057977586e-05, "loss": 0.0022, "step": 21302 }, { "epoch": 4.34, "learning_rate": 1.3053469986707765e-05, "loss": 0.0013, "step": 21303 }, { "epoch": 4.34, "learning_rate": 1.3045561680905281e-05, "loss": 0.0007, "step": 21304 }, { "epoch": 4.34, "learning_rate": 1.3037655662500402e-05, "loss": 0.0065, "step": 21305 }, { "epoch": 4.34, "learning_rate": 1.302975193162522e-05, "loss": 0.0038, "step": 21306 }, { "epoch": 4.34, "learning_rate": 1.3021850488411716e-05, "loss": 0.0033, "step": 21307 }, { "epoch": 4.34, "learning_rate": 1.3013951332991884e-05, "loss": 0.0005, "step": 21308 }, { "epoch": 4.34, "learning_rate": 1.300605446549765e-05, "loss": 0.0016, "step": 21309 }, { "epoch": 4.34, "learning_rate": 1.2998159886060893e-05, "loss": 0.0001, "step": 21310 }, { "epoch": 4.34, "learning_rate": 1.2990267594813474e-05, "loss": 0.0026, "step": 21311 }, { "epoch": 4.34, "learning_rate": 1.2982377591887204e-05, "loss": 0.0013, "step": 21312 }, { "epoch": 4.34, "learning_rate": 1.2974489877413912e-05, "loss": 0.0016, "step": 21313 }, { "epoch": 4.34, "learning_rate": 1.2966604451525225e-05, "loss": 0.0033, "step": 21314 }, { "epoch": 4.34, "learning_rate": 1.295872131435297e-05, "loss": 0.0033, "step": 21315 }, { "epoch": 4.34, "learning_rate": 1.2950840466028694e-05, "loss": 0.0015, "step": 21316 }, { "epoch": 4.34, "learning_rate": 1.2942961906684141e-05, "loss": 0.0, "step": 21317 }, { "epoch": 4.34, "learning_rate": 1.2935085636450804e-05, "loss": 0.002, "step": 21318 }, { "epoch": 4.34, "learning_rate": 1.2927211655460279e-05, "loss": 0.0024, "step": 21319 }, { "epoch": 4.34, "learning_rate": 1.2919339963844061e-05, "loss": 0.0032, "step": 21320 }, { "epoch": 4.34, "learning_rate": 1.291147056173361e-05, "loss": 0.0012, "step": 21321 }, { "epoch": 4.34, "learning_rate": 1.2903603449260374e-05, "loss": 0.0006, "step": 21322 }, { "epoch": 4.34, "learning_rate": 1.2895738626555763e-05, "loss": 0.003, "step": 21323 }, { "epoch": 4.34, "learning_rate": 1.2887876093751104e-05, "loss": 0.0015, "step": 21324 }, { "epoch": 4.34, "learning_rate": 1.2880015850977744e-05, "loss": 0.0067, "step": 21325 }, { "epoch": 4.34, "learning_rate": 1.2872157898366941e-05, "loss": 0.0007, "step": 21326 }, { "epoch": 4.34, "learning_rate": 1.2864302236049961e-05, "loss": 0.0002, "step": 21327 }, { "epoch": 4.34, "learning_rate": 1.2856448864158014e-05, "loss": 0.0001, "step": 21328 }, { "epoch": 4.34, "learning_rate": 1.2848597782822196e-05, "loss": 0.0007, "step": 21329 }, { "epoch": 4.34, "learning_rate": 1.2840748992173732e-05, "loss": 0.0006, "step": 21330 }, { "epoch": 4.34, "learning_rate": 1.2832902492343655e-05, "loss": 0.0003, "step": 21331 }, { "epoch": 4.34, "learning_rate": 1.2825058283462991e-05, "loss": 0.0002, "step": 21332 }, { "epoch": 4.34, "learning_rate": 1.2817216365662853e-05, "loss": 0.0069, "step": 21333 }, { "epoch": 4.34, "learning_rate": 1.2809376739074084e-05, "loss": 0.0004, "step": 21334 }, { "epoch": 4.34, "learning_rate": 1.2801539403827748e-05, "loss": 0.0003, "step": 21335 }, { "epoch": 4.34, "learning_rate": 1.2793704360054658e-05, "loss": 0.002, "step": 21336 }, { "epoch": 4.34, "learning_rate": 1.2785871607885707e-05, "loss": 0.0002, "step": 21337 }, { "epoch": 4.34, "learning_rate": 1.2778041147451706e-05, "loss": 0.0032, "step": 21338 }, { "epoch": 4.35, "learning_rate": 1.2770212978883437e-05, "loss": 0.0036, "step": 21339 }, { "epoch": 4.35, "learning_rate": 1.276238710231166e-05, "loss": 0.0039, "step": 21340 }, { "epoch": 4.35, "learning_rate": 1.2754563517867072e-05, "loss": 0.001, "step": 21341 }, { "epoch": 4.35, "learning_rate": 1.2746742225680334e-05, "loss": 0.0055, "step": 21342 }, { "epoch": 4.35, "learning_rate": 1.2738923225882092e-05, "loss": 0.0056, "step": 21343 }, { "epoch": 4.35, "learning_rate": 1.2731106518602924e-05, "loss": 0.0004, "step": 21344 }, { "epoch": 4.35, "learning_rate": 1.2723292103973393e-05, "loss": 0.0019, "step": 21345 }, { "epoch": 4.35, "learning_rate": 1.2715479982124045e-05, "loss": 0.0011, "step": 21346 }, { "epoch": 4.35, "learning_rate": 1.2707670153185256e-05, "loss": 0.0013, "step": 21347 }, { "epoch": 4.35, "learning_rate": 1.269986261728761e-05, "loss": 0.0006, "step": 21348 }, { "epoch": 4.35, "learning_rate": 1.2692057374561365e-05, "loss": 0.0001, "step": 21349 }, { "epoch": 4.35, "learning_rate": 1.2684254425137002e-05, "loss": 0.0043, "step": 21350 }, { "epoch": 4.35, "learning_rate": 1.267645376914475e-05, "loss": 0.0002, "step": 21351 }, { "epoch": 4.35, "learning_rate": 1.2668655406714957e-05, "loss": 0.0018, "step": 21352 }, { "epoch": 4.35, "learning_rate": 1.2660859337977847e-05, "loss": 0.0002, "step": 21353 }, { "epoch": 4.35, "learning_rate": 1.2653065563063636e-05, "loss": 0.0001, "step": 21354 }, { "epoch": 4.35, "learning_rate": 1.264527408210247e-05, "loss": 0.0037, "step": 21355 }, { "epoch": 4.35, "learning_rate": 1.2637484895224526e-05, "loss": 0.0006, "step": 21356 }, { "epoch": 4.35, "learning_rate": 1.2629698002559869e-05, "loss": 0.0018, "step": 21357 }, { "epoch": 4.35, "learning_rate": 1.2621913404238543e-05, "loss": 0.0015, "step": 21358 }, { "epoch": 4.35, "learning_rate": 1.261413110039063e-05, "loss": 0.0013, "step": 21359 }, { "epoch": 4.35, "learning_rate": 1.2606351091146005e-05, "loss": 0.0003, "step": 21360 }, { "epoch": 4.35, "learning_rate": 1.2598573376634685e-05, "loss": 0.0027, "step": 21361 }, { "epoch": 4.35, "learning_rate": 1.2590797956986548e-05, "loss": 0.0001, "step": 21362 }, { "epoch": 4.35, "learning_rate": 1.2583024832331473e-05, "loss": 0.0006, "step": 21363 }, { "epoch": 4.35, "learning_rate": 1.2575254002799307e-05, "loss": 0.0031, "step": 21364 }, { "epoch": 4.35, "learning_rate": 1.2567485468519744e-05, "loss": 0.0051, "step": 21365 }, { "epoch": 4.35, "learning_rate": 1.2559719229622651e-05, "loss": 0.0001, "step": 21366 }, { "epoch": 4.35, "learning_rate": 1.2551955286237637e-05, "loss": 0.0007, "step": 21367 }, { "epoch": 4.35, "learning_rate": 1.2544193638494466e-05, "loss": 0.004, "step": 21368 }, { "epoch": 4.35, "learning_rate": 1.2536434286522702e-05, "loss": 0.0026, "step": 21369 }, { "epoch": 4.35, "learning_rate": 1.2528677230451972e-05, "loss": 0.0017, "step": 21370 }, { "epoch": 4.35, "learning_rate": 1.2520922470411827e-05, "loss": 0.0008, "step": 21371 }, { "epoch": 4.35, "learning_rate": 1.2513170006531792e-05, "loss": 0.0002, "step": 21372 }, { "epoch": 4.35, "learning_rate": 1.2505419838941332e-05, "loss": 0.0054, "step": 21373 }, { "epoch": 4.35, "learning_rate": 1.2497671967769896e-05, "loss": 0.0, "step": 21374 }, { "epoch": 4.35, "learning_rate": 1.248992639314691e-05, "loss": 0.0002, "step": 21375 }, { "epoch": 4.35, "learning_rate": 1.2482183115201704e-05, "loss": 0.0013, "step": 21376 }, { "epoch": 4.35, "learning_rate": 1.2474442134063628e-05, "loss": 0.0039, "step": 21377 }, { "epoch": 4.35, "learning_rate": 1.2466703449861975e-05, "loss": 0.0005, "step": 21378 }, { "epoch": 4.35, "learning_rate": 1.245896706272601e-05, "loss": 0.0009, "step": 21379 }, { "epoch": 4.35, "learning_rate": 1.2451232972784864e-05, "loss": 0.0003, "step": 21380 }, { "epoch": 4.35, "learning_rate": 1.2443501180167831e-05, "loss": 0.0056, "step": 21381 }, { "epoch": 4.35, "learning_rate": 1.2435771685003943e-05, "loss": 0.0002, "step": 21382 }, { "epoch": 4.35, "learning_rate": 1.2428044487422345e-05, "loss": 0.0012, "step": 21383 }, { "epoch": 4.35, "learning_rate": 1.2420319587552102e-05, "loss": 0.0035, "step": 21384 }, { "epoch": 4.35, "learning_rate": 1.2412596985522178e-05, "loss": 0.0009, "step": 21385 }, { "epoch": 4.35, "learning_rate": 1.2404876681461667e-05, "loss": 0.0098, "step": 21386 }, { "epoch": 4.35, "learning_rate": 1.2397158675499403e-05, "loss": 0.0006, "step": 21387 }, { "epoch": 4.36, "learning_rate": 1.2389442967764346e-05, "loss": 0.0002, "step": 21388 }, { "epoch": 4.36, "learning_rate": 1.2381729558385345e-05, "loss": 0.0027, "step": 21389 }, { "epoch": 4.36, "learning_rate": 1.237401844749123e-05, "loss": 0.0011, "step": 21390 }, { "epoch": 4.36, "learning_rate": 1.2366309635210797e-05, "loss": 0.0012, "step": 21391 }, { "epoch": 4.36, "learning_rate": 1.2358603121672794e-05, "loss": 0.0023, "step": 21392 }, { "epoch": 4.36, "learning_rate": 1.2350898907005934e-05, "loss": 0.0045, "step": 21393 }, { "epoch": 4.36, "learning_rate": 1.23431969913389e-05, "loss": 0.002, "step": 21394 }, { "epoch": 4.36, "learning_rate": 1.2335497374800318e-05, "loss": 0.0001, "step": 21395 }, { "epoch": 4.36, "learning_rate": 1.2327800057518788e-05, "loss": 0.002, "step": 21396 }, { "epoch": 4.36, "learning_rate": 1.2320105039622891e-05, "loss": 0.0056, "step": 21397 }, { "epoch": 4.36, "learning_rate": 1.2312412321241088e-05, "loss": 0.0052, "step": 21398 }, { "epoch": 4.36, "learning_rate": 1.2304721902501962e-05, "loss": 0.0004, "step": 21399 }, { "epoch": 4.36, "learning_rate": 1.2297033783533828e-05, "loss": 0.0001, "step": 21400 }, { "epoch": 4.36, "learning_rate": 1.2289347964465229e-05, "loss": 0.0003, "step": 21401 }, { "epoch": 4.36, "learning_rate": 1.2281664445424433e-05, "loss": 0.0001, "step": 21402 }, { "epoch": 4.36, "learning_rate": 1.2273983226539802e-05, "loss": 0.0005, "step": 21403 }, { "epoch": 4.36, "learning_rate": 1.2266304307939633e-05, "loss": 0.0005, "step": 21404 }, { "epoch": 4.36, "learning_rate": 1.225862768975216e-05, "loss": 0.0002, "step": 21405 }, { "epoch": 4.36, "learning_rate": 1.2250953372105626e-05, "loss": 0.0002, "step": 21406 }, { "epoch": 4.36, "learning_rate": 1.2243281355128182e-05, "loss": 0.0002, "step": 21407 }, { "epoch": 4.36, "learning_rate": 1.2235611638947972e-05, "loss": 0.0005, "step": 21408 }, { "epoch": 4.36, "learning_rate": 1.2227944223693098e-05, "loss": 0.002, "step": 21409 }, { "epoch": 4.36, "learning_rate": 1.2220279109491654e-05, "loss": 0.0001, "step": 21410 }, { "epoch": 4.36, "learning_rate": 1.2212616296471572e-05, "loss": 0.0007, "step": 21411 }, { "epoch": 4.36, "learning_rate": 1.2204955784760934e-05, "loss": 0.0003, "step": 21412 }, { "epoch": 4.36, "learning_rate": 1.2197297574487585e-05, "loss": 0.0008, "step": 21413 }, { "epoch": 4.36, "learning_rate": 1.2189641665779526e-05, "loss": 0.0032, "step": 21414 }, { "epoch": 4.36, "learning_rate": 1.2181988058764603e-05, "loss": 0.0011, "step": 21415 }, { "epoch": 4.36, "learning_rate": 1.217433675357058e-05, "loss": 0.0012, "step": 21416 }, { "epoch": 4.36, "learning_rate": 1.2166687750325355e-05, "loss": 0.0044, "step": 21417 }, { "epoch": 4.36, "learning_rate": 1.215904104915656e-05, "loss": 0.0102, "step": 21418 }, { "epoch": 4.36, "learning_rate": 1.215139665019204e-05, "loss": 0.0005, "step": 21419 }, { "epoch": 4.36, "learning_rate": 1.2143754553559365e-05, "loss": 0.0004, "step": 21420 }, { "epoch": 4.36, "learning_rate": 1.2136114759386212e-05, "loss": 0.0008, "step": 21421 }, { "epoch": 4.36, "learning_rate": 1.2128477267800196e-05, "loss": 0.0003, "step": 21422 }, { "epoch": 4.36, "learning_rate": 1.2120842078928833e-05, "loss": 0.0024, "step": 21423 }, { "epoch": 4.36, "learning_rate": 1.2113209192899686e-05, "loss": 0.0018, "step": 21424 }, { "epoch": 4.36, "learning_rate": 1.2105578609840238e-05, "loss": 0.001, "step": 21425 }, { "epoch": 4.36, "learning_rate": 1.2097950329877903e-05, "loss": 0.0004, "step": 21426 }, { "epoch": 4.36, "learning_rate": 1.2090324353140113e-05, "loss": 0.0024, "step": 21427 }, { "epoch": 4.36, "learning_rate": 1.2082700679754264e-05, "loss": 0.0019, "step": 21428 }, { "epoch": 4.36, "learning_rate": 1.2075079309847591e-05, "loss": 0.0002, "step": 21429 }, { "epoch": 4.36, "learning_rate": 1.2067460243547488e-05, "loss": 0.0001, "step": 21430 }, { "epoch": 4.36, "learning_rate": 1.2059843480981124e-05, "loss": 0.0077, "step": 21431 }, { "epoch": 4.36, "learning_rate": 1.2052229022275795e-05, "loss": 0.0048, "step": 21432 }, { "epoch": 4.36, "learning_rate": 1.2044616867558631e-05, "loss": 0.0017, "step": 21433 }, { "epoch": 4.36, "learning_rate": 1.2037007016956752e-05, "loss": 0.0019, "step": 21434 }, { "epoch": 4.36, "learning_rate": 1.20293994705973e-05, "loss": 0.0002, "step": 21435 }, { "epoch": 4.36, "learning_rate": 1.2021794228607295e-05, "loss": 0.0002, "step": 21436 }, { "epoch": 4.36, "learning_rate": 1.2014191291113784e-05, "loss": 0.0012, "step": 21437 }, { "epoch": 4.37, "learning_rate": 1.2006590658243764e-05, "loss": 0.0011, "step": 21438 }, { "epoch": 4.37, "learning_rate": 1.1998992330124135e-05, "loss": 0.0046, "step": 21439 }, { "epoch": 4.37, "learning_rate": 1.1991396306881845e-05, "loss": 0.0022, "step": 21440 }, { "epoch": 4.37, "learning_rate": 1.1983802588643743e-05, "loss": 0.0029, "step": 21441 }, { "epoch": 4.37, "learning_rate": 1.1976211175536659e-05, "loss": 0.0018, "step": 21442 }, { "epoch": 4.37, "learning_rate": 1.1968622067687412e-05, "loss": 0.0008, "step": 21443 }, { "epoch": 4.37, "learning_rate": 1.1961035265222679e-05, "loss": 0.0033, "step": 21444 }, { "epoch": 4.37, "learning_rate": 1.1953450768269263e-05, "loss": 0.0031, "step": 21445 }, { "epoch": 4.37, "learning_rate": 1.1945868576953776e-05, "loss": 0.0007, "step": 21446 }, { "epoch": 4.37, "learning_rate": 1.1938288691402903e-05, "loss": 0.003, "step": 21447 }, { "epoch": 4.37, "learning_rate": 1.1930711111743225e-05, "loss": 0.0004, "step": 21448 }, { "epoch": 4.37, "learning_rate": 1.1923135838101256e-05, "loss": 0.0029, "step": 21449 }, { "epoch": 4.37, "learning_rate": 1.1915562870603612e-05, "loss": 0.0002, "step": 21450 }, { "epoch": 4.37, "learning_rate": 1.190799220937666e-05, "loss": 0.0031, "step": 21451 }, { "epoch": 4.37, "learning_rate": 1.1900423854546948e-05, "loss": 0.0008, "step": 21452 }, { "epoch": 4.37, "learning_rate": 1.1892857806240825e-05, "loss": 0.0001, "step": 21453 }, { "epoch": 4.37, "learning_rate": 1.1885294064584671e-05, "loss": 0.0008, "step": 21454 }, { "epoch": 4.37, "learning_rate": 1.1877732629704822e-05, "loss": 0.0014, "step": 21455 }, { "epoch": 4.37, "learning_rate": 1.1870173501727559e-05, "loss": 0.001, "step": 21456 }, { "epoch": 4.37, "learning_rate": 1.186261668077913e-05, "loss": 0.0057, "step": 21457 }, { "epoch": 4.37, "learning_rate": 1.1855062166985768e-05, "loss": 0.0003, "step": 21458 }, { "epoch": 4.37, "learning_rate": 1.1847509960473623e-05, "loss": 0.0004, "step": 21459 }, { "epoch": 4.37, "learning_rate": 1.1839960061368842e-05, "loss": 0.0002, "step": 21460 }, { "epoch": 4.37, "learning_rate": 1.183241246979756e-05, "loss": 0.0007, "step": 21461 }, { "epoch": 4.37, "learning_rate": 1.182486718588574e-05, "loss": 0.0008, "step": 21462 }, { "epoch": 4.37, "learning_rate": 1.1817324209759515e-05, "loss": 0.0033, "step": 21463 }, { "epoch": 4.37, "learning_rate": 1.180978354154477e-05, "loss": 0.0017, "step": 21464 }, { "epoch": 4.37, "learning_rate": 1.1802245181367537e-05, "loss": 0.0041, "step": 21465 }, { "epoch": 4.37, "learning_rate": 1.1794709129353646e-05, "loss": 0.0041, "step": 21466 }, { "epoch": 4.37, "learning_rate": 1.1787175385628982e-05, "loss": 0.0043, "step": 21467 }, { "epoch": 4.37, "learning_rate": 1.1779643950319429e-05, "loss": 0.0008, "step": 21468 }, { "epoch": 4.37, "learning_rate": 1.1772114823550665e-05, "loss": 0.0001, "step": 21469 }, { "epoch": 4.37, "learning_rate": 1.1764588005448578e-05, "loss": 0.0001, "step": 21470 }, { "epoch": 4.37, "learning_rate": 1.175706349613878e-05, "loss": 0.0004, "step": 21471 }, { "epoch": 4.37, "learning_rate": 1.1749541295746973e-05, "loss": 0.0004, "step": 21472 }, { "epoch": 4.37, "learning_rate": 1.1742021404398789e-05, "loss": 0.0005, "step": 21473 }, { "epoch": 4.37, "learning_rate": 1.1734503822219826e-05, "loss": 0.0004, "step": 21474 }, { "epoch": 4.37, "learning_rate": 1.1726988549335636e-05, "loss": 0.0037, "step": 21475 }, { "epoch": 4.37, "learning_rate": 1.1719475585871768e-05, "loss": 0.0001, "step": 21476 }, { "epoch": 4.37, "learning_rate": 1.171196493195367e-05, "loss": 0.0011, "step": 21477 }, { "epoch": 4.37, "learning_rate": 1.1704456587706794e-05, "loss": 0.0006, "step": 21478 }, { "epoch": 4.37, "learning_rate": 1.1696950553256556e-05, "loss": 0.0021, "step": 21479 }, { "epoch": 4.37, "learning_rate": 1.1689446828728289e-05, "loss": 0.0044, "step": 21480 }, { "epoch": 4.37, "learning_rate": 1.1681945414247374e-05, "loss": 0.0072, "step": 21481 }, { "epoch": 4.37, "learning_rate": 1.1674446309939012e-05, "loss": 0.0002, "step": 21482 }, { "epoch": 4.37, "learning_rate": 1.1666949515928553e-05, "loss": 0.0048, "step": 21483 }, { "epoch": 4.37, "learning_rate": 1.165945503234113e-05, "loss": 0.0006, "step": 21484 }, { "epoch": 4.37, "learning_rate": 1.1651962859301961e-05, "loss": 0.002, "step": 21485 }, { "epoch": 4.37, "learning_rate": 1.1644472996936144e-05, "loss": 0.0059, "step": 21486 }, { "epoch": 4.38, "learning_rate": 1.1636985445368814e-05, "loss": 0.0083, "step": 21487 }, { "epoch": 4.38, "learning_rate": 1.1629500204724984e-05, "loss": 0.0001, "step": 21488 }, { "epoch": 4.38, "learning_rate": 1.1622017275129708e-05, "loss": 0.0018, "step": 21489 }, { "epoch": 4.38, "learning_rate": 1.1614536656707934e-05, "loss": 0.002, "step": 21490 }, { "epoch": 4.38, "learning_rate": 1.160705834958463e-05, "loss": 0.0002, "step": 21491 }, { "epoch": 4.38, "learning_rate": 1.1599582353884696e-05, "loss": 0.0025, "step": 21492 }, { "epoch": 4.38, "learning_rate": 1.159210866973298e-05, "loss": 0.0013, "step": 21493 }, { "epoch": 4.38, "learning_rate": 1.1584637297254334e-05, "loss": 0.0008, "step": 21494 }, { "epoch": 4.38, "learning_rate": 1.1577168236573475e-05, "loss": 0.0016, "step": 21495 }, { "epoch": 4.38, "learning_rate": 1.1569701487815236e-05, "loss": 0.003, "step": 21496 }, { "epoch": 4.38, "learning_rate": 1.1562237051104251e-05, "loss": 0.0007, "step": 21497 }, { "epoch": 4.38, "learning_rate": 1.1554774926565252e-05, "loss": 0.0014, "step": 21498 }, { "epoch": 4.38, "learning_rate": 1.1547315114322875e-05, "loss": 0.0023, "step": 21499 }, { "epoch": 4.38, "learning_rate": 1.1539857614501619e-05, "loss": 0.001, "step": 21500 }, { "epoch": 4.38, "learning_rate": 1.1532402427226167e-05, "loss": 0.0012, "step": 21501 }, { "epoch": 4.38, "learning_rate": 1.1524949552620938e-05, "loss": 0.0002, "step": 21502 }, { "epoch": 4.38, "learning_rate": 1.1517498990810431e-05, "loss": 0.0033, "step": 21503 }, { "epoch": 4.38, "learning_rate": 1.1510050741919113e-05, "loss": 0.0024, "step": 21504 }, { "epoch": 4.38, "learning_rate": 1.1502604806071369e-05, "loss": 0.0013, "step": 21505 }, { "epoch": 4.38, "learning_rate": 1.1495161183391532e-05, "loss": 0.0001, "step": 21506 }, { "epoch": 4.38, "learning_rate": 1.148771987400397e-05, "loss": 0.002, "step": 21507 }, { "epoch": 4.38, "learning_rate": 1.148028087803295e-05, "loss": 0.0001, "step": 21508 }, { "epoch": 4.38, "learning_rate": 1.1472844195602705e-05, "loss": 0.0017, "step": 21509 }, { "epoch": 4.38, "learning_rate": 1.1465409826837452e-05, "loss": 0.0014, "step": 21510 }, { "epoch": 4.38, "learning_rate": 1.145797777186136e-05, "loss": 0.0005, "step": 21511 }, { "epoch": 4.38, "learning_rate": 1.1450548030798561e-05, "loss": 0.0008, "step": 21512 }, { "epoch": 4.38, "learning_rate": 1.144312060377311e-05, "loss": 0.0009, "step": 21513 }, { "epoch": 4.38, "learning_rate": 1.1435695490909137e-05, "loss": 0.0028, "step": 21514 }, { "epoch": 4.38, "learning_rate": 1.1428272692330559e-05, "loss": 0.0025, "step": 21515 }, { "epoch": 4.38, "learning_rate": 1.1420852208161447e-05, "loss": 0.0012, "step": 21516 }, { "epoch": 4.38, "learning_rate": 1.1413434038525665e-05, "loss": 0.0008, "step": 21517 }, { "epoch": 4.38, "learning_rate": 1.140601818354715e-05, "loss": 0.0031, "step": 21518 }, { "epoch": 4.38, "learning_rate": 1.1398604643349718e-05, "loss": 0.003, "step": 21519 }, { "epoch": 4.38, "learning_rate": 1.139119341805722e-05, "loss": 0.002, "step": 21520 }, { "epoch": 4.38, "learning_rate": 1.1383784507793459e-05, "loss": 0.0018, "step": 21521 }, { "epoch": 4.38, "learning_rate": 1.137637791268215e-05, "loss": 0.0001, "step": 21522 }, { "epoch": 4.38, "learning_rate": 1.1368973632846979e-05, "loss": 0.0026, "step": 21523 }, { "epoch": 4.38, "learning_rate": 1.1361571668411646e-05, "loss": 0.0029, "step": 21524 }, { "epoch": 4.38, "learning_rate": 1.1354172019499768e-05, "loss": 0.0003, "step": 21525 }, { "epoch": 4.38, "learning_rate": 1.1346774686234933e-05, "loss": 0.0076, "step": 21526 }, { "epoch": 4.38, "learning_rate": 1.1339379668740672e-05, "loss": 0.0012, "step": 21527 }, { "epoch": 4.38, "learning_rate": 1.1331986967140521e-05, "loss": 0.0051, "step": 21528 }, { "epoch": 4.38, "learning_rate": 1.1324596581557931e-05, "loss": 0.0023, "step": 21529 }, { "epoch": 4.38, "learning_rate": 1.1317208512116388e-05, "loss": 0.0039, "step": 21530 }, { "epoch": 4.38, "learning_rate": 1.1309822758939191e-05, "loss": 0.0003, "step": 21531 }, { "epoch": 4.38, "learning_rate": 1.1302439322149792e-05, "loss": 0.004, "step": 21532 }, { "epoch": 4.38, "learning_rate": 1.1295058201871426e-05, "loss": 0.0018, "step": 21533 }, { "epoch": 4.38, "learning_rate": 1.1287679398227446e-05, "loss": 0.001, "step": 21534 }, { "epoch": 4.38, "learning_rate": 1.1280302911341049e-05, "loss": 0.0022, "step": 21535 }, { "epoch": 4.39, "learning_rate": 1.1272928741335441e-05, "loss": 0.0009, "step": 21536 }, { "epoch": 4.39, "learning_rate": 1.1265556888333788e-05, "loss": 0.0011, "step": 21537 }, { "epoch": 4.39, "learning_rate": 1.1258187352459225e-05, "loss": 0.0005, "step": 21538 }, { "epoch": 4.39, "learning_rate": 1.1250820133834804e-05, "loss": 0.0005, "step": 21539 }, { "epoch": 4.39, "learning_rate": 1.124345523258361e-05, "loss": 0.0002, "step": 21540 }, { "epoch": 4.39, "learning_rate": 1.1236092648828642e-05, "loss": 0.0013, "step": 21541 }, { "epoch": 4.39, "learning_rate": 1.122873238269284e-05, "loss": 0.0025, "step": 21542 }, { "epoch": 4.39, "learning_rate": 1.1221374434299169e-05, "loss": 0.0008, "step": 21543 }, { "epoch": 4.39, "learning_rate": 1.1214018803770513e-05, "loss": 0.0024, "step": 21544 }, { "epoch": 4.39, "learning_rate": 1.1206665491229744e-05, "loss": 0.0063, "step": 21545 }, { "epoch": 4.39, "learning_rate": 1.1199314496799594e-05, "loss": 0.001, "step": 21546 }, { "epoch": 4.39, "learning_rate": 1.119196582060295e-05, "loss": 0.0028, "step": 21547 }, { "epoch": 4.39, "learning_rate": 1.1184619462762446e-05, "loss": 0.0032, "step": 21548 }, { "epoch": 4.39, "learning_rate": 1.1177275423400883e-05, "loss": 0.0037, "step": 21549 }, { "epoch": 4.39, "learning_rate": 1.1169933702640848e-05, "loss": 0.0061, "step": 21550 }, { "epoch": 4.39, "learning_rate": 1.1162594300604943e-05, "loss": 0.0009, "step": 21551 }, { "epoch": 4.39, "learning_rate": 1.1155257217415836e-05, "loss": 0.002, "step": 21552 }, { "epoch": 4.39, "learning_rate": 1.1147922453196012e-05, "loss": 0.0003, "step": 21553 }, { "epoch": 4.39, "learning_rate": 1.1140590008067973e-05, "loss": 0.0009, "step": 21554 }, { "epoch": 4.39, "learning_rate": 1.1133259882154205e-05, "loss": 0.0018, "step": 21555 }, { "epoch": 4.39, "learning_rate": 1.112593207557711e-05, "loss": 0.0001, "step": 21556 }, { "epoch": 4.39, "learning_rate": 1.1118606588459107e-05, "loss": 0.0005, "step": 21557 }, { "epoch": 4.39, "learning_rate": 1.1111283420922528e-05, "loss": 0.0001, "step": 21558 }, { "epoch": 4.39, "learning_rate": 1.110396257308968e-05, "loss": 0.0002, "step": 21559 }, { "epoch": 4.39, "learning_rate": 1.1096644045082848e-05, "loss": 0.0024, "step": 21560 }, { "epoch": 4.39, "learning_rate": 1.1089327837024265e-05, "loss": 0.009, "step": 21561 }, { "epoch": 4.39, "learning_rate": 1.1082013949036116e-05, "loss": 0.0035, "step": 21562 }, { "epoch": 4.39, "learning_rate": 1.1074702381240574e-05, "loss": 0.0002, "step": 21563 }, { "epoch": 4.39, "learning_rate": 1.1067393133759705e-05, "loss": 0.0113, "step": 21564 }, { "epoch": 4.39, "learning_rate": 1.1060086206715663e-05, "loss": 0.002, "step": 21565 }, { "epoch": 4.39, "learning_rate": 1.1052781600230415e-05, "loss": 0.002, "step": 21566 }, { "epoch": 4.39, "learning_rate": 1.1045479314426032e-05, "loss": 0.0005, "step": 21567 }, { "epoch": 4.39, "learning_rate": 1.1038179349424431e-05, "loss": 0.0059, "step": 21568 }, { "epoch": 4.39, "learning_rate": 1.1030881705347533e-05, "loss": 0.001, "step": 21569 }, { "epoch": 4.39, "learning_rate": 1.1023586382317224e-05, "loss": 0.0025, "step": 21570 }, { "epoch": 4.39, "learning_rate": 1.1016293380455371e-05, "loss": 0.0004, "step": 21571 }, { "epoch": 4.39, "learning_rate": 1.1009002699883763e-05, "loss": 0.0002, "step": 21572 }, { "epoch": 4.39, "learning_rate": 1.1001714340724182e-05, "loss": 0.0001, "step": 21573 }, { "epoch": 4.39, "learning_rate": 1.0994428303098335e-05, "loss": 0.0032, "step": 21574 }, { "epoch": 4.39, "learning_rate": 1.0987144587127939e-05, "loss": 0.0025, "step": 21575 }, { "epoch": 4.39, "learning_rate": 1.0979863192934663e-05, "loss": 0.0004, "step": 21576 }, { "epoch": 4.39, "learning_rate": 1.0972584120640026e-05, "loss": 0.0011, "step": 21577 }, { "epoch": 4.39, "learning_rate": 1.0965307370365733e-05, "loss": 0.0005, "step": 21578 }, { "epoch": 4.39, "learning_rate": 1.0958032942233186e-05, "loss": 0.0001, "step": 21579 }, { "epoch": 4.39, "learning_rate": 1.0950760836363987e-05, "loss": 0.0003, "step": 21580 }, { "epoch": 4.39, "learning_rate": 1.0943491052879587e-05, "loss": 0.0021, "step": 21581 }, { "epoch": 4.39, "learning_rate": 1.0936223591901311e-05, "loss": 0.003, "step": 21582 }, { "epoch": 4.39, "learning_rate": 1.0928958453550658e-05, "loss": 0.0001, "step": 21583 }, { "epoch": 4.39, "learning_rate": 1.0921695637948863e-05, "loss": 0.0021, "step": 21584 }, { "epoch": 4.4, "learning_rate": 1.0914435145217332e-05, "loss": 0.0003, "step": 21585 }, { "epoch": 4.4, "learning_rate": 1.090717697547725e-05, "loss": 0.0017, "step": 21586 }, { "epoch": 4.4, "learning_rate": 1.0899921128849854e-05, "loss": 0.0002, "step": 21587 }, { "epoch": 4.4, "learning_rate": 1.0892667605456362e-05, "loss": 0.0103, "step": 21588 }, { "epoch": 4.4, "learning_rate": 1.0885416405417897e-05, "loss": 0.0042, "step": 21589 }, { "epoch": 4.4, "learning_rate": 1.0878167528855592e-05, "loss": 0.001, "step": 21590 }, { "epoch": 4.4, "learning_rate": 1.0870920975890485e-05, "loss": 0.0002, "step": 21591 }, { "epoch": 4.4, "learning_rate": 1.0863676746643629e-05, "loss": 0.001, "step": 21592 }, { "epoch": 4.4, "learning_rate": 1.0856434841235994e-05, "loss": 0.0001, "step": 21593 }, { "epoch": 4.4, "learning_rate": 1.0849195259788568e-05, "loss": 0.0019, "step": 21594 }, { "epoch": 4.4, "learning_rate": 1.0841958002422235e-05, "loss": 0.0027, "step": 21595 }, { "epoch": 4.4, "learning_rate": 1.0834723069257916e-05, "loss": 0.0008, "step": 21596 }, { "epoch": 4.4, "learning_rate": 1.0827490460416366e-05, "loss": 0.0002, "step": 21597 }, { "epoch": 4.4, "learning_rate": 1.0820260176018486e-05, "loss": 0.0001, "step": 21598 }, { "epoch": 4.4, "learning_rate": 1.0813032216184913e-05, "loss": 0.0056, "step": 21599 }, { "epoch": 4.4, "learning_rate": 1.0805806581036503e-05, "loss": 0.0037, "step": 21600 }, { "epoch": 4.4, "learning_rate": 1.079858327069384e-05, "loss": 0.0035, "step": 21601 }, { "epoch": 4.4, "learning_rate": 1.0791362285277594e-05, "loss": 0.0047, "step": 21602 }, { "epoch": 4.4, "learning_rate": 1.078414362490837e-05, "loss": 0.0013, "step": 21603 }, { "epoch": 4.4, "learning_rate": 1.0776927289706754e-05, "loss": 0.0001, "step": 21604 }, { "epoch": 4.4, "learning_rate": 1.0769713279793234e-05, "loss": 0.0002, "step": 21605 }, { "epoch": 4.4, "learning_rate": 1.0762501595288332e-05, "loss": 0.0003, "step": 21606 }, { "epoch": 4.4, "learning_rate": 1.075529223631248e-05, "loss": 0.0037, "step": 21607 }, { "epoch": 4.4, "learning_rate": 1.0748085202986084e-05, "loss": 0.0001, "step": 21608 }, { "epoch": 4.4, "learning_rate": 1.074088049542955e-05, "loss": 0.0001, "step": 21609 }, { "epoch": 4.4, "learning_rate": 1.0733678113763128e-05, "loss": 0.0001, "step": 21610 }, { "epoch": 4.4, "learning_rate": 1.0726478058107192e-05, "loss": 0.0011, "step": 21611 }, { "epoch": 4.4, "learning_rate": 1.0719280328581976e-05, "loss": 0.0033, "step": 21612 }, { "epoch": 4.4, "learning_rate": 1.0712084925307685e-05, "loss": 0.0007, "step": 21613 }, { "epoch": 4.4, "learning_rate": 1.0704891848404522e-05, "loss": 0.0003, "step": 21614 }, { "epoch": 4.4, "learning_rate": 1.0697701097992561e-05, "loss": 0.0016, "step": 21615 }, { "epoch": 4.4, "learning_rate": 1.0690512674191986e-05, "loss": 0.001, "step": 21616 }, { "epoch": 4.4, "learning_rate": 1.0683326577122769e-05, "loss": 0.001, "step": 21617 }, { "epoch": 4.4, "learning_rate": 1.067614280690503e-05, "loss": 0.0001, "step": 21618 }, { "epoch": 4.4, "learning_rate": 1.0668961363658674e-05, "loss": 0.0031, "step": 21619 }, { "epoch": 4.4, "learning_rate": 1.066178224750367e-05, "loss": 0.0037, "step": 21620 }, { "epoch": 4.4, "learning_rate": 1.0654605458559905e-05, "loss": 0.0027, "step": 21621 }, { "epoch": 4.4, "learning_rate": 1.0647430996947287e-05, "loss": 0.0013, "step": 21622 }, { "epoch": 4.4, "learning_rate": 1.06402588627856e-05, "loss": 0.002, "step": 21623 }, { "epoch": 4.4, "learning_rate": 1.0633089056194649e-05, "loss": 0.0008, "step": 21624 }, { "epoch": 4.4, "learning_rate": 1.0625921577294189e-05, "loss": 0.0008, "step": 21625 }, { "epoch": 4.4, "learning_rate": 1.061875642620394e-05, "loss": 0.0001, "step": 21626 }, { "epoch": 4.4, "learning_rate": 1.0611593603043573e-05, "loss": 0.001, "step": 21627 }, { "epoch": 4.4, "learning_rate": 1.0604433107932658e-05, "loss": 0.0035, "step": 21628 }, { "epoch": 4.4, "learning_rate": 1.0597274940990885e-05, "loss": 0.0012, "step": 21629 }, { "epoch": 4.4, "learning_rate": 1.0590119102337707e-05, "loss": 0.0033, "step": 21630 }, { "epoch": 4.4, "learning_rate": 1.0582965592092747e-05, "loss": 0.0003, "step": 21631 }, { "epoch": 4.4, "learning_rate": 1.0575814410375404e-05, "loss": 0.0015, "step": 21632 }, { "epoch": 4.4, "learning_rate": 1.0568665557305123e-05, "loss": 0.0001, "step": 21633 }, { "epoch": 4.41, "learning_rate": 1.056151903300137e-05, "loss": 0.0015, "step": 21634 }, { "epoch": 4.41, "learning_rate": 1.0554374837583418e-05, "loss": 0.0005, "step": 21635 }, { "epoch": 4.41, "learning_rate": 1.0547232971170671e-05, "loss": 0.001, "step": 21636 }, { "epoch": 4.41, "learning_rate": 1.0540093433882336e-05, "loss": 0.005, "step": 21637 }, { "epoch": 4.41, "learning_rate": 1.0532956225837697e-05, "loss": 0.0015, "step": 21638 }, { "epoch": 4.41, "learning_rate": 1.052582134715596e-05, "loss": 0.0011, "step": 21639 }, { "epoch": 4.41, "learning_rate": 1.0518688797956265e-05, "loss": 0.0013, "step": 21640 }, { "epoch": 4.41, "learning_rate": 1.0511558578357765e-05, "loss": 0.0021, "step": 21641 }, { "epoch": 4.41, "learning_rate": 1.0504430688479548e-05, "loss": 0.0037, "step": 21642 }, { "epoch": 4.41, "learning_rate": 1.0497305128440653e-05, "loss": 0.0006, "step": 21643 }, { "epoch": 4.41, "learning_rate": 1.0490181898360084e-05, "loss": 0.0013, "step": 21644 }, { "epoch": 4.41, "learning_rate": 1.0483060998356813e-05, "loss": 0.0002, "step": 21645 }, { "epoch": 4.41, "learning_rate": 1.0475942428549793e-05, "loss": 0.0008, "step": 21646 }, { "epoch": 4.41, "learning_rate": 1.0468826189057933e-05, "loss": 0.0021, "step": 21647 }, { "epoch": 4.41, "learning_rate": 1.0461712280000001e-05, "loss": 0.0, "step": 21648 }, { "epoch": 4.41, "learning_rate": 1.045460070149492e-05, "loss": 0.0033, "step": 21649 }, { "epoch": 4.41, "learning_rate": 1.0447491453661394e-05, "loss": 0.0001, "step": 21650 }, { "epoch": 4.41, "learning_rate": 1.0440384536618197e-05, "loss": 0.0038, "step": 21651 }, { "epoch": 4.41, "learning_rate": 1.0433279950484013e-05, "loss": 0.0024, "step": 21652 }, { "epoch": 4.41, "learning_rate": 1.0426177695377486e-05, "loss": 0.0001, "step": 21653 }, { "epoch": 4.41, "learning_rate": 1.0419077771417266e-05, "loss": 0.0044, "step": 21654 }, { "epoch": 4.41, "learning_rate": 1.0411980178721929e-05, "loss": 0.0004, "step": 21655 }, { "epoch": 4.41, "learning_rate": 1.0404884917410012e-05, "loss": 0.0021, "step": 21656 }, { "epoch": 4.41, "learning_rate": 1.0397791987600017e-05, "loss": 0.0025, "step": 21657 }, { "epoch": 4.41, "learning_rate": 1.0390701389410422e-05, "loss": 0.0014, "step": 21658 }, { "epoch": 4.41, "learning_rate": 1.0383613122959643e-05, "loss": 0.001, "step": 21659 }, { "epoch": 4.41, "learning_rate": 1.037652718836609e-05, "loss": 0.0064, "step": 21660 }, { "epoch": 4.41, "learning_rate": 1.0369443585748049e-05, "loss": 0.0002, "step": 21661 }, { "epoch": 4.41, "learning_rate": 1.036236231522391e-05, "loss": 0.0003, "step": 21662 }, { "epoch": 4.41, "learning_rate": 1.0355283376911861e-05, "loss": 0.0001, "step": 21663 }, { "epoch": 4.41, "learning_rate": 1.0348206770930207e-05, "loss": 0.001, "step": 21664 }, { "epoch": 4.41, "learning_rate": 1.0341132497397136e-05, "loss": 0.0036, "step": 21665 }, { "epoch": 4.41, "learning_rate": 1.0334060556430723e-05, "loss": 0.0043, "step": 21666 }, { "epoch": 4.41, "learning_rate": 1.0326990948149188e-05, "loss": 0.0027, "step": 21667 }, { "epoch": 4.41, "learning_rate": 1.0319923672670504e-05, "loss": 0.0094, "step": 21668 }, { "epoch": 4.41, "learning_rate": 1.0312858730112811e-05, "loss": 0.0001, "step": 21669 }, { "epoch": 4.41, "learning_rate": 1.0305796120594028e-05, "loss": 0.0024, "step": 21670 }, { "epoch": 4.41, "learning_rate": 1.029873584423213e-05, "loss": 0.0001, "step": 21671 }, { "epoch": 4.41, "learning_rate": 1.0291677901145073e-05, "loss": 0.0003, "step": 21672 }, { "epoch": 4.41, "learning_rate": 1.0284622291450695e-05, "loss": 0.0002, "step": 21673 }, { "epoch": 4.41, "learning_rate": 1.0277569015266867e-05, "loss": 0.0023, "step": 21674 }, { "epoch": 4.41, "learning_rate": 1.0270518072711365e-05, "loss": 0.0012, "step": 21675 }, { "epoch": 4.41, "learning_rate": 1.0263469463901991e-05, "loss": 0.0009, "step": 21676 }, { "epoch": 4.41, "learning_rate": 1.0256423188956437e-05, "loss": 0.0006, "step": 21677 }, { "epoch": 4.41, "learning_rate": 1.0249379247992424e-05, "loss": 0.0018, "step": 21678 }, { "epoch": 4.41, "learning_rate": 1.0242337641127523e-05, "loss": 0.0054, "step": 21679 }, { "epoch": 4.41, "learning_rate": 1.023529836847946e-05, "loss": 0.0004, "step": 21680 }, { "epoch": 4.41, "learning_rate": 1.0228261430165674e-05, "loss": 0.0002, "step": 21681 }, { "epoch": 4.41, "learning_rate": 1.0221226826303819e-05, "loss": 0.0018, "step": 21682 }, { "epoch": 4.42, "learning_rate": 1.0214194557011285e-05, "loss": 0.0056, "step": 21683 }, { "epoch": 4.42, "learning_rate": 1.0207164622405579e-05, "loss": 0.0008, "step": 21684 }, { "epoch": 4.42, "learning_rate": 1.0200137022604105e-05, "loss": 0.0066, "step": 21685 }, { "epoch": 4.42, "learning_rate": 1.0193111757724203e-05, "loss": 0.0003, "step": 21686 }, { "epoch": 4.42, "learning_rate": 1.0186088827883299e-05, "loss": 0.0001, "step": 21687 }, { "epoch": 4.42, "learning_rate": 1.0179068233198595e-05, "loss": 0.0001, "step": 21688 }, { "epoch": 4.42, "learning_rate": 1.0172049973787383e-05, "loss": 0.008, "step": 21689 }, { "epoch": 4.42, "learning_rate": 1.0165034049766885e-05, "loss": 0.0002, "step": 21690 }, { "epoch": 4.42, "learning_rate": 1.0158020461254258e-05, "loss": 0.0041, "step": 21691 }, { "epoch": 4.42, "learning_rate": 1.0151009208366672e-05, "loss": 0.0003, "step": 21692 }, { "epoch": 4.42, "learning_rate": 1.0144000291221221e-05, "loss": 0.004, "step": 21693 }, { "epoch": 4.42, "learning_rate": 1.013699370993496e-05, "loss": 0.0016, "step": 21694 }, { "epoch": 4.42, "learning_rate": 1.012998946462491e-05, "loss": 0.0007, "step": 21695 }, { "epoch": 4.42, "learning_rate": 1.0122987555408063e-05, "loss": 0.0054, "step": 21696 }, { "epoch": 4.42, "learning_rate": 1.0115987982401357e-05, "loss": 0.0004, "step": 21697 }, { "epoch": 4.42, "learning_rate": 1.0108990745721734e-05, "loss": 0.0006, "step": 21698 }, { "epoch": 4.42, "learning_rate": 1.0101995845485966e-05, "loss": 0.0006, "step": 21699 }, { "epoch": 4.42, "learning_rate": 1.0095003281810993e-05, "loss": 0.0036, "step": 21700 }, { "epoch": 4.42, "learning_rate": 1.0088013054813538e-05, "loss": 0.002, "step": 21701 }, { "epoch": 4.42, "learning_rate": 1.0081025164610373e-05, "loss": 0.0032, "step": 21702 }, { "epoch": 4.42, "learning_rate": 1.0074039611318192e-05, "loss": 0.0001, "step": 21703 }, { "epoch": 4.42, "learning_rate": 1.006705639505368e-05, "loss": 0.0004, "step": 21704 }, { "epoch": 4.42, "learning_rate": 1.006007551593348e-05, "loss": 0.0026, "step": 21705 }, { "epoch": 4.42, "learning_rate": 1.0053096974074165e-05, "loss": 0.0006, "step": 21706 }, { "epoch": 4.42, "learning_rate": 1.0046120769592308e-05, "loss": 0.0042, "step": 21707 }, { "epoch": 4.42, "learning_rate": 1.00391469026044e-05, "loss": 0.0019, "step": 21708 }, { "epoch": 4.42, "learning_rate": 1.0032175373226947e-05, "loss": 0.0025, "step": 21709 }, { "epoch": 4.42, "learning_rate": 1.0025206181576356e-05, "loss": 0.0033, "step": 21710 }, { "epoch": 4.42, "learning_rate": 1.0018239327769084e-05, "loss": 0.0016, "step": 21711 }, { "epoch": 4.42, "learning_rate": 1.0011274811921388e-05, "loss": 0.0014, "step": 21712 }, { "epoch": 4.42, "learning_rate": 1.0004312634149708e-05, "loss": 0.0001, "step": 21713 }, { "epoch": 4.42, "learning_rate": 9.997352794570217e-06, "loss": 0.0008, "step": 21714 }, { "epoch": 4.42, "learning_rate": 9.990395293299257e-06, "loss": 0.0033, "step": 21715 }, { "epoch": 4.42, "learning_rate": 9.983440130452968e-06, "loss": 0.0036, "step": 21716 }, { "epoch": 4.42, "learning_rate": 9.97648730614749e-06, "loss": 0.003, "step": 21717 }, { "epoch": 4.42, "learning_rate": 9.969536820499047e-06, "loss": 0.0003, "step": 21718 }, { "epoch": 4.42, "learning_rate": 9.962588673623611e-06, "loss": 0.0043, "step": 21719 }, { "epoch": 4.42, "learning_rate": 9.955642865637326e-06, "loss": 0.0032, "step": 21720 }, { "epoch": 4.42, "learning_rate": 9.94869939665613e-06, "loss": 0.0001, "step": 21721 }, { "epoch": 4.42, "learning_rate": 9.941758266796029e-06, "loss": 0.0022, "step": 21722 }, { "epoch": 4.42, "learning_rate": 9.93481947617295e-06, "loss": 0.0004, "step": 21723 }, { "epoch": 4.42, "learning_rate": 9.927883024902766e-06, "loss": 0.0005, "step": 21724 }, { "epoch": 4.42, "learning_rate": 9.920948913101351e-06, "loss": 0.0003, "step": 21725 }, { "epoch": 4.42, "learning_rate": 9.914017140884495e-06, "loss": 0.0028, "step": 21726 }, { "epoch": 4.42, "learning_rate": 9.907087708367989e-06, "loss": 0.0011, "step": 21727 }, { "epoch": 4.42, "learning_rate": 9.900160615667574e-06, "loss": 0.0015, "step": 21728 }, { "epoch": 4.42, "learning_rate": 9.893235862898941e-06, "loss": 0.0012, "step": 21729 }, { "epoch": 4.42, "learning_rate": 9.886313450177696e-06, "loss": 0.0, "step": 21730 }, { "epoch": 4.42, "learning_rate": 9.87939337761955e-06, "loss": 0.0003, "step": 21731 }, { "epoch": 4.43, "learning_rate": 9.872475645339971e-06, "loss": 0.0021, "step": 21732 }, { "epoch": 4.43, "learning_rate": 9.865560253454624e-06, "loss": 0.0018, "step": 21733 }, { "epoch": 4.43, "learning_rate": 9.858647202078913e-06, "loss": 0.0002, "step": 21734 }, { "epoch": 4.43, "learning_rate": 9.851736491328326e-06, "loss": 0.0037, "step": 21735 }, { "epoch": 4.43, "learning_rate": 9.844828121318294e-06, "loss": 0.0008, "step": 21736 }, { "epoch": 4.43, "learning_rate": 9.837922092164186e-06, "loss": 0.0007, "step": 21737 }, { "epoch": 4.43, "learning_rate": 9.831018403981362e-06, "loss": 0.0002, "step": 21738 }, { "epoch": 4.43, "learning_rate": 9.824117056885111e-06, "loss": 0.0013, "step": 21739 }, { "epoch": 4.43, "learning_rate": 9.81721805099071e-06, "loss": 0.0043, "step": 21740 }, { "epoch": 4.43, "learning_rate": 9.810321386413384e-06, "loss": 0.0187, "step": 21741 }, { "epoch": 4.43, "learning_rate": 9.80342706326832e-06, "loss": 0.0012, "step": 21742 }, { "epoch": 4.43, "learning_rate": 9.796535081670648e-06, "loss": 0.0007, "step": 21743 }, { "epoch": 4.43, "learning_rate": 9.789645441735539e-06, "loss": 0.0023, "step": 21744 }, { "epoch": 4.43, "learning_rate": 9.782758143577952e-06, "loss": 0.0027, "step": 21745 }, { "epoch": 4.43, "learning_rate": 9.77587318731301e-06, "loss": 0.0001, "step": 21746 }, { "epoch": 4.43, "learning_rate": 9.768990573055673e-06, "loss": 0.0006, "step": 21747 }, { "epoch": 4.43, "learning_rate": 9.762110300920916e-06, "loss": 0.0014, "step": 21748 }, { "epoch": 4.43, "learning_rate": 9.755232371023647e-06, "loss": 0.0009, "step": 21749 }, { "epoch": 4.43, "learning_rate": 9.748356783478672e-06, "loss": 0.0035, "step": 21750 }, { "epoch": 4.43, "learning_rate": 9.741483538400952e-06, "loss": 0.0005, "step": 21751 }, { "epoch": 4.43, "learning_rate": 9.734612635905175e-06, "loss": 0.0011, "step": 21752 }, { "epoch": 4.43, "learning_rate": 9.727744076106136e-06, "loss": 0.0006, "step": 21753 }, { "epoch": 4.43, "learning_rate": 9.720877859118558e-06, "loss": 0.0, "step": 21754 }, { "epoch": 4.43, "learning_rate": 9.714013985057101e-06, "loss": 0.0009, "step": 21755 }, { "epoch": 4.43, "learning_rate": 9.707152454036437e-06, "loss": 0.0016, "step": 21756 }, { "epoch": 4.43, "learning_rate": 9.700293266171144e-06, "loss": 0.0033, "step": 21757 }, { "epoch": 4.43, "learning_rate": 9.693436421575778e-06, "loss": 0.0026, "step": 21758 }, { "epoch": 4.43, "learning_rate": 9.686581920364883e-06, "loss": 0.0016, "step": 21759 }, { "epoch": 4.43, "learning_rate": 9.679729762652932e-06, "loss": 0.0009, "step": 21760 }, { "epoch": 4.43, "learning_rate": 9.672879948554369e-06, "loss": 0.0026, "step": 21761 }, { "epoch": 4.43, "learning_rate": 9.6660324781836e-06, "loss": 0.0012, "step": 21762 }, { "epoch": 4.43, "learning_rate": 9.659187351654968e-06, "loss": 0.0041, "step": 21763 }, { "epoch": 4.43, "learning_rate": 9.652344569082848e-06, "loss": 0.0004, "step": 21764 }, { "epoch": 4.43, "learning_rate": 9.645504130581449e-06, "loss": 0.0003, "step": 21765 }, { "epoch": 4.43, "learning_rate": 9.63866603626513e-06, "loss": 0.0003, "step": 21766 }, { "epoch": 4.43, "learning_rate": 9.631830286248015e-06, "loss": 0.0002, "step": 21767 }, { "epoch": 4.43, "learning_rate": 9.624996880644281e-06, "loss": 0.0038, "step": 21768 }, { "epoch": 4.43, "learning_rate": 9.618165819568085e-06, "loss": 0.0001, "step": 21769 }, { "epoch": 4.43, "learning_rate": 9.611337103133487e-06, "loss": 0.0007, "step": 21770 }, { "epoch": 4.43, "learning_rate": 9.604510731454612e-06, "loss": 0.0008, "step": 21771 }, { "epoch": 4.43, "learning_rate": 9.597686704645402e-06, "loss": 0.0001, "step": 21772 }, { "epoch": 4.43, "learning_rate": 9.59086502281985e-06, "loss": 0.0009, "step": 21773 }, { "epoch": 4.43, "learning_rate": 9.58404568609188e-06, "loss": 0.0015, "step": 21774 }, { "epoch": 4.43, "learning_rate": 9.577228694575433e-06, "loss": 0.0007, "step": 21775 }, { "epoch": 4.43, "learning_rate": 9.57041404838429e-06, "loss": 0.0015, "step": 21776 }, { "epoch": 4.43, "learning_rate": 9.563601747632337e-06, "loss": 0.0004, "step": 21777 }, { "epoch": 4.43, "learning_rate": 9.556791792433322e-06, "loss": 0.0003, "step": 21778 }, { "epoch": 4.43, "learning_rate": 9.549984182901e-06, "loss": 0.0003, "step": 21779 }, { "epoch": 4.43, "learning_rate": 9.543178919149063e-06, "loss": 0.0001, "step": 21780 }, { "epoch": 4.44, "learning_rate": 9.53637600129114e-06, "loss": 0.0003, "step": 21781 }, { "epoch": 4.44, "learning_rate": 9.529575429440923e-06, "loss": 0.0032, "step": 21782 }, { "epoch": 4.44, "learning_rate": 9.522777203711902e-06, "loss": 0.0025, "step": 21783 }, { "epoch": 4.44, "learning_rate": 9.515981324217737e-06, "loss": 0.0012, "step": 21784 }, { "epoch": 4.44, "learning_rate": 9.509187791071821e-06, "loss": 0.0002, "step": 21785 }, { "epoch": 4.44, "learning_rate": 9.502396604387664e-06, "loss": 0.0048, "step": 21786 }, { "epoch": 4.44, "learning_rate": 9.495607764278706e-06, "loss": 0.0027, "step": 21787 }, { "epoch": 4.44, "learning_rate": 9.48882127085831e-06, "loss": 0.0007, "step": 21788 }, { "epoch": 4.44, "learning_rate": 9.482037124239833e-06, "loss": 0.0012, "step": 21789 }, { "epoch": 4.44, "learning_rate": 9.475255324536585e-06, "loss": 0.0004, "step": 21790 }, { "epoch": 4.44, "learning_rate": 9.468475871861825e-06, "loss": 0.0003, "step": 21791 }, { "epoch": 4.44, "learning_rate": 9.461698766328796e-06, "loss": 0.0014, "step": 21792 }, { "epoch": 4.44, "learning_rate": 9.454924008050691e-06, "loss": 0.002, "step": 21793 }, { "epoch": 4.44, "learning_rate": 9.448151597140635e-06, "loss": 0.0004, "step": 21794 }, { "epoch": 4.44, "learning_rate": 9.441381533711806e-06, "loss": 0.0023, "step": 21795 }, { "epoch": 4.44, "learning_rate": 9.434613817877162e-06, "loss": 0.0013, "step": 21796 }, { "epoch": 4.44, "learning_rate": 9.427848449749847e-06, "loss": 0.0002, "step": 21797 }, { "epoch": 4.44, "learning_rate": 9.421085429442803e-06, "loss": 0.0004, "step": 21798 }, { "epoch": 4.44, "learning_rate": 9.414324757068974e-06, "loss": 0.0057, "step": 21799 }, { "epoch": 4.44, "learning_rate": 9.40756643274132e-06, "loss": 0.0003, "step": 21800 }, { "epoch": 4.44, "learning_rate": 9.40081045657265e-06, "loss": 0.0044, "step": 21801 }, { "epoch": 4.44, "learning_rate": 9.394056828675905e-06, "loss": 0.0013, "step": 21802 }, { "epoch": 4.44, "learning_rate": 9.387305549163799e-06, "loss": 0.0005, "step": 21803 }, { "epoch": 4.44, "learning_rate": 9.380556618149104e-06, "loss": 0.0008, "step": 21804 }, { "epoch": 4.44, "learning_rate": 9.373810035744567e-06, "loss": 0.0003, "step": 21805 }, { "epoch": 4.44, "learning_rate": 9.367065802062845e-06, "loss": 0.0054, "step": 21806 }, { "epoch": 4.44, "learning_rate": 9.360323917216583e-06, "loss": 0.0001, "step": 21807 }, { "epoch": 4.44, "learning_rate": 9.353584381318391e-06, "loss": 0.0002, "step": 21808 }, { "epoch": 4.44, "learning_rate": 9.346847194480828e-06, "loss": 0.0001, "step": 21809 }, { "epoch": 4.44, "learning_rate": 9.34011235681642e-06, "loss": 0.0005, "step": 21810 }, { "epoch": 4.44, "learning_rate": 9.333379868437663e-06, "loss": 0.0059, "step": 21811 }, { "epoch": 4.44, "learning_rate": 9.32664972945698e-06, "loss": 0.0054, "step": 21812 }, { "epoch": 4.44, "learning_rate": 9.319921939986801e-06, "loss": 0.0005, "step": 21813 }, { "epoch": 4.44, "learning_rate": 9.313196500139436e-06, "loss": 0.0014, "step": 21814 }, { "epoch": 4.44, "learning_rate": 9.30647341002731e-06, "loss": 0.0052, "step": 21815 }, { "epoch": 4.44, "learning_rate": 9.2997526697626e-06, "loss": 0.0001, "step": 21816 }, { "epoch": 4.44, "learning_rate": 9.29303427945765e-06, "loss": 0.0004, "step": 21817 }, { "epoch": 4.44, "learning_rate": 9.286318239224622e-06, "loss": 0.0054, "step": 21818 }, { "epoch": 4.44, "learning_rate": 9.27960454917569e-06, "loss": 0.0018, "step": 21819 }, { "epoch": 4.44, "learning_rate": 9.272893209422999e-06, "loss": 0.0013, "step": 21820 }, { "epoch": 4.44, "learning_rate": 9.26618422007861e-06, "loss": 0.0007, "step": 21821 }, { "epoch": 4.44, "learning_rate": 9.259477581254615e-06, "loss": 0.0008, "step": 21822 }, { "epoch": 4.44, "learning_rate": 9.25277329306301e-06, "loss": 0.0009, "step": 21823 }, { "epoch": 4.44, "learning_rate": 9.24607135561577e-06, "loss": 0.0001, "step": 21824 }, { "epoch": 4.44, "learning_rate": 9.239371769024839e-06, "loss": 0.0002, "step": 21825 }, { "epoch": 4.44, "learning_rate": 9.232674533402113e-06, "loss": 0.0005, "step": 21826 }, { "epoch": 4.44, "learning_rate": 9.2259796488594e-06, "loss": 0.0001, "step": 21827 }, { "epoch": 4.44, "learning_rate": 9.219287115508595e-06, "loss": 0.0038, "step": 21828 }, { "epoch": 4.44, "learning_rate": 9.212596933461392e-06, "loss": 0.0006, "step": 21829 }, { "epoch": 4.45, "learning_rate": 9.2059091028296e-06, "loss": 0.0001, "step": 21830 }, { "epoch": 4.45, "learning_rate": 9.199223623724933e-06, "loss": 0.0034, "step": 21831 }, { "epoch": 4.45, "learning_rate": 9.192540496258948e-06, "loss": 0.0015, "step": 21832 }, { "epoch": 4.45, "learning_rate": 9.185859720543377e-06, "loss": 0.0021, "step": 21833 }, { "epoch": 4.45, "learning_rate": 9.179181296689708e-06, "loss": 0.0, "step": 21834 }, { "epoch": 4.45, "learning_rate": 9.17250522480959e-06, "loss": 0.0083, "step": 21835 }, { "epoch": 4.45, "learning_rate": 9.16583150501443e-06, "loss": 0.0003, "step": 21836 }, { "epoch": 4.45, "learning_rate": 9.159160137415728e-06, "loss": 0.001, "step": 21837 }, { "epoch": 4.45, "learning_rate": 9.152491122124905e-06, "loss": 0.0018, "step": 21838 }, { "epoch": 4.45, "learning_rate": 9.14582445925336e-06, "loss": 0.0028, "step": 21839 }, { "epoch": 4.45, "learning_rate": 9.139160148912417e-06, "loss": 0.0001, "step": 21840 }, { "epoch": 4.45, "learning_rate": 9.132498191213389e-06, "loss": 0.0037, "step": 21841 }, { "epoch": 4.45, "learning_rate": 9.125838586267553e-06, "loss": 0.0063, "step": 21842 }, { "epoch": 4.45, "learning_rate": 9.119181334186138e-06, "loss": 0.0001, "step": 21843 }, { "epoch": 4.45, "learning_rate": 9.112526435080319e-06, "loss": 0.0036, "step": 21844 }, { "epoch": 4.45, "learning_rate": 9.10587388906126e-06, "loss": 0.0056, "step": 21845 }, { "epoch": 4.45, "learning_rate": 9.099223696240072e-06, "loss": 0.0191, "step": 21846 }, { "epoch": 4.45, "learning_rate": 9.09257585672778e-06, "loss": 0.0022, "step": 21847 }, { "epoch": 4.45, "learning_rate": 9.085930370635496e-06, "loss": 0.0016, "step": 21848 }, { "epoch": 4.45, "learning_rate": 9.07928723807415e-06, "loss": 0.0015, "step": 21849 }, { "epoch": 4.45, "learning_rate": 9.07264645915472e-06, "loss": 0.0004, "step": 21850 }, { "epoch": 4.45, "learning_rate": 9.066008033988098e-06, "loss": 0.0005, "step": 21851 }, { "epoch": 4.45, "learning_rate": 9.059371962685197e-06, "loss": 0.0023, "step": 21852 }, { "epoch": 4.45, "learning_rate": 9.052738245356811e-06, "loss": 0.0011, "step": 21853 }, { "epoch": 4.45, "learning_rate": 9.046106882113751e-06, "loss": 0.019, "step": 21854 }, { "epoch": 4.45, "learning_rate": 9.03947787306678e-06, "loss": 0.0091, "step": 21855 }, { "epoch": 4.45, "learning_rate": 9.032851218326609e-06, "loss": 0.0021, "step": 21856 }, { "epoch": 4.45, "learning_rate": 9.026226918003915e-06, "loss": 0.0046, "step": 21857 }, { "epoch": 4.45, "learning_rate": 9.019604972209343e-06, "loss": 0.0008, "step": 21858 }, { "epoch": 4.45, "learning_rate": 9.012985381053506e-06, "loss": 0.0025, "step": 21859 }, { "epoch": 4.45, "learning_rate": 9.006368144646913e-06, "loss": 0.0006, "step": 21860 }, { "epoch": 4.45, "learning_rate": 8.999753263100129e-06, "loss": 0.0003, "step": 21861 }, { "epoch": 4.45, "learning_rate": 8.993140736523613e-06, "loss": 0.0002, "step": 21862 }, { "epoch": 4.45, "learning_rate": 8.986530565027827e-06, "loss": 0.0025, "step": 21863 }, { "epoch": 4.45, "learning_rate": 8.979922748723183e-06, "loss": 0.0021, "step": 21864 }, { "epoch": 4.45, "learning_rate": 8.973317287719978e-06, "loss": 0.005, "step": 21865 }, { "epoch": 4.45, "learning_rate": 8.966714182128621e-06, "loss": 0.0005, "step": 21866 }, { "epoch": 4.45, "learning_rate": 8.960113432059324e-06, "loss": 0.0007, "step": 21867 }, { "epoch": 4.45, "learning_rate": 8.953515037622399e-06, "loss": 0.0029, "step": 21868 }, { "epoch": 4.45, "learning_rate": 8.946918998927993e-06, "loss": 0.0015, "step": 21869 }, { "epoch": 4.45, "learning_rate": 8.9403253160863e-06, "loss": 0.0024, "step": 21870 }, { "epoch": 4.45, "learning_rate": 8.933733989207449e-06, "loss": 0.0001, "step": 21871 }, { "epoch": 4.45, "learning_rate": 8.927145018401516e-06, "loss": 0.0008, "step": 21872 }, { "epoch": 4.45, "learning_rate": 8.92055840377855e-06, "loss": 0.0018, "step": 21873 }, { "epoch": 4.45, "learning_rate": 8.913974145448576e-06, "loss": 0.0032, "step": 21874 }, { "epoch": 4.45, "learning_rate": 8.907392243521544e-06, "loss": 0.0006, "step": 21875 }, { "epoch": 4.45, "learning_rate": 8.900812698107395e-06, "loss": 0.0018, "step": 21876 }, { "epoch": 4.45, "learning_rate": 8.894235509316045e-06, "loss": 0.0047, "step": 21877 }, { "epoch": 4.45, "learning_rate": 8.887660677257252e-06, "loss": 0.0031, "step": 21878 }, { "epoch": 4.45, "learning_rate": 8.881088202040964e-06, "loss": 0.0006, "step": 21879 }, { "epoch": 4.46, "learning_rate": 8.874518083776827e-06, "loss": 0.003, "step": 21880 }, { "epoch": 4.46, "learning_rate": 8.867950322574685e-06, "loss": 0.0017, "step": 21881 }, { "epoch": 4.46, "learning_rate": 8.86138491854415e-06, "loss": 0.0003, "step": 21882 }, { "epoch": 4.46, "learning_rate": 8.854821871794888e-06, "loss": 0.0001, "step": 21883 }, { "epoch": 4.46, "learning_rate": 8.848261182436556e-06, "loss": 0.0003, "step": 21884 }, { "epoch": 4.46, "learning_rate": 8.841702850578686e-06, "loss": 0.0018, "step": 21885 }, { "epoch": 4.46, "learning_rate": 8.835146876330857e-06, "loss": 0.0016, "step": 21886 }, { "epoch": 4.46, "learning_rate": 8.82859325980253e-06, "loss": 0.0017, "step": 21887 }, { "epoch": 4.46, "learning_rate": 8.822042001103185e-06, "loss": 0.0094, "step": 21888 }, { "epoch": 4.46, "learning_rate": 8.81549310034222e-06, "loss": 0.0006, "step": 21889 }, { "epoch": 4.46, "learning_rate": 8.808946557629027e-06, "loss": 0.0002, "step": 21890 }, { "epoch": 4.46, "learning_rate": 8.802402373072937e-06, "loss": 0.0023, "step": 21891 }, { "epoch": 4.46, "learning_rate": 8.795860546783263e-06, "loss": 0.0018, "step": 21892 }, { "epoch": 4.46, "learning_rate": 8.789321078869265e-06, "loss": 0.0001, "step": 21893 }, { "epoch": 4.46, "learning_rate": 8.78278396944016e-06, "loss": 0.0, "step": 21894 }, { "epoch": 4.46, "learning_rate": 8.776249218605124e-06, "loss": 0.0001, "step": 21895 }, { "epoch": 4.46, "learning_rate": 8.769716826473305e-06, "loss": 0.0054, "step": 21896 }, { "epoch": 4.46, "learning_rate": 8.763186793153814e-06, "loss": 0.0016, "step": 21897 }, { "epoch": 4.46, "learning_rate": 8.756659118755683e-06, "loss": 0.004, "step": 21898 }, { "epoch": 4.46, "learning_rate": 8.750133803387987e-06, "loss": 0.0093, "step": 21899 }, { "epoch": 4.46, "learning_rate": 8.743610847159676e-06, "loss": 0.0005, "step": 21900 }, { "epoch": 4.46, "learning_rate": 8.737090250179713e-06, "loss": 0.0, "step": 21901 }, { "epoch": 4.46, "learning_rate": 8.730572012556975e-06, "loss": 0.0003, "step": 21902 }, { "epoch": 4.46, "learning_rate": 8.724056134400359e-06, "loss": 0.0022, "step": 21903 }, { "epoch": 4.46, "learning_rate": 8.71754261581868e-06, "loss": 0.0028, "step": 21904 }, { "epoch": 4.46, "learning_rate": 8.71103145692073e-06, "loss": 0.0097, "step": 21905 }, { "epoch": 4.46, "learning_rate": 8.70452265781526e-06, "loss": 0.0039, "step": 21906 }, { "epoch": 4.46, "learning_rate": 8.698016218610965e-06, "loss": 0.0014, "step": 21907 }, { "epoch": 4.46, "learning_rate": 8.69151213941654e-06, "loss": 0.002, "step": 21908 }, { "epoch": 4.46, "learning_rate": 8.685010420340583e-06, "loss": 0.0001, "step": 21909 }, { "epoch": 4.46, "learning_rate": 8.67851106149174e-06, "loss": 0.0006, "step": 21910 }, { "epoch": 4.46, "learning_rate": 8.672014062978471e-06, "loss": 0.0035, "step": 21911 }, { "epoch": 4.46, "learning_rate": 8.665519424909395e-06, "loss": 0.0002, "step": 21912 }, { "epoch": 4.46, "learning_rate": 8.659027147392888e-06, "loss": 0.0003, "step": 21913 }, { "epoch": 4.46, "learning_rate": 8.652537230537449e-06, "loss": 0.0034, "step": 21914 }, { "epoch": 4.46, "learning_rate": 8.646049674451472e-06, "loss": 0.0027, "step": 21915 }, { "epoch": 4.46, "learning_rate": 8.639564479243238e-06, "loss": 0.002, "step": 21916 }, { "epoch": 4.46, "learning_rate": 8.633081645021178e-06, "loss": 0.0022, "step": 21917 }, { "epoch": 4.46, "learning_rate": 8.626601171893438e-06, "loss": 0.0002, "step": 21918 }, { "epoch": 4.46, "learning_rate": 8.620123059968381e-06, "loss": 0.0023, "step": 21919 }, { "epoch": 4.46, "learning_rate": 8.613647309354105e-06, "loss": 0.0033, "step": 21920 }, { "epoch": 4.46, "learning_rate": 8.607173920158805e-06, "loss": 0.0073, "step": 21921 }, { "epoch": 4.46, "learning_rate": 8.600702892490613e-06, "loss": 0.0003, "step": 21922 }, { "epoch": 4.46, "learning_rate": 8.594234226457592e-06, "loss": 0.0085, "step": 21923 }, { "epoch": 4.46, "learning_rate": 8.58776792216777e-06, "loss": 0.0006, "step": 21924 }, { "epoch": 4.46, "learning_rate": 8.581303979729165e-06, "loss": 0.0006, "step": 21925 }, { "epoch": 4.46, "learning_rate": 8.574842399249721e-06, "loss": 0.0039, "step": 21926 }, { "epoch": 4.46, "learning_rate": 8.568383180837368e-06, "loss": 0.0002, "step": 21927 }, { "epoch": 4.46, "learning_rate": 8.561926324600022e-06, "loss": 0.0002, "step": 21928 }, { "epoch": 4.47, "learning_rate": 8.555471830645444e-06, "loss": 0.0023, "step": 21929 }, { "epoch": 4.47, "learning_rate": 8.549019699081517e-06, "loss": 0.0019, "step": 21930 }, { "epoch": 4.47, "learning_rate": 8.542569930015918e-06, "loss": 0.0012, "step": 21931 }, { "epoch": 4.47, "learning_rate": 8.536122523556482e-06, "loss": 0.0049, "step": 21932 }, { "epoch": 4.47, "learning_rate": 8.529677479810803e-06, "loss": 0.0021, "step": 21933 }, { "epoch": 4.47, "learning_rate": 8.523234798886564e-06, "loss": 0.0013, "step": 21934 }, { "epoch": 4.47, "learning_rate": 8.516794480891343e-06, "loss": 0.0045, "step": 21935 }, { "epoch": 4.47, "learning_rate": 8.510356525932705e-06, "loss": 0.003, "step": 21936 }, { "epoch": 4.47, "learning_rate": 8.503920934118247e-06, "loss": 0.0024, "step": 21937 }, { "epoch": 4.47, "learning_rate": 8.497487705555367e-06, "loss": 0.0009, "step": 21938 }, { "epoch": 4.47, "learning_rate": 8.491056840351562e-06, "loss": 0.006, "step": 21939 }, { "epoch": 4.47, "learning_rate": 8.484628338614213e-06, "loss": 0.0003, "step": 21940 }, { "epoch": 4.47, "learning_rate": 8.478202200450701e-06, "loss": 0.0001, "step": 21941 }, { "epoch": 4.47, "learning_rate": 8.471778425968357e-06, "loss": 0.0001, "step": 21942 }, { "epoch": 4.47, "learning_rate": 8.465357015274477e-06, "loss": 0.0002, "step": 21943 }, { "epoch": 4.47, "learning_rate": 8.458937968476277e-06, "loss": 0.0022, "step": 21944 }, { "epoch": 4.47, "learning_rate": 8.452521285681003e-06, "loss": 0.0002, "step": 21945 }, { "epoch": 4.47, "learning_rate": 8.44610696699582e-06, "loss": 0.0017, "step": 21946 }, { "epoch": 4.47, "learning_rate": 8.439695012527842e-06, "loss": 0.0008, "step": 21947 }, { "epoch": 4.47, "learning_rate": 8.4332854223842e-06, "loss": 0.0032, "step": 21948 }, { "epoch": 4.47, "learning_rate": 8.426878196671877e-06, "loss": 0.0002, "step": 21949 }, { "epoch": 4.47, "learning_rate": 8.420473335497968e-06, "loss": 0.0018, "step": 21950 }, { "epoch": 4.47, "learning_rate": 8.414070838969372e-06, "loss": 0.0012, "step": 21951 }, { "epoch": 4.47, "learning_rate": 8.407670707193055e-06, "loss": 0.0029, "step": 21952 }, { "epoch": 4.47, "learning_rate": 8.401272940275927e-06, "loss": 0.0028, "step": 21953 }, { "epoch": 4.47, "learning_rate": 8.394877538324824e-06, "loss": 0.0005, "step": 21954 }, { "epoch": 4.47, "learning_rate": 8.388484501446558e-06, "loss": 0.0002, "step": 21955 }, { "epoch": 4.47, "learning_rate": 8.38209382974791e-06, "loss": 0.0002, "step": 21956 }, { "epoch": 4.47, "learning_rate": 8.375705523335629e-06, "loss": 0.0031, "step": 21957 }, { "epoch": 4.47, "learning_rate": 8.369319582316381e-06, "loss": 0.0001, "step": 21958 }, { "epoch": 4.47, "learning_rate": 8.362936006796861e-06, "loss": 0.002, "step": 21959 }, { "epoch": 4.47, "learning_rate": 8.356554796883668e-06, "loss": 0.004, "step": 21960 }, { "epoch": 4.47, "learning_rate": 8.350175952683385e-06, "loss": 0.0036, "step": 21961 }, { "epoch": 4.47, "learning_rate": 8.343799474302526e-06, "loss": 0.0042, "step": 21962 }, { "epoch": 4.47, "learning_rate": 8.337425361847638e-06, "loss": 0.0002, "step": 21963 }, { "epoch": 4.47, "learning_rate": 8.33105361542512e-06, "loss": 0.0022, "step": 21964 }, { "epoch": 4.47, "learning_rate": 8.324684235141455e-06, "loss": 0.0001, "step": 21965 }, { "epoch": 4.47, "learning_rate": 8.318317221102988e-06, "loss": 0.0015, "step": 21966 }, { "epoch": 4.47, "learning_rate": 8.311952573416036e-06, "loss": 0.0012, "step": 21967 }, { "epoch": 4.47, "learning_rate": 8.305590292186981e-06, "loss": 0.0011, "step": 21968 }, { "epoch": 4.47, "learning_rate": 8.299230377521987e-06, "loss": 0.0038, "step": 21969 }, { "epoch": 4.47, "learning_rate": 8.29287282952737e-06, "loss": 0.0028, "step": 21970 }, { "epoch": 4.47, "learning_rate": 8.286517648309244e-06, "loss": 0.0001, "step": 21971 }, { "epoch": 4.47, "learning_rate": 8.28016483397379e-06, "loss": 0.0003, "step": 21972 }, { "epoch": 4.47, "learning_rate": 8.273814386627076e-06, "loss": 0.0022, "step": 21973 }, { "epoch": 4.47, "learning_rate": 8.267466306375197e-06, "loss": 0.0044, "step": 21974 }, { "epoch": 4.47, "learning_rate": 8.261120593324171e-06, "loss": 0.0053, "step": 21975 }, { "epoch": 4.47, "learning_rate": 8.254777247579997e-06, "loss": 0.0071, "step": 21976 }, { "epoch": 4.47, "learning_rate": 8.248436269248588e-06, "loss": 0.0037, "step": 21977 }, { "epoch": 4.48, "learning_rate": 8.242097658435876e-06, "loss": 0.0006, "step": 21978 }, { "epoch": 4.48, "learning_rate": 8.235761415247743e-06, "loss": 0.0001, "step": 21979 }, { "epoch": 4.48, "learning_rate": 8.22942753978994e-06, "loss": 0.0006, "step": 21980 }, { "epoch": 4.48, "learning_rate": 8.223096032168363e-06, "loss": 0.0004, "step": 21981 }, { "epoch": 4.48, "learning_rate": 8.216766892488646e-06, "loss": 0.0001, "step": 21982 }, { "epoch": 4.48, "learning_rate": 8.21044012085662e-06, "loss": 0.0015, "step": 21983 }, { "epoch": 4.48, "learning_rate": 8.204115717377852e-06, "loss": 0.0002, "step": 21984 }, { "epoch": 4.48, "learning_rate": 8.197793682158022e-06, "loss": 0.0002, "step": 21985 }, { "epoch": 4.48, "learning_rate": 8.191474015302695e-06, "loss": 0.0013, "step": 21986 }, { "epoch": 4.48, "learning_rate": 8.18515671691744e-06, "loss": 0.0004, "step": 21987 }, { "epoch": 4.48, "learning_rate": 8.178841787107771e-06, "loss": 0.0023, "step": 21988 }, { "epoch": 4.48, "learning_rate": 8.172529225979152e-06, "loss": 0.0002, "step": 21989 }, { "epoch": 4.48, "learning_rate": 8.166219033637e-06, "loss": 0.0025, "step": 21990 }, { "epoch": 4.48, "learning_rate": 8.159911210186731e-06, "loss": 0.0041, "step": 21991 }, { "epoch": 4.48, "learning_rate": 8.153605755733678e-06, "loss": 0.0012, "step": 21992 }, { "epoch": 4.48, "learning_rate": 8.147302670383172e-06, "loss": 0.0006, "step": 21993 }, { "epoch": 4.48, "learning_rate": 8.141001954240494e-06, "loss": 0.0038, "step": 21994 }, { "epoch": 4.48, "learning_rate": 8.134703607410815e-06, "loss": 0.0032, "step": 21995 }, { "epoch": 4.48, "learning_rate": 8.128407629999395e-06, "loss": 0.0003, "step": 21996 }, { "epoch": 4.48, "learning_rate": 8.122114022111403e-06, "loss": 0.001, "step": 21997 }, { "epoch": 4.48, "learning_rate": 8.115822783851872e-06, "loss": 0.002, "step": 21998 }, { "epoch": 4.48, "learning_rate": 8.109533915325966e-06, "loss": 0.0015, "step": 21999 }, { "epoch": 4.48, "learning_rate": 8.103247416638636e-06, "loss": 0.0001, "step": 22000 }, { "epoch": 4.48, "learning_rate": 8.096963287894965e-06, "loss": 0.0046, "step": 22001 }, { "epoch": 4.48, "learning_rate": 8.09068152919985e-06, "loss": 0.0007, "step": 22002 }, { "epoch": 4.48, "learning_rate": 8.084402140658226e-06, "loss": 0.0064, "step": 22003 }, { "epoch": 4.48, "learning_rate": 8.078125122374973e-06, "loss": 0.002, "step": 22004 }, { "epoch": 4.48, "learning_rate": 8.071850474454927e-06, "loss": 0.0004, "step": 22005 }, { "epoch": 4.48, "learning_rate": 8.065578197002887e-06, "loss": 0.0003, "step": 22006 }, { "epoch": 4.48, "learning_rate": 8.059308290123617e-06, "loss": 0.0005, "step": 22007 }, { "epoch": 4.48, "learning_rate": 8.053040753921819e-06, "loss": 0.001, "step": 22008 }, { "epoch": 4.48, "learning_rate": 8.046775588502192e-06, "loss": 0.001, "step": 22009 }, { "epoch": 4.48, "learning_rate": 8.040512793969367e-06, "loss": 0.0001, "step": 22010 }, { "epoch": 4.48, "learning_rate": 8.034252370427946e-06, "loss": 0.0099, "step": 22011 }, { "epoch": 4.48, "learning_rate": 8.027994317982494e-06, "loss": 0.0004, "step": 22012 }, { "epoch": 4.48, "learning_rate": 8.021738636737513e-06, "loss": 0.0021, "step": 22013 }, { "epoch": 4.48, "learning_rate": 8.015485326797532e-06, "loss": 0.0001, "step": 22014 }, { "epoch": 4.48, "learning_rate": 8.009234388266905e-06, "loss": 0.0014, "step": 22015 }, { "epoch": 4.48, "learning_rate": 8.002985821250147e-06, "loss": 0.0003, "step": 22016 }, { "epoch": 4.48, "learning_rate": 7.99673962585154e-06, "loss": 0.0059, "step": 22017 }, { "epoch": 4.48, "learning_rate": 7.990495802175435e-06, "loss": 0.0001, "step": 22018 }, { "epoch": 4.48, "learning_rate": 7.984254350326096e-06, "loss": 0.0001, "step": 22019 }, { "epoch": 4.48, "learning_rate": 7.978015270407779e-06, "loss": 0.0004, "step": 22020 }, { "epoch": 4.48, "learning_rate": 7.971778562524728e-06, "loss": 0.0, "step": 22021 }, { "epoch": 4.48, "learning_rate": 7.965544226781061e-06, "loss": 0.0002, "step": 22022 }, { "epoch": 4.48, "learning_rate": 7.959312263280898e-06, "loss": 0.0064, "step": 22023 }, { "epoch": 4.48, "learning_rate": 7.953082672128353e-06, "loss": 0.0029, "step": 22024 }, { "epoch": 4.48, "learning_rate": 7.946855453427476e-06, "loss": 0.0004, "step": 22025 }, { "epoch": 4.48, "learning_rate": 7.940630607282217e-06, "loss": 0.0016, "step": 22026 }, { "epoch": 4.49, "learning_rate": 7.934408133796611e-06, "loss": 0.0024, "step": 22027 }, { "epoch": 4.49, "learning_rate": 7.92818803307454e-06, "loss": 0.003, "step": 22028 }, { "epoch": 4.49, "learning_rate": 7.921970305219921e-06, "loss": 0.0004, "step": 22029 }, { "epoch": 4.49, "learning_rate": 7.915754950336607e-06, "loss": 0.0026, "step": 22030 }, { "epoch": 4.49, "learning_rate": 7.909541968528343e-06, "loss": 0.0006, "step": 22031 }, { "epoch": 4.49, "learning_rate": 7.903331359898984e-06, "loss": 0.0003, "step": 22032 }, { "epoch": 4.49, "learning_rate": 7.897123124552196e-06, "loss": 0.0001, "step": 22033 }, { "epoch": 4.49, "learning_rate": 7.890917262591712e-06, "loss": 0.0016, "step": 22034 }, { "epoch": 4.49, "learning_rate": 7.884713774121132e-06, "loss": 0.003, "step": 22035 }, { "epoch": 4.49, "learning_rate": 7.878512659244107e-06, "loss": 0.0014, "step": 22036 }, { "epoch": 4.49, "learning_rate": 7.872313918064188e-06, "loss": 0.0006, "step": 22037 }, { "epoch": 4.49, "learning_rate": 7.866117550684926e-06, "loss": 0.0004, "step": 22038 }, { "epoch": 4.49, "learning_rate": 7.859923557209784e-06, "loss": 0.0015, "step": 22039 }, { "epoch": 4.49, "learning_rate": 7.85373193774222e-06, "loss": 0.0018, "step": 22040 }, { "epoch": 4.49, "learning_rate": 7.847542692385662e-06, "loss": 0.0023, "step": 22041 }, { "epoch": 4.49, "learning_rate": 7.841355821243479e-06, "loss": 0.0042, "step": 22042 }, { "epoch": 4.49, "learning_rate": 7.835171324418987e-06, "loss": 0.0011, "step": 22043 }, { "epoch": 4.49, "learning_rate": 7.82898920201549e-06, "loss": 0.0003, "step": 22044 }, { "epoch": 4.49, "learning_rate": 7.82280945413627e-06, "loss": 0.0058, "step": 22045 }, { "epoch": 4.49, "learning_rate": 7.81663208088446e-06, "loss": 0.0022, "step": 22046 }, { "epoch": 4.49, "learning_rate": 7.81045708236333e-06, "loss": 0.0008, "step": 22047 }, { "epoch": 4.49, "learning_rate": 7.804284458675946e-06, "loss": 0.0005, "step": 22048 }, { "epoch": 4.49, "learning_rate": 7.79811420992541e-06, "loss": 0.0086, "step": 22049 }, { "epoch": 4.49, "learning_rate": 7.791946336214822e-06, "loss": 0.0044, "step": 22050 }, { "epoch": 4.49, "learning_rate": 7.785780837647132e-06, "loss": 0.0014, "step": 22051 }, { "epoch": 4.49, "learning_rate": 7.779617714325392e-06, "loss": 0.0002, "step": 22052 }, { "epoch": 4.49, "learning_rate": 7.773456966352487e-06, "loss": 0.0031, "step": 22053 }, { "epoch": 4.49, "learning_rate": 7.7672985938313e-06, "loss": 0.0002, "step": 22054 }, { "epoch": 4.49, "learning_rate": 7.761142596864716e-06, "loss": 0.0001, "step": 22055 }, { "epoch": 4.49, "learning_rate": 7.754988975555553e-06, "loss": 0.0002, "step": 22056 }, { "epoch": 4.49, "learning_rate": 7.74883773000658e-06, "loss": 0.0036, "step": 22057 }, { "epoch": 4.49, "learning_rate": 7.742688860320528e-06, "loss": 0.0001, "step": 22058 }, { "epoch": 4.49, "learning_rate": 7.736542366600101e-06, "loss": 0.0005, "step": 22059 }, { "epoch": 4.49, "learning_rate": 7.730398248947966e-06, "loss": 0.0015, "step": 22060 }, { "epoch": 4.49, "learning_rate": 7.724256507466742e-06, "loss": 0.0003, "step": 22061 }, { "epoch": 4.49, "learning_rate": 7.718117142258978e-06, "loss": 0.0044, "step": 22062 }, { "epoch": 4.49, "learning_rate": 7.71198015342726e-06, "loss": 0.0014, "step": 22063 }, { "epoch": 4.49, "learning_rate": 7.705845541074025e-06, "loss": 0.001, "step": 22064 }, { "epoch": 4.49, "learning_rate": 7.699713305301802e-06, "loss": 0.0066, "step": 22065 }, { "epoch": 4.49, "learning_rate": 7.693583446212947e-06, "loss": 0.0006, "step": 22066 }, { "epoch": 4.49, "learning_rate": 7.687455963909912e-06, "loss": 0.0001, "step": 22067 }, { "epoch": 4.49, "learning_rate": 7.68133085849496e-06, "loss": 0.0024, "step": 22068 }, { "epoch": 4.49, "learning_rate": 7.675208130070448e-06, "loss": 0.0002, "step": 22069 }, { "epoch": 4.49, "learning_rate": 7.669087778738609e-06, "loss": 0.0006, "step": 22070 }, { "epoch": 4.49, "learning_rate": 7.662969804601677e-06, "loss": 0.0008, "step": 22071 }, { "epoch": 4.49, "learning_rate": 7.65685420776182e-06, "loss": 0.0003, "step": 22072 }, { "epoch": 4.49, "learning_rate": 7.650740988321191e-06, "loss": 0.0002, "step": 22073 }, { "epoch": 4.49, "learning_rate": 7.644630146381891e-06, "loss": 0.0016, "step": 22074 }, { "epoch": 4.49, "learning_rate": 7.63852168204599e-06, "loss": 0.0012, "step": 22075 }, { "epoch": 4.5, "learning_rate": 7.63241559541552e-06, "loss": 0.0046, "step": 22076 }, { "epoch": 4.5, "learning_rate": 7.626311886592401e-06, "loss": 0.0035, "step": 22077 }, { "epoch": 4.5, "learning_rate": 7.620210555678669e-06, "loss": 0.0001, "step": 22078 }, { "epoch": 4.5, "learning_rate": 7.6141116027761406e-06, "loss": 0.0004, "step": 22079 }, { "epoch": 4.5, "learning_rate": 7.608015027986736e-06, "loss": 0.0003, "step": 22080 }, { "epoch": 4.5, "learning_rate": 7.601920831412289e-06, "loss": 0.0006, "step": 22081 }, { "epoch": 4.5, "learning_rate": 7.5958290131545194e-06, "loss": 0.0008, "step": 22082 }, { "epoch": 4.5, "learning_rate": 7.589739573315262e-06, "loss": 0.0034, "step": 22083 }, { "epoch": 4.5, "learning_rate": 7.5836525119961185e-06, "loss": 0.0022, "step": 22084 }, { "epoch": 4.5, "learning_rate": 7.577567829298859e-06, "loss": 0.0006, "step": 22085 }, { "epoch": 4.5, "learning_rate": 7.571485525325016e-06, "loss": 0.0006, "step": 22086 }, { "epoch": 4.5, "learning_rate": 7.565405600176244e-06, "loss": 0.0004, "step": 22087 }, { "epoch": 4.5, "learning_rate": 7.559328053954044e-06, "loss": 0.0001, "step": 22088 }, { "epoch": 4.5, "learning_rate": 7.553252886759953e-06, "loss": 0.0014, "step": 22089 }, { "epoch": 4.5, "learning_rate": 7.547180098695421e-06, "loss": 0.0008, "step": 22090 }, { "epoch": 4.5, "learning_rate": 7.541109689861885e-06, "loss": 0.0002, "step": 22091 }, { "epoch": 4.5, "learning_rate": 7.535041660360713e-06, "loss": 0.0019, "step": 22092 }, { "epoch": 4.5, "learning_rate": 7.528976010293275e-06, "loss": 0.0016, "step": 22093 }, { "epoch": 4.5, "learning_rate": 7.522912739760872e-06, "loss": 0.0009, "step": 22094 }, { "epoch": 4.5, "learning_rate": 7.516851848864775e-06, "loss": 0.0023, "step": 22095 }, { "epoch": 4.5, "learning_rate": 7.510793337706233e-06, "loss": 0.0063, "step": 22096 }, { "epoch": 4.5, "learning_rate": 7.504737206386352e-06, "loss": 0.0003, "step": 22097 }, { "epoch": 4.5, "learning_rate": 7.498683455006399e-06, "loss": 0.0024, "step": 22098 }, { "epoch": 4.5, "learning_rate": 7.492632083667394e-06, "loss": 0.0006, "step": 22099 }, { "epoch": 4.5, "learning_rate": 7.4865830924704215e-06, "loss": 0.0003, "step": 22100 }, { "epoch": 4.5, "learning_rate": 7.480536481516536e-06, "loss": 0.0003, "step": 22101 }, { "epoch": 4.5, "learning_rate": 7.474492250906705e-06, "loss": 0.0038, "step": 22102 }, { "epoch": 4.5, "learning_rate": 7.4684504007419155e-06, "loss": 0.0001, "step": 22103 }, { "epoch": 4.5, "learning_rate": 7.4624109311230365e-06, "loss": 0.0013, "step": 22104 }, { "epoch": 4.5, "learning_rate": 7.456373842150953e-06, "loss": 0.0006, "step": 22105 }, { "epoch": 4.5, "learning_rate": 7.450339133926486e-06, "loss": 0.0009, "step": 22106 }, { "epoch": 4.5, "learning_rate": 7.444306806550454e-06, "loss": 0.0019, "step": 22107 }, { "epoch": 4.5, "learning_rate": 7.438276860123593e-06, "loss": 0.0048, "step": 22108 }, { "epoch": 4.5, "learning_rate": 7.432249294746589e-06, "loss": 0.0035, "step": 22109 }, { "epoch": 4.5, "learning_rate": 7.426224110520163e-06, "loss": 0.0001, "step": 22110 }, { "epoch": 4.5, "learning_rate": 7.420201307544915e-06, "loss": 0.0016, "step": 22111 }, { "epoch": 4.5, "learning_rate": 7.414180885921434e-06, "loss": 0.0007, "step": 22112 }, { "epoch": 4.5, "learning_rate": 7.408162845750288e-06, "loss": 0.001, "step": 22113 }, { "epoch": 4.5, "learning_rate": 7.402147187132013e-06, "loss": 0.0009, "step": 22114 }, { "epoch": 4.5, "learning_rate": 7.396133910166996e-06, "loss": 0.0011, "step": 22115 }, { "epoch": 4.5, "learning_rate": 7.390123014955773e-06, "loss": 0.0032, "step": 22116 }, { "epoch": 4.5, "learning_rate": 7.384114501598648e-06, "loss": 0.0, "step": 22117 }, { "epoch": 4.5, "learning_rate": 7.378108370196073e-06, "loss": 0.005, "step": 22118 }, { "epoch": 4.5, "learning_rate": 7.372104620848268e-06, "loss": 0.0009, "step": 22119 }, { "epoch": 4.5, "learning_rate": 7.366103253655553e-06, "loss": 0.0053, "step": 22120 }, { "epoch": 4.5, "learning_rate": 7.3601042687181474e-06, "loss": 0.0001, "step": 22121 }, { "epoch": 4.5, "learning_rate": 7.3541076661362555e-06, "loss": 0.0018, "step": 22122 }, { "epoch": 4.5, "learning_rate": 7.348113446010029e-06, "loss": 0.0004, "step": 22123 }, { "epoch": 4.5, "learning_rate": 7.342121608439588e-06, "loss": 0.0014, "step": 22124 }, { "epoch": 4.51, "learning_rate": 7.336132153525004e-06, "loss": 0.0007, "step": 22125 }, { "epoch": 4.51, "learning_rate": 7.330145081366295e-06, "loss": 0.0032, "step": 22126 }, { "epoch": 4.51, "learning_rate": 7.324160392063499e-06, "loss": 0.0016, "step": 22127 }, { "epoch": 4.51, "learning_rate": 7.318178085716519e-06, "loss": 0.0003, "step": 22128 }, { "epoch": 4.51, "learning_rate": 7.312198162425326e-06, "loss": 0.0017, "step": 22129 }, { "epoch": 4.51, "learning_rate": 7.306220622289721e-06, "loss": 0.0018, "step": 22130 }, { "epoch": 4.51, "learning_rate": 7.300245465409627e-06, "loss": 0.0015, "step": 22131 }, { "epoch": 4.51, "learning_rate": 7.294272691884778e-06, "loss": 0.0028, "step": 22132 }, { "epoch": 4.51, "learning_rate": 7.28830230181493e-06, "loss": 0.0005, "step": 22133 }, { "epoch": 4.51, "learning_rate": 7.282334295299852e-06, "loss": 0.0008, "step": 22134 }, { "epoch": 4.51, "learning_rate": 7.276368672439165e-06, "loss": 0.0037, "step": 22135 }, { "epoch": 4.51, "learning_rate": 7.270405433332571e-06, "loss": 0.0027, "step": 22136 }, { "epoch": 4.51, "learning_rate": 7.264444578079609e-06, "loss": 0.0027, "step": 22137 }, { "epoch": 4.51, "learning_rate": 7.258486106779848e-06, "loss": 0.0003, "step": 22138 }, { "epoch": 4.51, "learning_rate": 7.252530019532809e-06, "loss": 0.0043, "step": 22139 }, { "epoch": 4.51, "learning_rate": 7.24657631643798e-06, "loss": 0.0002, "step": 22140 }, { "epoch": 4.51, "learning_rate": 7.240624997594796e-06, "loss": 0.0019, "step": 22141 }, { "epoch": 4.51, "learning_rate": 7.234676063102646e-06, "loss": 0.0037, "step": 22142 }, { "epoch": 4.51, "learning_rate": 7.228729513060899e-06, "loss": 0.0009, "step": 22143 }, { "epoch": 4.51, "learning_rate": 7.2227853475688606e-06, "loss": 0.0019, "step": 22144 }, { "epoch": 4.51, "learning_rate": 7.21684356672585e-06, "loss": 0.0003, "step": 22145 }, { "epoch": 4.51, "learning_rate": 7.210904170631021e-06, "loss": 0.0003, "step": 22146 }, { "epoch": 4.51, "learning_rate": 7.204967159383679e-06, "loss": 0.0004, "step": 22147 }, { "epoch": 4.51, "learning_rate": 7.199032533082877e-06, "loss": 0.0001, "step": 22148 }, { "epoch": 4.51, "learning_rate": 7.193100291827836e-06, "loss": 0.0001, "step": 22149 }, { "epoch": 4.51, "learning_rate": 7.18717043571756e-06, "loss": 0.0053, "step": 22150 }, { "epoch": 4.51, "learning_rate": 7.181242964851119e-06, "loss": 0.0009, "step": 22151 }, { "epoch": 4.51, "learning_rate": 7.175317879327519e-06, "loss": 0.0016, "step": 22152 }, { "epoch": 4.51, "learning_rate": 7.169395179245696e-06, "loss": 0.0009, "step": 22153 }, { "epoch": 4.51, "learning_rate": 7.163474864704605e-06, "loss": 0.0015, "step": 22154 }, { "epoch": 4.51, "learning_rate": 7.157556935803099e-06, "loss": 0.0032, "step": 22155 }, { "epoch": 4.51, "learning_rate": 7.151641392640018e-06, "loss": 0.0019, "step": 22156 }, { "epoch": 4.51, "learning_rate": 7.14572823531418e-06, "loss": 0.0009, "step": 22157 }, { "epoch": 4.51, "learning_rate": 7.139817463924324e-06, "loss": 0.0003, "step": 22158 }, { "epoch": 4.51, "learning_rate": 7.133909078569189e-06, "loss": 0.0007, "step": 22159 }, { "epoch": 4.51, "learning_rate": 7.1280030793474775e-06, "loss": 0.0, "step": 22160 }, { "epoch": 4.51, "learning_rate": 7.122099466357762e-06, "loss": 0.0054, "step": 22161 }, { "epoch": 4.51, "learning_rate": 7.116198239698711e-06, "loss": 0.0004, "step": 22162 }, { "epoch": 4.51, "learning_rate": 7.110299399468866e-06, "loss": 0.0004, "step": 22163 }, { "epoch": 4.51, "learning_rate": 7.104402945766729e-06, "loss": 0.0008, "step": 22164 }, { "epoch": 4.51, "learning_rate": 7.098508878690823e-06, "loss": 0.0005, "step": 22165 }, { "epoch": 4.51, "learning_rate": 7.092617198339534e-06, "loss": 0.0059, "step": 22166 }, { "epoch": 4.51, "learning_rate": 7.086727904811318e-06, "loss": 0.0003, "step": 22167 }, { "epoch": 4.51, "learning_rate": 7.080840998204479e-06, "loss": 0.0003, "step": 22168 }, { "epoch": 4.51, "learning_rate": 7.074956478617422e-06, "loss": 0.0001, "step": 22169 }, { "epoch": 4.51, "learning_rate": 7.069074346148368e-06, "loss": 0.0035, "step": 22170 }, { "epoch": 4.51, "learning_rate": 7.0631946008955555e-06, "loss": 0.0002, "step": 22171 }, { "epoch": 4.51, "learning_rate": 7.0573172429572224e-06, "loss": 0.0007, "step": 22172 }, { "epoch": 4.51, "learning_rate": 7.05144227243149e-06, "loss": 0.0015, "step": 22173 }, { "epoch": 4.52, "learning_rate": 7.0455696894165306e-06, "loss": 0.0041, "step": 22174 }, { "epoch": 4.52, "learning_rate": 7.039699494010398e-06, "loss": 0.0003, "step": 22175 }, { "epoch": 4.52, "learning_rate": 7.033831686311131e-06, "loss": 0.0, "step": 22176 }, { "epoch": 4.52, "learning_rate": 7.027966266416751e-06, "loss": 0.001, "step": 22177 }, { "epoch": 4.52, "learning_rate": 7.022103234425231e-06, "loss": 0.0008, "step": 22178 }, { "epoch": 4.52, "learning_rate": 7.01624259043444e-06, "loss": 0.003, "step": 22179 }, { "epoch": 4.52, "learning_rate": 7.010384334542335e-06, "loss": 0.0039, "step": 22180 }, { "epoch": 4.52, "learning_rate": 7.0045284668466875e-06, "loss": 0.0012, "step": 22181 }, { "epoch": 4.52, "learning_rate": 6.998674987445369e-06, "loss": 0.0003, "step": 22182 }, { "epoch": 4.52, "learning_rate": 6.9928238964361005e-06, "loss": 0.0045, "step": 22183 }, { "epoch": 4.52, "learning_rate": 6.986975193916605e-06, "loss": 0.0019, "step": 22184 }, { "epoch": 4.52, "learning_rate": 6.981128879984588e-06, "loss": 0.0004, "step": 22185 }, { "epoch": 4.52, "learning_rate": 6.97528495473767e-06, "loss": 0.0024, "step": 22186 }, { "epoch": 4.52, "learning_rate": 6.969443418273507e-06, "loss": 0.0038, "step": 22187 }, { "epoch": 4.52, "learning_rate": 6.963604270689621e-06, "loss": 0.0001, "step": 22188 }, { "epoch": 4.52, "learning_rate": 6.957767512083534e-06, "loss": 0.0032, "step": 22189 }, { "epoch": 4.52, "learning_rate": 6.951933142552734e-06, "loss": 0.0002, "step": 22190 }, { "epoch": 4.52, "learning_rate": 6.946101162194678e-06, "loss": 0.0004, "step": 22191 }, { "epoch": 4.52, "learning_rate": 6.94027157110677e-06, "loss": 0.0026, "step": 22192 }, { "epoch": 4.52, "learning_rate": 6.934444369386366e-06, "loss": 0.0001, "step": 22193 }, { "epoch": 4.52, "learning_rate": 6.9286195571308045e-06, "loss": 0.0001, "step": 22194 }, { "epoch": 4.52, "learning_rate": 6.922797134437358e-06, "loss": 0.0013, "step": 22195 }, { "epoch": 4.52, "learning_rate": 6.9169771014032985e-06, "loss": 0.0006, "step": 22196 }, { "epoch": 4.52, "learning_rate": 6.911159458125764e-06, "loss": 0.0001, "step": 22197 }, { "epoch": 4.52, "learning_rate": 6.905344204702012e-06, "loss": 0.0018, "step": 22198 }, { "epoch": 4.52, "learning_rate": 6.899531341229081e-06, "loss": 0.0026, "step": 22199 }, { "epoch": 4.52, "learning_rate": 6.893720867804126e-06, "loss": 0.001, "step": 22200 }, { "epoch": 4.52, "learning_rate": 6.887912784524169e-06, "loss": 0.001, "step": 22201 }, { "epoch": 4.52, "learning_rate": 6.8821070914861835e-06, "loss": 0.0003, "step": 22202 }, { "epoch": 4.52, "learning_rate": 6.87630378878719e-06, "loss": 0.0002, "step": 22203 }, { "epoch": 4.52, "learning_rate": 6.870502876524065e-06, "loss": 0.0002, "step": 22204 }, { "epoch": 4.52, "learning_rate": 6.864704354793727e-06, "loss": 0.0013, "step": 22205 }, { "epoch": 4.52, "learning_rate": 6.858908223693016e-06, "loss": 0.0029, "step": 22206 }, { "epoch": 4.52, "learning_rate": 6.853114483318739e-06, "loss": 0.0003, "step": 22207 }, { "epoch": 4.52, "learning_rate": 6.847323133767651e-06, "loss": 0.006, "step": 22208 }, { "epoch": 4.52, "learning_rate": 6.841534175136493e-06, "loss": 0.0007, "step": 22209 }, { "epoch": 4.52, "learning_rate": 6.835747607521952e-06, "loss": 0.0008, "step": 22210 }, { "epoch": 4.52, "learning_rate": 6.829963431020668e-06, "loss": 0.0004, "step": 22211 }, { "epoch": 4.52, "learning_rate": 6.824181645729215e-06, "loss": 0.0002, "step": 22212 }, { "epoch": 4.52, "learning_rate": 6.8184022517442485e-06, "loss": 0.0004, "step": 22213 }, { "epoch": 4.52, "learning_rate": 6.812625249162173e-06, "loss": 0.0013, "step": 22214 }, { "epoch": 4.52, "learning_rate": 6.80685063807958e-06, "loss": 0.0013, "step": 22215 }, { "epoch": 4.52, "learning_rate": 6.801078418592892e-06, "loss": 0.0006, "step": 22216 }, { "epoch": 4.52, "learning_rate": 6.795308590798465e-06, "loss": 0.0063, "step": 22217 }, { "epoch": 4.52, "learning_rate": 6.789541154792721e-06, "loss": 0.0016, "step": 22218 }, { "epoch": 4.52, "learning_rate": 6.783776110671968e-06, "loss": 0.0002, "step": 22219 }, { "epoch": 4.52, "learning_rate": 6.7780134585324945e-06, "loss": 0.0005, "step": 22220 }, { "epoch": 4.52, "learning_rate": 6.77225319847054e-06, "loss": 0.0003, "step": 22221 }, { "epoch": 4.52, "learning_rate": 6.766495330582328e-06, "loss": 0.0003, "step": 22222 }, { "epoch": 4.53, "learning_rate": 6.760739854964014e-06, "loss": 0.0005, "step": 22223 }, { "epoch": 4.53, "learning_rate": 6.754986771711724e-06, "loss": 0.0046, "step": 22224 }, { "epoch": 4.53, "learning_rate": 6.749236080921544e-06, "loss": 0.003, "step": 22225 }, { "epoch": 4.53, "learning_rate": 6.743487782689533e-06, "loss": 0.0001, "step": 22226 }, { "epoch": 4.53, "learning_rate": 6.737741877111697e-06, "loss": 0.0081, "step": 22227 }, { "epoch": 4.53, "learning_rate": 6.731998364283991e-06, "loss": 0.0, "step": 22228 }, { "epoch": 4.53, "learning_rate": 6.7262572443023575e-06, "loss": 0.002, "step": 22229 }, { "epoch": 4.53, "learning_rate": 6.720518517262652e-06, "loss": 0.0008, "step": 22230 }, { "epoch": 4.53, "learning_rate": 6.714782183260781e-06, "loss": 0.0001, "step": 22231 }, { "epoch": 4.53, "learning_rate": 6.709048242392484e-06, "loss": 0.0001, "step": 22232 }, { "epoch": 4.53, "learning_rate": 6.703316694753602e-06, "loss": 0.0005, "step": 22233 }, { "epoch": 4.53, "learning_rate": 6.6975875404397915e-06, "loss": 0.001, "step": 22234 }, { "epoch": 4.53, "learning_rate": 6.691860779546792e-06, "loss": 0.0116, "step": 22235 }, { "epoch": 4.53, "learning_rate": 6.686136412170212e-06, "loss": 0.0045, "step": 22236 }, { "epoch": 4.53, "learning_rate": 6.68041443840569e-06, "loss": 0.0001, "step": 22237 }, { "epoch": 4.53, "learning_rate": 6.674694858348767e-06, "loss": 0.003, "step": 22238 }, { "epoch": 4.53, "learning_rate": 6.668977672094999e-06, "loss": 0.0069, "step": 22239 }, { "epoch": 4.53, "learning_rate": 6.663262879739861e-06, "loss": 0.0005, "step": 22240 }, { "epoch": 4.53, "learning_rate": 6.657550481378793e-06, "loss": 0.0006, "step": 22241 }, { "epoch": 4.53, "learning_rate": 6.651840477107217e-06, "loss": 0.0001, "step": 22242 }, { "epoch": 4.53, "learning_rate": 6.646132867020476e-06, "loss": 0.0043, "step": 22243 }, { "epoch": 4.53, "learning_rate": 6.6404276512139584e-06, "loss": 0.001, "step": 22244 }, { "epoch": 4.53, "learning_rate": 6.634724829782856e-06, "loss": 0.0149, "step": 22245 }, { "epoch": 4.53, "learning_rate": 6.629024402822492e-06, "loss": 0.0006, "step": 22246 }, { "epoch": 4.53, "learning_rate": 6.623326370428072e-06, "loss": 0.0022, "step": 22247 }, { "epoch": 4.53, "learning_rate": 6.617630732694707e-06, "loss": 0.0001, "step": 22248 }, { "epoch": 4.53, "learning_rate": 6.6119374897176005e-06, "loss": 0.0001, "step": 22249 }, { "epoch": 4.53, "learning_rate": 6.606246641591761e-06, "loss": 0.0009, "step": 22250 }, { "epoch": 4.53, "learning_rate": 6.60055818841233e-06, "loss": 0.0021, "step": 22251 }, { "epoch": 4.53, "learning_rate": 6.594872130274232e-06, "loss": 0.0021, "step": 22252 }, { "epoch": 4.53, "learning_rate": 6.589188467272455e-06, "loss": 0.0029, "step": 22253 }, { "epoch": 4.53, "learning_rate": 6.583507199501959e-06, "loss": 0.004, "step": 22254 }, { "epoch": 4.53, "learning_rate": 6.577828327057599e-06, "loss": 0.0007, "step": 22255 }, { "epoch": 4.53, "learning_rate": 6.572151850034235e-06, "loss": 0.0056, "step": 22256 }, { "epoch": 4.53, "learning_rate": 6.566477768526674e-06, "loss": 0.0001, "step": 22257 }, { "epoch": 4.53, "learning_rate": 6.560806082629688e-06, "loss": 0.002, "step": 22258 }, { "epoch": 4.53, "learning_rate": 6.555136792438004e-06, "loss": 0.003, "step": 22259 }, { "epoch": 4.53, "learning_rate": 6.549469898046294e-06, "loss": 0.0001, "step": 22260 }, { "epoch": 4.53, "learning_rate": 6.5438053995492176e-06, "loss": 0.0015, "step": 22261 }, { "epoch": 4.53, "learning_rate": 6.538143297041415e-06, "loss": 0.004, "step": 22262 }, { "epoch": 4.53, "learning_rate": 6.5324835906173935e-06, "loss": 0.0004, "step": 22263 }, { "epoch": 4.53, "learning_rate": 6.5268262803717276e-06, "loss": 0.0002, "step": 22264 }, { "epoch": 4.53, "learning_rate": 6.5211713663988585e-06, "loss": 0.0013, "step": 22265 }, { "epoch": 4.53, "learning_rate": 6.515518848793294e-06, "loss": 0.001, "step": 22266 }, { "epoch": 4.53, "learning_rate": 6.509868727649409e-06, "loss": 0.0001, "step": 22267 }, { "epoch": 4.53, "learning_rate": 6.504221003061544e-06, "loss": 0.0038, "step": 22268 }, { "epoch": 4.53, "learning_rate": 6.49857567512409e-06, "loss": 0.0038, "step": 22269 }, { "epoch": 4.53, "learning_rate": 6.49293274393129e-06, "loss": 0.0003, "step": 22270 }, { "epoch": 4.53, "learning_rate": 6.487292209577383e-06, "loss": 0.0137, "step": 22271 }, { "epoch": 4.54, "learning_rate": 6.481654072156611e-06, "loss": 0.0009, "step": 22272 }, { "epoch": 4.54, "learning_rate": 6.4760183317631335e-06, "loss": 0.003, "step": 22273 }, { "epoch": 4.54, "learning_rate": 6.4703849884910564e-06, "loss": 0.0055, "step": 22274 }, { "epoch": 4.54, "learning_rate": 6.464754042434505e-06, "loss": 0.0, "step": 22275 }, { "epoch": 4.54, "learning_rate": 6.459125493687473e-06, "loss": 0.0003, "step": 22276 }, { "epoch": 4.54, "learning_rate": 6.453499342343998e-06, "loss": 0.0019, "step": 22277 }, { "epoch": 4.54, "learning_rate": 6.4478755884980584e-06, "loss": 0.0026, "step": 22278 }, { "epoch": 4.54, "learning_rate": 6.442254232243576e-06, "loss": 0.0005, "step": 22279 }, { "epoch": 4.54, "learning_rate": 6.436635273674446e-06, "loss": 0.006, "step": 22280 }, { "epoch": 4.54, "learning_rate": 6.431018712884456e-06, "loss": 0.002, "step": 22281 }, { "epoch": 4.54, "learning_rate": 6.425404549967516e-06, "loss": 0.0023, "step": 22282 }, { "epoch": 4.54, "learning_rate": 6.419792785017286e-06, "loss": 0.0031, "step": 22283 }, { "epoch": 4.54, "learning_rate": 6.414183418127572e-06, "loss": 0.002, "step": 22284 }, { "epoch": 4.54, "learning_rate": 6.4085764493920335e-06, "loss": 0.0028, "step": 22285 }, { "epoch": 4.54, "learning_rate": 6.402971878904295e-06, "loss": 0.0004, "step": 22286 }, { "epoch": 4.54, "learning_rate": 6.397369706757999e-06, "loss": 0.0008, "step": 22287 }, { "epoch": 4.54, "learning_rate": 6.391769933046703e-06, "loss": 0.0012, "step": 22288 }, { "epoch": 4.54, "learning_rate": 6.386172557863917e-06, "loss": 0.0001, "step": 22289 }, { "epoch": 4.54, "learning_rate": 6.380577581303148e-06, "loss": 0.0016, "step": 22290 }, { "epoch": 4.54, "learning_rate": 6.374985003457822e-06, "loss": 0.0004, "step": 22291 }, { "epoch": 4.54, "learning_rate": 6.369394824421364e-06, "loss": 0.0042, "step": 22292 }, { "epoch": 4.54, "learning_rate": 6.363807044287167e-06, "loss": 0.0002, "step": 22293 }, { "epoch": 4.54, "learning_rate": 6.358221663148472e-06, "loss": 0.0091, "step": 22294 }, { "epoch": 4.54, "learning_rate": 6.352638681098654e-06, "loss": 0.0004, "step": 22295 }, { "epoch": 4.54, "learning_rate": 6.347058098230889e-06, "loss": 0.0001, "step": 22296 }, { "epoch": 4.54, "learning_rate": 6.341479914638454e-06, "loss": 0.0002, "step": 22297 }, { "epoch": 4.54, "learning_rate": 6.335904130414471e-06, "loss": 0.001, "step": 22298 }, { "epoch": 4.54, "learning_rate": 6.330330745652051e-06, "loss": 0.0015, "step": 22299 }, { "epoch": 4.54, "learning_rate": 6.324759760444337e-06, "loss": 0.0003, "step": 22300 }, { "epoch": 4.54, "learning_rate": 6.319191174884302e-06, "loss": 0.0015, "step": 22301 }, { "epoch": 4.54, "learning_rate": 6.313624989065041e-06, "loss": 0.0012, "step": 22302 }, { "epoch": 4.54, "learning_rate": 6.308061203079429e-06, "loss": 0.0034, "step": 22303 }, { "epoch": 4.54, "learning_rate": 6.3024998170204566e-06, "loss": 0.0008, "step": 22304 }, { "epoch": 4.54, "learning_rate": 6.296940830980967e-06, "loss": 0.0032, "step": 22305 }, { "epoch": 4.54, "learning_rate": 6.291384245053837e-06, "loss": 0.0007, "step": 22306 }, { "epoch": 4.54, "learning_rate": 6.285830059331842e-06, "loss": 0.0004, "step": 22307 }, { "epoch": 4.54, "learning_rate": 6.280278273907791e-06, "loss": 0.0017, "step": 22308 }, { "epoch": 4.54, "learning_rate": 6.274728888874358e-06, "loss": 0.0017, "step": 22309 }, { "epoch": 4.54, "learning_rate": 6.269181904324272e-06, "loss": 0.0102, "step": 22310 }, { "epoch": 4.54, "learning_rate": 6.26363732035014e-06, "loss": 0.0023, "step": 22311 }, { "epoch": 4.54, "learning_rate": 6.2580951370446055e-06, "loss": 0.0038, "step": 22312 }, { "epoch": 4.54, "learning_rate": 6.252555354500227e-06, "loss": 0.0007, "step": 22313 }, { "epoch": 4.54, "learning_rate": 6.2470179728094815e-06, "loss": 0.0052, "step": 22314 }, { "epoch": 4.54, "learning_rate": 6.241482992064911e-06, "loss": 0.0004, "step": 22315 }, { "epoch": 4.54, "learning_rate": 6.235950412358908e-06, "loss": 0.0006, "step": 22316 }, { "epoch": 4.54, "learning_rate": 6.230420233783951e-06, "loss": 0.0049, "step": 22317 }, { "epoch": 4.54, "learning_rate": 6.224892456432345e-06, "loss": 0.002, "step": 22318 }, { "epoch": 4.54, "learning_rate": 6.21936708039642e-06, "loss": 0.0004, "step": 22319 }, { "epoch": 4.54, "learning_rate": 6.213844105768467e-06, "loss": 0.0017, "step": 22320 }, { "epoch": 4.54, "learning_rate": 6.208323532640746e-06, "loss": 0.0032, "step": 22321 }, { "epoch": 4.55, "learning_rate": 6.202805361105451e-06, "loss": 0.0017, "step": 22322 }, { "epoch": 4.55, "learning_rate": 6.197289591254722e-06, "loss": 0.0011, "step": 22323 }, { "epoch": 4.55, "learning_rate": 6.1917762231807225e-06, "loss": 0.0041, "step": 22324 }, { "epoch": 4.55, "learning_rate": 6.186265256975509e-06, "loss": 0.0031, "step": 22325 }, { "epoch": 4.55, "learning_rate": 6.180756692731142e-06, "loss": 0.0017, "step": 22326 }, { "epoch": 4.55, "learning_rate": 6.1752505305396e-06, "loss": 0.0036, "step": 22327 }, { "epoch": 4.55, "learning_rate": 6.16974677049289e-06, "loss": 0.0047, "step": 22328 }, { "epoch": 4.55, "learning_rate": 6.164245412682872e-06, "loss": 0.0061, "step": 22329 }, { "epoch": 4.55, "learning_rate": 6.158746457201475e-06, "loss": 0.0001, "step": 22330 }, { "epoch": 4.55, "learning_rate": 6.153249904140556e-06, "loss": 0.0014, "step": 22331 }, { "epoch": 4.55, "learning_rate": 6.14775575359186e-06, "loss": 0.0001, "step": 22332 }, { "epoch": 4.55, "learning_rate": 6.142264005647213e-06, "loss": 0.0004, "step": 22333 }, { "epoch": 4.55, "learning_rate": 6.136774660398275e-06, "loss": 0.0003, "step": 22334 }, { "epoch": 4.55, "learning_rate": 6.131287717936806e-06, "loss": 0.0001, "step": 22335 }, { "epoch": 4.55, "learning_rate": 6.125803178354383e-06, "loss": 0.0019, "step": 22336 }, { "epoch": 4.55, "learning_rate": 6.120321041742615e-06, "loss": 0.0051, "step": 22337 }, { "epoch": 4.55, "learning_rate": 6.11484130819308e-06, "loss": 0.0006, "step": 22338 }, { "epoch": 4.55, "learning_rate": 6.109363977797305e-06, "loss": 0.0024, "step": 22339 }, { "epoch": 4.55, "learning_rate": 6.1038890506467656e-06, "loss": 0.0009, "step": 22340 }, { "epoch": 4.55, "learning_rate": 6.098416526832905e-06, "loss": 0.0001, "step": 22341 }, { "epoch": 4.55, "learning_rate": 6.092946406447119e-06, "loss": 0.0001, "step": 22342 }, { "epoch": 4.55, "learning_rate": 6.087478689580766e-06, "loss": 0.0, "step": 22343 }, { "epoch": 4.55, "learning_rate": 6.08201337632519e-06, "loss": 0.003, "step": 22344 }, { "epoch": 4.55, "learning_rate": 6.076550466771634e-06, "loss": 0.0002, "step": 22345 }, { "epoch": 4.55, "learning_rate": 6.071089961011377e-06, "loss": 0.0012, "step": 22346 }, { "epoch": 4.55, "learning_rate": 6.065631859135578e-06, "loss": 0.0011, "step": 22347 }, { "epoch": 4.55, "learning_rate": 6.0601761612354636e-06, "loss": 0.0002, "step": 22348 }, { "epoch": 4.55, "learning_rate": 6.054722867402079e-06, "loss": 0.0062, "step": 22349 }, { "epoch": 4.55, "learning_rate": 6.0492719777265494e-06, "loss": 0.0005, "step": 22350 }, { "epoch": 4.55, "learning_rate": 6.0438234922999044e-06, "loss": 0.0034, "step": 22351 }, { "epoch": 4.55, "learning_rate": 6.0383774112131185e-06, "loss": 0.0001, "step": 22352 }, { "epoch": 4.55, "learning_rate": 6.0329337345572215e-06, "loss": 0.0006, "step": 22353 }, { "epoch": 4.55, "learning_rate": 6.027492462423056e-06, "loss": 0.0003, "step": 22354 }, { "epoch": 4.55, "learning_rate": 6.022053594901549e-06, "loss": 0.0005, "step": 22355 }, { "epoch": 4.55, "learning_rate": 6.016617132083512e-06, "loss": 0.0001, "step": 22356 }, { "epoch": 4.55, "learning_rate": 6.011183074059772e-06, "loss": 0.001, "step": 22357 }, { "epoch": 4.55, "learning_rate": 6.0057514209210566e-06, "loss": 0.0001, "step": 22358 }, { "epoch": 4.55, "learning_rate": 6.00032217275811e-06, "loss": 0.0002, "step": 22359 }, { "epoch": 4.55, "learning_rate": 5.994895329661608e-06, "loss": 0.0004, "step": 22360 }, { "epoch": 4.55, "learning_rate": 5.989470891722165e-06, "loss": 0.0001, "step": 22361 }, { "epoch": 4.55, "learning_rate": 5.984048859030421e-06, "loss": 0.0009, "step": 22362 }, { "epoch": 4.55, "learning_rate": 5.97862923167689e-06, "loss": 0.0043, "step": 22363 }, { "epoch": 4.55, "learning_rate": 5.973212009752132e-06, "loss": 0.0006, "step": 22364 }, { "epoch": 4.55, "learning_rate": 5.967797193346574e-06, "loss": 0.0005, "step": 22365 }, { "epoch": 4.55, "learning_rate": 5.962384782550711e-06, "loss": 0.0021, "step": 22366 }, { "epoch": 4.55, "learning_rate": 5.9569747774549035e-06, "loss": 0.009, "step": 22367 }, { "epoch": 4.55, "learning_rate": 5.951567178149513e-06, "loss": 0.0059, "step": 22368 }, { "epoch": 4.55, "learning_rate": 5.946161984724868e-06, "loss": 0.0024, "step": 22369 }, { "epoch": 4.55, "learning_rate": 5.940759197271228e-06, "loss": 0.0075, "step": 22370 }, { "epoch": 4.56, "learning_rate": 5.9353588158788375e-06, "loss": 0.0037, "step": 22371 }, { "epoch": 4.56, "learning_rate": 5.929960840637909e-06, "loss": 0.0032, "step": 22372 }, { "epoch": 4.56, "learning_rate": 5.924565271638587e-06, "loss": 0.0004, "step": 22373 }, { "epoch": 4.56, "learning_rate": 5.919172108970966e-06, "loss": 0.002, "step": 22374 }, { "epoch": 4.56, "learning_rate": 5.913781352725155e-06, "loss": 0.0004, "step": 22375 }, { "epoch": 4.56, "learning_rate": 5.908393002991185e-06, "loss": 0.0011, "step": 22376 }, { "epoch": 4.56, "learning_rate": 5.903007059859049e-06, "loss": 0.004, "step": 22377 }, { "epoch": 4.56, "learning_rate": 5.8976235234186765e-06, "loss": 0.002, "step": 22378 }, { "epoch": 4.56, "learning_rate": 5.8922423937600275e-06, "loss": 0.0013, "step": 22379 }, { "epoch": 4.56, "learning_rate": 5.88686367097293e-06, "loss": 0.0017, "step": 22380 }, { "epoch": 4.56, "learning_rate": 5.881487355147263e-06, "loss": 0.0063, "step": 22381 }, { "epoch": 4.56, "learning_rate": 5.876113446372788e-06, "loss": 0.0044, "step": 22382 }, { "epoch": 4.56, "learning_rate": 5.870741944739249e-06, "loss": 0.0048, "step": 22383 }, { "epoch": 4.56, "learning_rate": 5.865372850336425e-06, "loss": 0.0001, "step": 22384 }, { "epoch": 4.56, "learning_rate": 5.860006163253911e-06, "loss": 0.0003, "step": 22385 }, { "epoch": 4.56, "learning_rate": 5.854641883581418e-06, "loss": 0.0004, "step": 22386 }, { "epoch": 4.56, "learning_rate": 5.8492800114084745e-06, "loss": 0.0006, "step": 22387 }, { "epoch": 4.56, "learning_rate": 5.84392054682466e-06, "loss": 0.0002, "step": 22388 }, { "epoch": 4.56, "learning_rate": 5.838563489919484e-06, "loss": 0.0006, "step": 22389 }, { "epoch": 4.56, "learning_rate": 5.833208840782427e-06, "loss": 0.0001, "step": 22390 }, { "epoch": 4.56, "learning_rate": 5.827856599502917e-06, "loss": 0.0006, "step": 22391 }, { "epoch": 4.56, "learning_rate": 5.8225067661703315e-06, "loss": 0.0009, "step": 22392 }, { "epoch": 4.56, "learning_rate": 5.81715934087405e-06, "loss": 0.0026, "step": 22393 }, { "epoch": 4.56, "learning_rate": 5.811814323703384e-06, "loss": 0.0022, "step": 22394 }, { "epoch": 4.56, "learning_rate": 5.806471714747596e-06, "loss": 0.0028, "step": 22395 }, { "epoch": 4.56, "learning_rate": 5.80113151409588e-06, "loss": 0.0054, "step": 22396 }, { "epoch": 4.56, "learning_rate": 5.7957937218375e-06, "loss": 0.0005, "step": 22397 }, { "epoch": 4.56, "learning_rate": 5.790458338061532e-06, "loss": 0.0017, "step": 22398 }, { "epoch": 4.56, "learning_rate": 5.785125362857157e-06, "loss": 0.0001, "step": 22399 }, { "epoch": 4.56, "learning_rate": 5.7797947963134025e-06, "loss": 0.0008, "step": 22400 }, { "epoch": 4.56, "learning_rate": 5.774466638519298e-06, "loss": 0.0007, "step": 22401 }, { "epoch": 4.56, "learning_rate": 5.769140889563855e-06, "loss": 0.0015, "step": 22402 }, { "epoch": 4.56, "learning_rate": 5.763817549536021e-06, "loss": 0.0019, "step": 22403 }, { "epoch": 4.56, "learning_rate": 5.758496618524688e-06, "loss": 0.0002, "step": 22404 }, { "epoch": 4.56, "learning_rate": 5.753178096618738e-06, "loss": 0.0008, "step": 22405 }, { "epoch": 4.56, "learning_rate": 5.747861983906998e-06, "loss": 0.003, "step": 22406 }, { "epoch": 4.56, "learning_rate": 5.742548280478266e-06, "loss": 0.0035, "step": 22407 }, { "epoch": 4.56, "learning_rate": 5.7372369864212846e-06, "loss": 0.0004, "step": 22408 }, { "epoch": 4.56, "learning_rate": 5.731928101824751e-06, "loss": 0.0003, "step": 22409 }, { "epoch": 4.56, "learning_rate": 5.726621626777361e-06, "loss": 0.0001, "step": 22410 }, { "epoch": 4.56, "learning_rate": 5.721317561367694e-06, "loss": 0.0012, "step": 22411 }, { "epoch": 4.56, "learning_rate": 5.716015905684379e-06, "loss": 0.0005, "step": 22412 }, { "epoch": 4.56, "learning_rate": 5.710716659815962e-06, "loss": 0.0002, "step": 22413 }, { "epoch": 4.56, "learning_rate": 5.705419823850938e-06, "loss": 0.0005, "step": 22414 }, { "epoch": 4.56, "learning_rate": 5.700125397877803e-06, "loss": 0.0035, "step": 22415 }, { "epoch": 4.56, "learning_rate": 5.69483338198492e-06, "loss": 0.0002, "step": 22416 }, { "epoch": 4.56, "learning_rate": 5.689543776260752e-06, "loss": 0.0022, "step": 22417 }, { "epoch": 4.56, "learning_rate": 5.684256580793578e-06, "loss": 0.0006, "step": 22418 }, { "epoch": 4.56, "learning_rate": 5.678971795671744e-06, "loss": 0.002, "step": 22419 }, { "epoch": 4.57, "learning_rate": 5.6736894209835126e-06, "loss": 0.0019, "step": 22420 }, { "epoch": 4.57, "learning_rate": 5.6684094568170965e-06, "loss": 0.002, "step": 22421 }, { "epoch": 4.57, "learning_rate": 5.6631319032606924e-06, "loss": 0.0002, "step": 22422 }, { "epoch": 4.57, "learning_rate": 5.657856760402429e-06, "loss": 0.0013, "step": 22423 }, { "epoch": 4.57, "learning_rate": 5.652584028330437e-06, "loss": 0.0014, "step": 22424 }, { "epoch": 4.57, "learning_rate": 5.647313707132761e-06, "loss": 0.0052, "step": 22425 }, { "epoch": 4.57, "learning_rate": 5.642045796897432e-06, "loss": 0.0017, "step": 22426 }, { "epoch": 4.57, "learning_rate": 5.636780297712428e-06, "loss": 0.0014, "step": 22427 }, { "epoch": 4.57, "learning_rate": 5.631517209665715e-06, "loss": 0.0014, "step": 22428 }, { "epoch": 4.57, "learning_rate": 5.626256532845153e-06, "loss": 0.0019, "step": 22429 }, { "epoch": 4.57, "learning_rate": 5.6209982673386554e-06, "loss": 0.004, "step": 22430 }, { "epoch": 4.57, "learning_rate": 5.615742413234004e-06, "loss": 0.0019, "step": 22431 }, { "epoch": 4.57, "learning_rate": 5.6104889706190256e-06, "loss": 0.0022, "step": 22432 }, { "epoch": 4.57, "learning_rate": 5.605237939581403e-06, "loss": 0.0003, "step": 22433 }, { "epoch": 4.57, "learning_rate": 5.599989320208881e-06, "loss": 0.0012, "step": 22434 }, { "epoch": 4.57, "learning_rate": 5.594743112589123e-06, "loss": 0.0003, "step": 22435 }, { "epoch": 4.57, "learning_rate": 5.589499316809709e-06, "loss": 0.0028, "step": 22436 }, { "epoch": 4.57, "learning_rate": 5.584257932958286e-06, "loss": 0.0011, "step": 22437 }, { "epoch": 4.57, "learning_rate": 5.5790189611223504e-06, "loss": 0.0034, "step": 22438 }, { "epoch": 4.57, "learning_rate": 5.573782401389415e-06, "loss": 0.0039, "step": 22439 }, { "epoch": 4.57, "learning_rate": 5.568548253846928e-06, "loss": 0.0001, "step": 22440 }, { "epoch": 4.57, "learning_rate": 5.563316518582334e-06, "loss": 0.0005, "step": 22441 }, { "epoch": 4.57, "learning_rate": 5.558087195682964e-06, "loss": 0.0019, "step": 22442 }, { "epoch": 4.57, "learning_rate": 5.552860285236216e-06, "loss": 0.0038, "step": 22443 }, { "epoch": 4.57, "learning_rate": 5.547635787329352e-06, "loss": 0.0007, "step": 22444 }, { "epoch": 4.57, "learning_rate": 5.542413702049653e-06, "loss": 0.0003, "step": 22445 }, { "epoch": 4.57, "learning_rate": 5.537194029484349e-06, "loss": 0.0009, "step": 22446 }, { "epoch": 4.57, "learning_rate": 5.531976769720553e-06, "loss": 0.0003, "step": 22447 }, { "epoch": 4.57, "learning_rate": 5.526761922845496e-06, "loss": 0.0027, "step": 22448 }, { "epoch": 4.57, "learning_rate": 5.521549488946175e-06, "loss": 0.0022, "step": 22449 }, { "epoch": 4.57, "learning_rate": 5.516339468109754e-06, "loss": 0.0, "step": 22450 }, { "epoch": 4.57, "learning_rate": 5.511131860423163e-06, "loss": 0.0013, "step": 22451 }, { "epoch": 4.57, "learning_rate": 5.505926665973415e-06, "loss": 0.001, "step": 22452 }, { "epoch": 4.57, "learning_rate": 5.500723884847458e-06, "loss": 0.0001, "step": 22453 }, { "epoch": 4.57, "learning_rate": 5.495523517132156e-06, "loss": 0.0007, "step": 22454 }, { "epoch": 4.57, "learning_rate": 5.490325562914388e-06, "loss": 0.0009, "step": 22455 }, { "epoch": 4.57, "learning_rate": 5.48513002228097e-06, "loss": 0.0016, "step": 22456 }, { "epoch": 4.57, "learning_rate": 5.479936895318665e-06, "loss": 0.0008, "step": 22457 }, { "epoch": 4.57, "learning_rate": 5.47474618211422e-06, "loss": 0.0008, "step": 22458 }, { "epoch": 4.57, "learning_rate": 5.469557882754316e-06, "loss": 0.0002, "step": 22459 }, { "epoch": 4.57, "learning_rate": 5.464371997325617e-06, "loss": 0.0016, "step": 22460 }, { "epoch": 4.57, "learning_rate": 5.459188525914754e-06, "loss": 0.0001, "step": 22461 }, { "epoch": 4.57, "learning_rate": 5.454007468608257e-06, "loss": 0.0021, "step": 22462 }, { "epoch": 4.57, "learning_rate": 5.448828825492723e-06, "loss": 0.0003, "step": 22463 }, { "epoch": 4.57, "learning_rate": 5.443652596654552e-06, "loss": 0.0002, "step": 22464 }, { "epoch": 4.57, "learning_rate": 5.438478782180289e-06, "loss": 0.0006, "step": 22465 }, { "epoch": 4.57, "learning_rate": 5.433307382156316e-06, "loss": 0.0074, "step": 22466 }, { "epoch": 4.57, "learning_rate": 5.428138396668963e-06, "loss": 0.0022, "step": 22467 }, { "epoch": 4.57, "learning_rate": 5.422971825804645e-06, "loss": 0.0008, "step": 22468 }, { "epoch": 4.58, "learning_rate": 5.417807669649577e-06, "loss": 0.0005, "step": 22469 }, { "epoch": 4.58, "learning_rate": 5.412645928290038e-06, "loss": 0.0004, "step": 22470 }, { "epoch": 4.58, "learning_rate": 5.407486601812244e-06, "loss": 0.0004, "step": 22471 }, { "epoch": 4.58, "learning_rate": 5.402329690302359e-06, "loss": 0.0007, "step": 22472 }, { "epoch": 4.58, "learning_rate": 5.397175193846531e-06, "loss": 0.0008, "step": 22473 }, { "epoch": 4.58, "learning_rate": 5.392023112530808e-06, "loss": 0.0018, "step": 22474 }, { "epoch": 4.58, "learning_rate": 5.386873446441287e-06, "loss": 0.0001, "step": 22475 }, { "epoch": 4.58, "learning_rate": 5.381726195663949e-06, "loss": 0.0007, "step": 22476 }, { "epoch": 4.58, "learning_rate": 5.376581360284776e-06, "loss": 0.0034, "step": 22477 }, { "epoch": 4.58, "learning_rate": 5.371438940389683e-06, "loss": 0.0016, "step": 22478 }, { "epoch": 4.58, "learning_rate": 5.366298936064584e-06, "loss": 0.0001, "step": 22479 }, { "epoch": 4.58, "learning_rate": 5.3611613473952595e-06, "loss": 0.0002, "step": 22480 }, { "epoch": 4.58, "learning_rate": 5.356026174467626e-06, "loss": 0.0022, "step": 22481 }, { "epoch": 4.58, "learning_rate": 5.350893417367346e-06, "loss": 0.0021, "step": 22482 }, { "epoch": 4.58, "learning_rate": 5.345763076180221e-06, "loss": 0.0003, "step": 22483 }, { "epoch": 4.58, "learning_rate": 5.340635150991879e-06, "loss": 0.0034, "step": 22484 }, { "epoch": 4.58, "learning_rate": 5.33550964188802e-06, "loss": 0.001, "step": 22485 }, { "epoch": 4.58, "learning_rate": 5.330386548954208e-06, "loss": 0.0014, "step": 22486 }, { "epoch": 4.58, "learning_rate": 5.325265872276025e-06, "loss": 0.0011, "step": 22487 }, { "epoch": 4.58, "learning_rate": 5.320147611938985e-06, "loss": 0.0002, "step": 22488 }, { "epoch": 4.58, "learning_rate": 5.315031768028605e-06, "loss": 0.003, "step": 22489 }, { "epoch": 4.58, "learning_rate": 5.309918340630281e-06, "loss": 0.0078, "step": 22490 }, { "epoch": 4.58, "learning_rate": 5.304807329829463e-06, "loss": 0.0014, "step": 22491 }, { "epoch": 4.58, "learning_rate": 5.2996987357115e-06, "loss": 0.005, "step": 22492 }, { "epoch": 4.58, "learning_rate": 5.294592558361688e-06, "loss": 0.0002, "step": 22493 }, { "epoch": 4.58, "learning_rate": 5.28948879786536e-06, "loss": 0.0002, "step": 22494 }, { "epoch": 4.58, "learning_rate": 5.2843874543076815e-06, "loss": 0.0019, "step": 22495 }, { "epoch": 4.58, "learning_rate": 5.279288527773934e-06, "loss": 0.0015, "step": 22496 }, { "epoch": 4.58, "learning_rate": 5.2741920183492655e-06, "loss": 0.001, "step": 22497 }, { "epoch": 4.58, "learning_rate": 5.2690979261187426e-06, "loss": 0.0003, "step": 22498 }, { "epoch": 4.58, "learning_rate": 5.264006251167513e-06, "loss": 0.0014, "step": 22499 }, { "epoch": 4.58, "learning_rate": 5.258916993580559e-06, "loss": 0.0001, "step": 22500 }, { "epoch": 4.58, "learning_rate": 5.253830153442928e-06, "loss": 0.0034, "step": 22501 }, { "epoch": 4.58, "learning_rate": 5.2487457308395705e-06, "loss": 0.0009, "step": 22502 }, { "epoch": 4.58, "learning_rate": 5.2436637258553685e-06, "loss": 0.0001, "step": 22503 }, { "epoch": 4.58, "learning_rate": 5.238584138575252e-06, "loss": 0.0033, "step": 22504 }, { "epoch": 4.58, "learning_rate": 5.233506969084022e-06, "loss": 0.0001, "step": 22505 }, { "epoch": 4.58, "learning_rate": 5.22843221746651e-06, "loss": 0.0006, "step": 22506 }, { "epoch": 4.58, "learning_rate": 5.223359883807432e-06, "loss": 0.0006, "step": 22507 }, { "epoch": 4.58, "learning_rate": 5.218289968191553e-06, "loss": 0.001, "step": 22508 }, { "epoch": 4.58, "learning_rate": 5.213222470703504e-06, "loss": 0.0006, "step": 22509 }, { "epoch": 4.58, "learning_rate": 5.208157391427953e-06, "loss": 0.0034, "step": 22510 }, { "epoch": 4.58, "learning_rate": 5.203094730449497e-06, "loss": 0.0017, "step": 22511 }, { "epoch": 4.58, "learning_rate": 5.198034487852687e-06, "loss": 0.0009, "step": 22512 }, { "epoch": 4.58, "learning_rate": 5.192976663722004e-06, "loss": 0.0005, "step": 22513 }, { "epoch": 4.58, "learning_rate": 5.187921258141997e-06, "loss": 0.0002, "step": 22514 }, { "epoch": 4.58, "learning_rate": 5.182868271197032e-06, "loss": 0.0085, "step": 22515 }, { "epoch": 4.58, "learning_rate": 5.177817702971526e-06, "loss": 0.0016, "step": 22516 }, { "epoch": 4.58, "learning_rate": 5.172769553549844e-06, "loss": 0.0011, "step": 22517 }, { "epoch": 4.59, "learning_rate": 5.1677238230162675e-06, "loss": 0.0031, "step": 22518 }, { "epoch": 4.59, "learning_rate": 5.162680511455114e-06, "loss": 0.0062, "step": 22519 }, { "epoch": 4.59, "learning_rate": 5.157639618950599e-06, "loss": 0.0038, "step": 22520 }, { "epoch": 4.59, "learning_rate": 5.152601145586904e-06, "loss": 0.0022, "step": 22521 }, { "epoch": 4.59, "learning_rate": 5.147565091448197e-06, "loss": 0.0003, "step": 22522 }, { "epoch": 4.59, "learning_rate": 5.142531456618576e-06, "loss": 0.0001, "step": 22523 }, { "epoch": 4.59, "learning_rate": 5.137500241182108e-06, "loss": 0.004, "step": 22524 }, { "epoch": 4.59, "learning_rate": 5.132471445222841e-06, "loss": 0.0002, "step": 22525 }, { "epoch": 4.59, "learning_rate": 5.127445068824759e-06, "loss": 0.0013, "step": 22526 }, { "epoch": 4.59, "learning_rate": 5.122421112071812e-06, "loss": 0.0023, "step": 22527 }, { "epoch": 4.59, "learning_rate": 5.117399575047898e-06, "loss": 0.0009, "step": 22528 }, { "epoch": 4.59, "learning_rate": 5.112380457836918e-06, "loss": 0.001, "step": 22529 }, { "epoch": 4.59, "learning_rate": 5.10736376052267e-06, "loss": 0.0001, "step": 22530 }, { "epoch": 4.59, "learning_rate": 5.102349483188939e-06, "loss": 0.0039, "step": 22531 }, { "epoch": 4.59, "learning_rate": 5.097337625919507e-06, "loss": 0.0005, "step": 22532 }, { "epoch": 4.59, "learning_rate": 5.0923281887980225e-06, "loss": 0.0034, "step": 22533 }, { "epoch": 4.59, "learning_rate": 5.087321171908237e-06, "loss": 0.0028, "step": 22534 }, { "epoch": 4.59, "learning_rate": 5.082316575333701e-06, "loss": 0.001, "step": 22535 }, { "epoch": 4.59, "learning_rate": 5.077314399158044e-06, "loss": 0.0005, "step": 22536 }, { "epoch": 4.59, "learning_rate": 5.072314643464787e-06, "loss": 0.0003, "step": 22537 }, { "epoch": 4.59, "learning_rate": 5.067317308337443e-06, "loss": 0.0003, "step": 22538 }, { "epoch": 4.59, "learning_rate": 5.06232239385948e-06, "loss": 0.0003, "step": 22539 }, { "epoch": 4.59, "learning_rate": 5.057329900114332e-06, "loss": 0.0007, "step": 22540 }, { "epoch": 4.59, "learning_rate": 5.052339827185364e-06, "loss": 0.0058, "step": 22541 }, { "epoch": 4.59, "learning_rate": 5.047352175155928e-06, "loss": 0.0002, "step": 22542 }, { "epoch": 4.59, "learning_rate": 5.042366944109355e-06, "loss": 0.0031, "step": 22543 }, { "epoch": 4.59, "learning_rate": 5.037384134128847e-06, "loss": 0.0045, "step": 22544 }, { "epoch": 4.59, "learning_rate": 5.032403745297686e-06, "loss": 0.0021, "step": 22545 }, { "epoch": 4.59, "learning_rate": 5.02742577769899e-06, "loss": 0.0011, "step": 22546 }, { "epoch": 4.59, "learning_rate": 5.022450231415992e-06, "loss": 0.0001, "step": 22547 }, { "epoch": 4.59, "learning_rate": 5.017477106531708e-06, "loss": 0.0013, "step": 22548 }, { "epoch": 4.59, "learning_rate": 5.012506403129208e-06, "loss": 0.0016, "step": 22549 }, { "epoch": 4.59, "learning_rate": 5.007538121291587e-06, "loss": 0.005, "step": 22550 }, { "epoch": 4.59, "learning_rate": 5.002572261101717e-06, "loss": 0.0024, "step": 22551 }, { "epoch": 4.59, "learning_rate": 4.997608822642646e-06, "loss": 0.0016, "step": 22552 }, { "epoch": 4.59, "learning_rate": 4.992647805997191e-06, "loss": 0.001, "step": 22553 }, { "epoch": 4.59, "learning_rate": 4.987689211248236e-06, "loss": 0.0004, "step": 22554 }, { "epoch": 4.59, "learning_rate": 4.982733038478598e-06, "loss": 0.0004, "step": 22555 }, { "epoch": 4.59, "learning_rate": 4.977779287771078e-06, "loss": 0.0037, "step": 22556 }, { "epoch": 4.59, "learning_rate": 4.9728279592083756e-06, "loss": 0.0015, "step": 22557 }, { "epoch": 4.59, "learning_rate": 4.967879052873208e-06, "loss": 0.0021, "step": 22558 }, { "epoch": 4.59, "learning_rate": 4.962932568848227e-06, "loss": 0.0001, "step": 22559 }, { "epoch": 4.59, "learning_rate": 4.957988507216048e-06, "loss": 0.0011, "step": 22560 }, { "epoch": 4.59, "learning_rate": 4.953046868059258e-06, "loss": 0.0003, "step": 22561 }, { "epoch": 4.59, "learning_rate": 4.94810765146037e-06, "loss": 0.0021, "step": 22562 }, { "epoch": 4.59, "learning_rate": 4.943170857501904e-06, "loss": 0.0078, "step": 22563 }, { "epoch": 4.59, "learning_rate": 4.9382364862662614e-06, "loss": 0.0011, "step": 22564 }, { "epoch": 4.59, "learning_rate": 4.933304537835942e-06, "loss": 0.0001, "step": 22565 }, { "epoch": 4.59, "learning_rate": 4.928375012293245e-06, "loss": 0.0012, "step": 22566 }, { "epoch": 4.6, "learning_rate": 4.923447909720524e-06, "loss": 0.0008, "step": 22567 }, { "epoch": 4.6, "learning_rate": 4.918523230200078e-06, "loss": 0.0016, "step": 22568 }, { "epoch": 4.6, "learning_rate": 4.913600973814158e-06, "loss": 0.0004, "step": 22569 }, { "epoch": 4.6, "learning_rate": 4.9086811406449655e-06, "loss": 0.001, "step": 22570 }, { "epoch": 4.6, "learning_rate": 4.903763730774684e-06, "loss": 0.002, "step": 22571 }, { "epoch": 4.6, "learning_rate": 4.8988487442854325e-06, "loss": 0.0002, "step": 22572 }, { "epoch": 4.6, "learning_rate": 4.893936181259311e-06, "loss": 0.0032, "step": 22573 }, { "epoch": 4.6, "learning_rate": 4.889026041778355e-06, "loss": 0.0005, "step": 22574 }, { "epoch": 4.6, "learning_rate": 4.8841183259245795e-06, "loss": 0.0037, "step": 22575 }, { "epoch": 4.6, "learning_rate": 4.879213033779972e-06, "loss": 0.0003, "step": 22576 }, { "epoch": 4.6, "learning_rate": 4.874310165426415e-06, "loss": 0.0019, "step": 22577 }, { "epoch": 4.6, "learning_rate": 4.8694097209458275e-06, "loss": 0.0024, "step": 22578 }, { "epoch": 4.6, "learning_rate": 4.864511700420059e-06, "loss": 0.0002, "step": 22579 }, { "epoch": 4.6, "learning_rate": 4.8596161039308965e-06, "loss": 0.0002, "step": 22580 }, { "epoch": 4.6, "learning_rate": 4.85472293156014e-06, "loss": 0.0097, "step": 22581 }, { "epoch": 4.6, "learning_rate": 4.8498321833894735e-06, "loss": 0.0014, "step": 22582 }, { "epoch": 4.6, "learning_rate": 4.844943859500616e-06, "loss": 0.0002, "step": 22583 }, { "epoch": 4.6, "learning_rate": 4.840057959975169e-06, "loss": 0.0007, "step": 22584 }, { "epoch": 4.6, "learning_rate": 4.835174484894799e-06, "loss": 0.0033, "step": 22585 }, { "epoch": 4.6, "learning_rate": 4.830293434341009e-06, "loss": 0.0008, "step": 22586 }, { "epoch": 4.6, "learning_rate": 4.82541480839535e-06, "loss": 0.0019, "step": 22587 }, { "epoch": 4.6, "learning_rate": 4.82053860713929e-06, "loss": 0.0006, "step": 22588 }, { "epoch": 4.6, "learning_rate": 4.815664830654297e-06, "loss": 0.0012, "step": 22589 }, { "epoch": 4.6, "learning_rate": 4.81079347902174e-06, "loss": 0.001, "step": 22590 }, { "epoch": 4.6, "learning_rate": 4.805924552323004e-06, "loss": 0.0008, "step": 22591 }, { "epoch": 4.6, "learning_rate": 4.801058050639406e-06, "loss": 0.0001, "step": 22592 }, { "epoch": 4.6, "learning_rate": 4.796193974052215e-06, "loss": 0.0012, "step": 22593 }, { "epoch": 4.6, "learning_rate": 4.791332322642699e-06, "loss": 0.0002, "step": 22594 }, { "epoch": 4.6, "learning_rate": 4.786473096491994e-06, "loss": 0.0026, "step": 22595 }, { "epoch": 4.6, "learning_rate": 4.781616295681334e-06, "loss": 0.0032, "step": 22596 }, { "epoch": 4.6, "learning_rate": 4.776761920291772e-06, "loss": 0.0028, "step": 22597 }, { "epoch": 4.6, "learning_rate": 4.771909970404442e-06, "loss": 0.0007, "step": 22598 }, { "epoch": 4.6, "learning_rate": 4.767060446100329e-06, "loss": 0.0009, "step": 22599 }, { "epoch": 4.6, "learning_rate": 4.762213347460469e-06, "loss": 0.0006, "step": 22600 }, { "epoch": 4.6, "learning_rate": 4.757368674565798e-06, "loss": 0.0009, "step": 22601 }, { "epoch": 4.6, "learning_rate": 4.752526427497216e-06, "loss": 0.0013, "step": 22602 }, { "epoch": 4.6, "learning_rate": 4.747686606335643e-06, "loss": 0.0026, "step": 22603 }, { "epoch": 4.6, "learning_rate": 4.742849211161881e-06, "loss": 0.003, "step": 22604 }, { "epoch": 4.6, "learning_rate": 4.738014242056715e-06, "loss": 0.0023, "step": 22605 }, { "epoch": 4.6, "learning_rate": 4.7331816991009295e-06, "loss": 0.0023, "step": 22606 }, { "epoch": 4.6, "learning_rate": 4.728351582375211e-06, "loss": 0.0046, "step": 22607 }, { "epoch": 4.6, "learning_rate": 4.723523891960246e-06, "loss": 0.001, "step": 22608 }, { "epoch": 4.6, "learning_rate": 4.718698627936651e-06, "loss": 0.0013, "step": 22609 }, { "epoch": 4.6, "learning_rate": 4.71387579038503e-06, "loss": 0.0001, "step": 22610 }, { "epoch": 4.6, "learning_rate": 4.709055379385934e-06, "loss": 0.0019, "step": 22611 }, { "epoch": 4.6, "learning_rate": 4.704237395019866e-06, "loss": 0.0045, "step": 22612 }, { "epoch": 4.6, "learning_rate": 4.699421837367312e-06, "loss": 0.0042, "step": 22613 }, { "epoch": 4.6, "learning_rate": 4.69460870650869e-06, "loss": 0.0089, "step": 22614 }, { "epoch": 4.6, "learning_rate": 4.689798002524353e-06, "loss": 0.0005, "step": 22615 }, { "epoch": 4.61, "learning_rate": 4.68498972549472e-06, "loss": 0.0019, "step": 22616 }, { "epoch": 4.61, "learning_rate": 4.680183875500043e-06, "loss": 0.0017, "step": 22617 }, { "epoch": 4.61, "learning_rate": 4.675380452620608e-06, "loss": 0.0001, "step": 22618 }, { "epoch": 4.61, "learning_rate": 4.670579456936635e-06, "loss": 0.0002, "step": 22619 }, { "epoch": 4.61, "learning_rate": 4.665780888528308e-06, "loss": 0.0025, "step": 22620 }, { "epoch": 4.61, "learning_rate": 4.660984747475782e-06, "loss": 0.0007, "step": 22621 }, { "epoch": 4.61, "learning_rate": 4.656191033859175e-06, "loss": 0.0008, "step": 22622 }, { "epoch": 4.61, "learning_rate": 4.651399747758505e-06, "loss": 0.0023, "step": 22623 }, { "epoch": 4.61, "learning_rate": 4.646610889253844e-06, "loss": 0.0029, "step": 22624 }, { "epoch": 4.61, "learning_rate": 4.641824458425142e-06, "loss": 0.0055, "step": 22625 }, { "epoch": 4.61, "learning_rate": 4.63704045535237e-06, "loss": 0.0003, "step": 22626 }, { "epoch": 4.61, "learning_rate": 4.632258880115414e-06, "loss": 0.0002, "step": 22627 }, { "epoch": 4.61, "learning_rate": 4.627479732794126e-06, "loss": 0.0008, "step": 22628 }, { "epoch": 4.61, "learning_rate": 4.622703013468343e-06, "loss": 0.0005, "step": 22629 }, { "epoch": 4.61, "learning_rate": 4.617928722217817e-06, "loss": 0.0002, "step": 22630 }, { "epoch": 4.61, "learning_rate": 4.613156859122336e-06, "loss": 0.0005, "step": 22631 }, { "epoch": 4.61, "learning_rate": 4.608387424261567e-06, "loss": 0.0017, "step": 22632 }, { "epoch": 4.61, "learning_rate": 4.6036204177151644e-06, "loss": 0.0003, "step": 22633 }, { "epoch": 4.61, "learning_rate": 4.598855839562782e-06, "loss": 0.0004, "step": 22634 }, { "epoch": 4.61, "learning_rate": 4.594093689883921e-06, "loss": 0.002, "step": 22635 }, { "epoch": 4.61, "learning_rate": 4.589333968758219e-06, "loss": 0.0033, "step": 22636 }, { "epoch": 4.61, "learning_rate": 4.584576676265095e-06, "loss": 0.0027, "step": 22637 }, { "epoch": 4.61, "learning_rate": 4.579821812484053e-06, "loss": 0.0026, "step": 22638 }, { "epoch": 4.61, "learning_rate": 4.575069377494461e-06, "loss": 0.0001, "step": 22639 }, { "epoch": 4.61, "learning_rate": 4.5703193713757245e-06, "loss": 0.0023, "step": 22640 }, { "epoch": 4.61, "learning_rate": 4.565571794207179e-06, "loss": 0.0004, "step": 22641 }, { "epoch": 4.61, "learning_rate": 4.560826646068111e-06, "loss": 0.0002, "step": 22642 }, { "epoch": 4.61, "learning_rate": 4.5560839270377736e-06, "loss": 0.0022, "step": 22643 }, { "epoch": 4.61, "learning_rate": 4.551343637195387e-06, "loss": 0.004, "step": 22644 }, { "epoch": 4.61, "learning_rate": 4.546605776620122e-06, "loss": 0.0013, "step": 22645 }, { "epoch": 4.61, "learning_rate": 4.54187034539108e-06, "loss": 0.0053, "step": 22646 }, { "epoch": 4.61, "learning_rate": 4.537137343587399e-06, "loss": 0.0082, "step": 22647 }, { "epoch": 4.61, "learning_rate": 4.532406771288067e-06, "loss": 0.0006, "step": 22648 }, { "epoch": 4.61, "learning_rate": 4.527678628572168e-06, "loss": 0.0003, "step": 22649 }, { "epoch": 4.61, "learning_rate": 4.522952915518624e-06, "loss": 0.0032, "step": 22650 }, { "epoch": 4.61, "learning_rate": 4.518229632206371e-06, "loss": 0.0002, "step": 22651 }, { "epoch": 4.61, "learning_rate": 4.513508778714297e-06, "loss": 0.0007, "step": 22652 }, { "epoch": 4.61, "learning_rate": 4.508790355121256e-06, "loss": 0.0011, "step": 22653 }, { "epoch": 4.61, "learning_rate": 4.504074361506049e-06, "loss": 0.0028, "step": 22654 }, { "epoch": 4.61, "learning_rate": 4.499360797947432e-06, "loss": 0.003, "step": 22655 }, { "epoch": 4.61, "learning_rate": 4.494649664524158e-06, "loss": 0.0009, "step": 22656 }, { "epoch": 4.61, "learning_rate": 4.489940961314881e-06, "loss": 0.0004, "step": 22657 }, { "epoch": 4.61, "learning_rate": 4.48523468839827e-06, "loss": 0.0012, "step": 22658 }, { "epoch": 4.61, "learning_rate": 4.4805308458529144e-06, "loss": 0.0003, "step": 22659 }, { "epoch": 4.61, "learning_rate": 4.4758294337574e-06, "loss": 0.0075, "step": 22660 }, { "epoch": 4.61, "learning_rate": 4.471130452190197e-06, "loss": 0.0002, "step": 22661 }, { "epoch": 4.61, "learning_rate": 4.466433901229843e-06, "loss": 0.0003, "step": 22662 }, { "epoch": 4.61, "learning_rate": 4.461739780954743e-06, "loss": 0.0013, "step": 22663 }, { "epoch": 4.61, "learning_rate": 4.457048091443316e-06, "loss": 0.0, "step": 22664 }, { "epoch": 4.62, "learning_rate": 4.452358832773934e-06, "loss": 0.0039, "step": 22665 }, { "epoch": 4.62, "learning_rate": 4.447672005024883e-06, "loss": 0.0024, "step": 22666 }, { "epoch": 4.62, "learning_rate": 4.442987608274468e-06, "loss": 0.0003, "step": 22667 }, { "epoch": 4.62, "learning_rate": 4.438305642600925e-06, "loss": 0.0065, "step": 22668 }, { "epoch": 4.62, "learning_rate": 4.433626108082428e-06, "loss": 0.0008, "step": 22669 }, { "epoch": 4.62, "learning_rate": 4.428949004797161e-06, "loss": 0.0015, "step": 22670 }, { "epoch": 4.62, "learning_rate": 4.424274332823213e-06, "loss": 0.0001, "step": 22671 }, { "epoch": 4.62, "learning_rate": 4.419602092238689e-06, "loss": 0.0, "step": 22672 }, { "epoch": 4.62, "learning_rate": 4.414932283121625e-06, "loss": 0.0001, "step": 22673 }, { "epoch": 4.62, "learning_rate": 4.410264905549993e-06, "loss": 0.0019, "step": 22674 }, { "epoch": 4.62, "learning_rate": 4.405599959601747e-06, "loss": 0.0009, "step": 22675 }, { "epoch": 4.62, "learning_rate": 4.400937445354824e-06, "loss": 0.001, "step": 22676 }, { "epoch": 4.62, "learning_rate": 4.396277362887079e-06, "loss": 0.0029, "step": 22677 }, { "epoch": 4.62, "learning_rate": 4.39161971227635e-06, "loss": 0.0003, "step": 22678 }, { "epoch": 4.62, "learning_rate": 4.386964493600409e-06, "loss": 0.0027, "step": 22679 }, { "epoch": 4.62, "learning_rate": 4.3823117069370584e-06, "loss": 0.0006, "step": 22680 }, { "epoch": 4.62, "learning_rate": 4.377661352363954e-06, "loss": 0.0042, "step": 22681 }, { "epoch": 4.62, "learning_rate": 4.3730134299588e-06, "loss": 0.0041, "step": 22682 }, { "epoch": 4.62, "learning_rate": 4.3683679397992e-06, "loss": 0.0002, "step": 22683 }, { "epoch": 4.62, "learning_rate": 4.363724881962744e-06, "loss": 0.0058, "step": 22684 }, { "epoch": 4.62, "learning_rate": 4.359084256527018e-06, "loss": 0.001, "step": 22685 }, { "epoch": 4.62, "learning_rate": 4.354446063569478e-06, "loss": 0.0009, "step": 22686 }, { "epoch": 4.62, "learning_rate": 4.349810303167628e-06, "loss": 0.0008, "step": 22687 }, { "epoch": 4.62, "learning_rate": 4.345176975398889e-06, "loss": 0.0039, "step": 22688 }, { "epoch": 4.62, "learning_rate": 4.340546080340618e-06, "loss": 0.0007, "step": 22689 }, { "epoch": 4.62, "learning_rate": 4.335917618070184e-06, "loss": 0.0087, "step": 22690 }, { "epoch": 4.62, "learning_rate": 4.331291588664893e-06, "loss": 0.0087, "step": 22691 }, { "epoch": 4.62, "learning_rate": 4.326667992201998e-06, "loss": 0.0085, "step": 22692 }, { "epoch": 4.62, "learning_rate": 4.322046828758724e-06, "loss": 0.0027, "step": 22693 }, { "epoch": 4.62, "learning_rate": 4.31742809841224e-06, "loss": 0.0011, "step": 22694 }, { "epoch": 4.62, "learning_rate": 4.312811801239718e-06, "loss": 0.0014, "step": 22695 }, { "epoch": 4.62, "learning_rate": 4.308197937318264e-06, "loss": 0.0019, "step": 22696 }, { "epoch": 4.62, "learning_rate": 4.303586506724882e-06, "loss": 0.0002, "step": 22697 }, { "epoch": 4.62, "learning_rate": 4.298977509536644e-06, "loss": 0.005, "step": 22698 }, { "epoch": 4.62, "learning_rate": 4.2943709458304886e-06, "loss": 0.0015, "step": 22699 }, { "epoch": 4.62, "learning_rate": 4.2897668156834205e-06, "loss": 0.0052, "step": 22700 }, { "epoch": 4.62, "learning_rate": 4.285165119172262e-06, "loss": 0.0037, "step": 22701 }, { "epoch": 4.62, "learning_rate": 4.280565856373918e-06, "loss": 0.0017, "step": 22702 }, { "epoch": 4.62, "learning_rate": 4.275969027365178e-06, "loss": 0.0019, "step": 22703 }, { "epoch": 4.62, "learning_rate": 4.2713746322228296e-06, "loss": 0.0012, "step": 22704 }, { "epoch": 4.62, "learning_rate": 4.266782671023611e-06, "loss": 0.0003, "step": 22705 }, { "epoch": 4.62, "learning_rate": 4.262193143844211e-06, "loss": 0.0003, "step": 22706 }, { "epoch": 4.62, "learning_rate": 4.257606050761286e-06, "loss": 0.0006, "step": 22707 }, { "epoch": 4.62, "learning_rate": 4.253021391851441e-06, "loss": 0.0137, "step": 22708 }, { "epoch": 4.62, "learning_rate": 4.2484391671912644e-06, "loss": 0.0002, "step": 22709 }, { "epoch": 4.62, "learning_rate": 4.243859376857278e-06, "loss": 0.0031, "step": 22710 }, { "epoch": 4.62, "learning_rate": 4.239282020925988e-06, "loss": 0.0015, "step": 22711 }, { "epoch": 4.62, "learning_rate": 4.2347070994738e-06, "loss": 0.0041, "step": 22712 }, { "epoch": 4.62, "learning_rate": 4.230134612577185e-06, "loss": 0.0003, "step": 22713 }, { "epoch": 4.63, "learning_rate": 4.225564560312466e-06, "loss": 0.0086, "step": 22714 }, { "epoch": 4.63, "learning_rate": 4.220996942755983e-06, "loss": 0.0002, "step": 22715 }, { "epoch": 4.63, "learning_rate": 4.21643175998404e-06, "loss": 0.003, "step": 22716 }, { "epoch": 4.63, "learning_rate": 4.21186901207286e-06, "loss": 0.0002, "step": 22717 }, { "epoch": 4.63, "learning_rate": 4.2073086990986826e-06, "loss": 0.0021, "step": 22718 }, { "epoch": 4.63, "learning_rate": 4.202750821137646e-06, "loss": 0.0013, "step": 22719 }, { "epoch": 4.63, "learning_rate": 4.1981953782658725e-06, "loss": 0.0022, "step": 22720 }, { "epoch": 4.63, "learning_rate": 4.193642370559453e-06, "loss": 0.0016, "step": 22721 }, { "epoch": 4.63, "learning_rate": 4.18909179809444e-06, "loss": 0.0031, "step": 22722 }, { "epoch": 4.63, "learning_rate": 4.184543660946843e-06, "loss": 0.0, "step": 22723 }, { "epoch": 4.63, "learning_rate": 4.179997959192599e-06, "loss": 0.0003, "step": 22724 }, { "epoch": 4.63, "learning_rate": 4.175454692907648e-06, "loss": 0.0002, "step": 22725 }, { "epoch": 4.63, "learning_rate": 4.170913862167879e-06, "loss": 0.0004, "step": 22726 }, { "epoch": 4.63, "learning_rate": 4.166375467049099e-06, "loss": 0.0006, "step": 22727 }, { "epoch": 4.63, "learning_rate": 4.161839507627146e-06, "loss": 0.0031, "step": 22728 }, { "epoch": 4.63, "learning_rate": 4.15730598397776e-06, "loss": 0.0003, "step": 22729 }, { "epoch": 4.63, "learning_rate": 4.152774896176647e-06, "loss": 0.0021, "step": 22730 }, { "epoch": 4.63, "learning_rate": 4.14824624429953e-06, "loss": 0.0006, "step": 22731 }, { "epoch": 4.63, "learning_rate": 4.143720028421982e-06, "loss": 0.0013, "step": 22732 }, { "epoch": 4.63, "learning_rate": 4.139196248619658e-06, "loss": 0.0002, "step": 22733 }, { "epoch": 4.63, "learning_rate": 4.1346749049680824e-06, "loss": 0.0003, "step": 22734 }, { "epoch": 4.63, "learning_rate": 4.130155997542761e-06, "loss": 0.0027, "step": 22735 }, { "epoch": 4.63, "learning_rate": 4.1256395264191995e-06, "loss": 0.0032, "step": 22736 }, { "epoch": 4.63, "learning_rate": 4.121125491672789e-06, "loss": 0.0004, "step": 22737 }, { "epoch": 4.63, "learning_rate": 4.116613893378984e-06, "loss": 0.0029, "step": 22738 }, { "epoch": 4.63, "learning_rate": 4.112104731613092e-06, "loss": 0.0027, "step": 22739 }, { "epoch": 4.63, "learning_rate": 4.107598006450419e-06, "loss": 0.0091, "step": 22740 }, { "epoch": 4.63, "learning_rate": 4.103093717966255e-06, "loss": 0.0003, "step": 22741 }, { "epoch": 4.63, "learning_rate": 4.098591866235856e-06, "loss": 0.0005, "step": 22742 }, { "epoch": 4.63, "learning_rate": 4.09409245133433e-06, "loss": 0.0017, "step": 22743 }, { "epoch": 4.63, "learning_rate": 4.089595473336899e-06, "loss": 0.0001, "step": 22744 }, { "epoch": 4.63, "learning_rate": 4.085100932318653e-06, "loss": 0.0031, "step": 22745 }, { "epoch": 4.63, "learning_rate": 4.080608828354664e-06, "loss": 0.0001, "step": 22746 }, { "epoch": 4.63, "learning_rate": 4.076119161519958e-06, "loss": 0.0001, "step": 22747 }, { "epoch": 4.63, "learning_rate": 4.071631931889474e-06, "loss": 0.0009, "step": 22748 }, { "epoch": 4.63, "learning_rate": 4.067147139538235e-06, "loss": 0.0062, "step": 22749 }, { "epoch": 4.63, "learning_rate": 4.0626647845410646e-06, "loss": 0.0008, "step": 22750 }, { "epoch": 4.63, "learning_rate": 4.058184866972919e-06, "loss": 0.0007, "step": 22751 }, { "epoch": 4.63, "learning_rate": 4.053707386908539e-06, "loss": 0.0002, "step": 22752 }, { "epoch": 4.63, "learning_rate": 4.049232344422748e-06, "loss": 0.0032, "step": 22753 }, { "epoch": 4.63, "learning_rate": 4.04475973959027e-06, "loss": 0.0009, "step": 22754 }, { "epoch": 4.63, "learning_rate": 4.040289572485811e-06, "loss": 0.0046, "step": 22755 }, { "epoch": 4.63, "learning_rate": 4.035821843184045e-06, "loss": 0.0002, "step": 22756 }, { "epoch": 4.63, "learning_rate": 4.031356551759579e-06, "loss": 0.0081, "step": 22757 }, { "epoch": 4.63, "learning_rate": 4.026893698287004e-06, "loss": 0.0017, "step": 22758 }, { "epoch": 4.63, "learning_rate": 4.022433282840826e-06, "loss": 0.0002, "step": 22759 }, { "epoch": 4.63, "learning_rate": 4.0179753054955854e-06, "loss": 0.006, "step": 22760 }, { "epoch": 4.63, "learning_rate": 4.013519766325707e-06, "loss": 0.0027, "step": 22761 }, { "epoch": 4.63, "learning_rate": 4.0090666654056305e-06, "loss": 0.0003, "step": 22762 }, { "epoch": 4.63, "learning_rate": 4.0046160028096966e-06, "loss": 0.0022, "step": 22763 }, { "epoch": 4.64, "learning_rate": 4.000167778612279e-06, "loss": 0.0027, "step": 22764 }, { "epoch": 4.64, "learning_rate": 3.9957219928876514e-06, "loss": 0.0002, "step": 22765 }, { "epoch": 4.64, "learning_rate": 3.991278645710056e-06, "loss": 0.0032, "step": 22766 }, { "epoch": 4.64, "learning_rate": 3.986837737153731e-06, "loss": 0.0042, "step": 22767 }, { "epoch": 4.64, "learning_rate": 3.982399267292819e-06, "loss": 0.007, "step": 22768 }, { "epoch": 4.64, "learning_rate": 3.977963236201492e-06, "loss": 0.0017, "step": 22769 }, { "epoch": 4.64, "learning_rate": 3.973529643953793e-06, "loss": 0.0002, "step": 22770 }, { "epoch": 4.64, "learning_rate": 3.969098490623812e-06, "loss": 0.001, "step": 22771 }, { "epoch": 4.64, "learning_rate": 3.964669776285523e-06, "loss": 0.0013, "step": 22772 }, { "epoch": 4.64, "learning_rate": 3.960243501012916e-06, "loss": 0.0031, "step": 22773 }, { "epoch": 4.64, "learning_rate": 3.955819664879917e-06, "loss": 0.0001, "step": 22774 }, { "epoch": 4.64, "learning_rate": 3.951398267960399e-06, "loss": 0.0014, "step": 22775 }, { "epoch": 4.64, "learning_rate": 3.946979310328219e-06, "loss": 0.0066, "step": 22776 }, { "epoch": 4.64, "learning_rate": 3.942562792057186e-06, "loss": 0.0019, "step": 22777 }, { "epoch": 4.64, "learning_rate": 3.93814871322104e-06, "loss": 0.0012, "step": 22778 }, { "epoch": 4.64, "learning_rate": 3.9337370738935395e-06, "loss": 0.0009, "step": 22779 }, { "epoch": 4.64, "learning_rate": 3.929327874148358e-06, "loss": 0.0011, "step": 22780 }, { "epoch": 4.64, "learning_rate": 3.924921114059088e-06, "loss": 0.0012, "step": 22781 }, { "epoch": 4.64, "learning_rate": 3.920516793699418e-06, "loss": 0.0001, "step": 22782 }, { "epoch": 4.64, "learning_rate": 3.916114913142826e-06, "loss": 0.0101, "step": 22783 }, { "epoch": 4.64, "learning_rate": 3.9117154724629005e-06, "loss": 0.0003, "step": 22784 }, { "epoch": 4.64, "learning_rate": 3.907318471733068e-06, "loss": 0.0002, "step": 22785 }, { "epoch": 4.64, "learning_rate": 3.902923911026784e-06, "loss": 0.0012, "step": 22786 }, { "epoch": 4.64, "learning_rate": 3.898531790417459e-06, "loss": 0.0015, "step": 22787 }, { "epoch": 4.64, "learning_rate": 3.894142109978432e-06, "loss": 0.004, "step": 22788 }, { "epoch": 4.64, "learning_rate": 3.8897548697830295e-06, "loss": 0.0005, "step": 22789 }, { "epoch": 4.64, "learning_rate": 3.885370069904525e-06, "loss": 0.0004, "step": 22790 }, { "epoch": 4.64, "learning_rate": 3.880987710416145e-06, "loss": 0.0033, "step": 22791 }, { "epoch": 4.64, "learning_rate": 3.876607791391096e-06, "loss": 0.0003, "step": 22792 }, { "epoch": 4.64, "learning_rate": 3.8722303129025354e-06, "loss": 0.0003, "step": 22793 }, { "epoch": 4.64, "learning_rate": 3.867855275023523e-06, "loss": 0.0015, "step": 22794 }, { "epoch": 4.64, "learning_rate": 3.8634826778272176e-06, "loss": 0.0005, "step": 22795 }, { "epoch": 4.64, "learning_rate": 3.859112521386576e-06, "loss": 0.0003, "step": 22796 }, { "epoch": 4.64, "learning_rate": 3.85474480577464e-06, "loss": 0.0082, "step": 22797 }, { "epoch": 4.64, "learning_rate": 3.850379531064319e-06, "loss": 0.0001, "step": 22798 }, { "epoch": 4.64, "learning_rate": 3.846016697328519e-06, "loss": 0.0002, "step": 22799 }, { "epoch": 4.64, "learning_rate": 3.84165630464015e-06, "loss": 0.002, "step": 22800 }, { "epoch": 4.64, "learning_rate": 3.837298353071988e-06, "loss": 0.0026, "step": 22801 }, { "epoch": 4.64, "learning_rate": 3.83294284269689e-06, "loss": 0.0012, "step": 22802 }, { "epoch": 4.64, "learning_rate": 3.828589773587515e-06, "loss": 0.0002, "step": 22803 }, { "epoch": 4.64, "learning_rate": 3.824239145816638e-06, "loss": 0.0009, "step": 22804 }, { "epoch": 4.64, "learning_rate": 3.819890959456867e-06, "loss": 0.001, "step": 22805 }, { "epoch": 4.64, "learning_rate": 3.815545214580862e-06, "loss": 0.0032, "step": 22806 }, { "epoch": 4.64, "learning_rate": 3.811201911261197e-06, "loss": 0.0006, "step": 22807 }, { "epoch": 4.64, "learning_rate": 3.8068610495704144e-06, "loss": 0.0035, "step": 22808 }, { "epoch": 4.64, "learning_rate": 3.8025226295810064e-06, "loss": 0.0016, "step": 22809 }, { "epoch": 4.64, "learning_rate": 3.798186651365448e-06, "loss": 0.001, "step": 22810 }, { "epoch": 4.64, "learning_rate": 3.7938531149961317e-06, "loss": 0.0009, "step": 22811 }, { "epoch": 4.64, "learning_rate": 3.7895220205454656e-06, "loss": 0.0048, "step": 22812 }, { "epoch": 4.65, "learning_rate": 3.785193368085776e-06, "loss": 0.0006, "step": 22813 }, { "epoch": 4.65, "learning_rate": 3.7808671576893377e-06, "loss": 0.0003, "step": 22814 }, { "epoch": 4.65, "learning_rate": 3.7765433894284436e-06, "loss": 0.0041, "step": 22815 }, { "epoch": 4.65, "learning_rate": 3.7722220633752853e-06, "loss": 0.0002, "step": 22816 }, { "epoch": 4.65, "learning_rate": 3.7679031796020386e-06, "loss": 0.0008, "step": 22817 }, { "epoch": 4.65, "learning_rate": 3.763586738180846e-06, "loss": 0.0021, "step": 22818 }, { "epoch": 4.65, "learning_rate": 3.7592727391837994e-06, "loss": 0.0004, "step": 22819 }, { "epoch": 4.65, "learning_rate": 3.754961182682942e-06, "loss": 0.0034, "step": 22820 }, { "epoch": 4.65, "learning_rate": 3.7506520687502985e-06, "loss": 0.0021, "step": 22821 }, { "epoch": 4.65, "learning_rate": 3.746345397457812e-06, "loss": 0.0001, "step": 22822 }, { "epoch": 4.65, "learning_rate": 3.742041168877441e-06, "loss": 0.0002, "step": 22823 }, { "epoch": 4.65, "learning_rate": 3.737739383081062e-06, "loss": 0.0002, "step": 22824 }, { "epoch": 4.65, "learning_rate": 3.733440040140534e-06, "loss": 0.0049, "step": 22825 }, { "epoch": 4.65, "learning_rate": 3.7291431401276663e-06, "loss": 0.0004, "step": 22826 }, { "epoch": 4.65, "learning_rate": 3.7248486831141678e-06, "loss": 0.0001, "step": 22827 }, { "epoch": 4.65, "learning_rate": 3.720556669171848e-06, "loss": 0.0037, "step": 22828 }, { "epoch": 4.65, "learning_rate": 3.716267098372333e-06, "loss": 0.0016, "step": 22829 }, { "epoch": 4.65, "learning_rate": 3.7119799707872987e-06, "loss": 0.0029, "step": 22830 }, { "epoch": 4.65, "learning_rate": 3.707695286488355e-06, "loss": 0.0001, "step": 22831 }, { "epoch": 4.65, "learning_rate": 3.7034130455470103e-06, "loss": 0.0007, "step": 22832 }, { "epoch": 4.65, "learning_rate": 3.6991332480348577e-06, "loss": 0.0037, "step": 22833 }, { "epoch": 4.65, "learning_rate": 3.6948558940233077e-06, "loss": 0.0005, "step": 22834 }, { "epoch": 4.65, "learning_rate": 3.6905809835838683e-06, "loss": 0.0003, "step": 22835 }, { "epoch": 4.65, "learning_rate": 3.6863085167878835e-06, "loss": 0.0012, "step": 22836 }, { "epoch": 4.65, "learning_rate": 3.682038493706746e-06, "loss": 0.001, "step": 22837 }, { "epoch": 4.65, "learning_rate": 3.6777709144117486e-06, "loss": 0.0003, "step": 22838 }, { "epoch": 4.65, "learning_rate": 3.673505778974184e-06, "loss": 0.0004, "step": 22839 }, { "epoch": 4.65, "learning_rate": 3.669243087465279e-06, "loss": 0.0001, "step": 22840 }, { "epoch": 4.65, "learning_rate": 3.664982839956243e-06, "loss": 0.0024, "step": 22841 }, { "epoch": 4.65, "learning_rate": 3.6607250365182196e-06, "loss": 0.0001, "step": 22842 }, { "epoch": 4.65, "learning_rate": 3.656469677222318e-06, "loss": 0.0019, "step": 22843 }, { "epoch": 4.65, "learning_rate": 3.6522167621396147e-06, "loss": 0.0002, "step": 22844 }, { "epoch": 4.65, "learning_rate": 3.647966291341137e-06, "loss": 0.0042, "step": 22845 }, { "epoch": 4.65, "learning_rate": 3.64371826489791e-06, "loss": 0.0002, "step": 22846 }, { "epoch": 4.65, "learning_rate": 3.639472682880812e-06, "loss": 0.0009, "step": 22847 }, { "epoch": 4.65, "learning_rate": 3.635229545360835e-06, "loss": 0.0013, "step": 22848 }, { "epoch": 4.65, "learning_rate": 3.6309888524087894e-06, "loss": 0.0037, "step": 22849 }, { "epoch": 4.65, "learning_rate": 3.6267506040955183e-06, "loss": 0.0012, "step": 22850 }, { "epoch": 4.65, "learning_rate": 3.6225148004918157e-06, "loss": 0.0008, "step": 22851 }, { "epoch": 4.65, "learning_rate": 3.618281441668408e-06, "loss": 0.0001, "step": 22852 }, { "epoch": 4.65, "learning_rate": 3.6140505276960384e-06, "loss": 0.0018, "step": 22853 }, { "epoch": 4.65, "learning_rate": 3.609822058645334e-06, "loss": 0.0008, "step": 22854 }, { "epoch": 4.65, "learning_rate": 3.6055960345869384e-06, "loss": 0.0005, "step": 22855 }, { "epoch": 4.65, "learning_rate": 3.601372455591428e-06, "loss": 0.0007, "step": 22856 }, { "epoch": 4.65, "learning_rate": 3.597151321729347e-06, "loss": 0.0027, "step": 22857 }, { "epoch": 4.65, "learning_rate": 3.592932633071188e-06, "loss": 0.002, "step": 22858 }, { "epoch": 4.65, "learning_rate": 3.5887163896874127e-06, "loss": 0.0004, "step": 22859 }, { "epoch": 4.65, "learning_rate": 3.5845025916484473e-06, "loss": 0.0008, "step": 22860 }, { "epoch": 4.65, "learning_rate": 3.5802912390246685e-06, "loss": 0.0002, "step": 22861 }, { "epoch": 4.66, "learning_rate": 3.5760823318864373e-06, "loss": 0.0078, "step": 22862 }, { "epoch": 4.66, "learning_rate": 3.5718758703039806e-06, "loss": 0.0001, "step": 22863 }, { "epoch": 4.66, "learning_rate": 3.567671854347642e-06, "loss": 0.0004, "step": 22864 }, { "epoch": 4.66, "learning_rate": 3.5634702840875494e-06, "loss": 0.0038, "step": 22865 }, { "epoch": 4.66, "learning_rate": 3.559271159593963e-06, "loss": 0.006, "step": 22866 }, { "epoch": 4.66, "learning_rate": 3.5550744809369593e-06, "loss": 0.0004, "step": 22867 }, { "epoch": 4.66, "learning_rate": 3.5508802481866493e-06, "loss": 0.0004, "step": 22868 }, { "epoch": 4.66, "learning_rate": 3.5466884614130775e-06, "loss": 0.0019, "step": 22869 }, { "epoch": 4.66, "learning_rate": 3.542499120686254e-06, "loss": 0.0002, "step": 22870 }, { "epoch": 4.66, "learning_rate": 3.5383122260761565e-06, "loss": 0.0001, "step": 22871 }, { "epoch": 4.66, "learning_rate": 3.534127777652712e-06, "loss": 0.0003, "step": 22872 }, { "epoch": 4.66, "learning_rate": 3.5299457754858153e-06, "loss": 0.0003, "step": 22873 }, { "epoch": 4.66, "learning_rate": 3.5257662196452927e-06, "loss": 0.0001, "step": 22874 }, { "epoch": 4.66, "learning_rate": 3.521589110200973e-06, "loss": 0.0021, "step": 22875 }, { "epoch": 4.66, "learning_rate": 3.5174144472225994e-06, "loss": 0.0005, "step": 22876 }, { "epoch": 4.66, "learning_rate": 3.5132422307799333e-06, "loss": 0.0002, "step": 22877 }, { "epoch": 4.66, "learning_rate": 3.509072460942619e-06, "loss": 0.0002, "step": 22878 }, { "epoch": 4.66, "learning_rate": 3.5049051377803338e-06, "loss": 0.0002, "step": 22879 }, { "epoch": 4.66, "learning_rate": 3.5007402613626225e-06, "loss": 0.0002, "step": 22880 }, { "epoch": 4.66, "learning_rate": 3.496577831759112e-06, "loss": 0.0003, "step": 22881 }, { "epoch": 4.66, "learning_rate": 3.492417849039314e-06, "loss": 0.0011, "step": 22882 }, { "epoch": 4.66, "learning_rate": 3.488260313272656e-06, "loss": 0.0002, "step": 22883 }, { "epoch": 4.66, "learning_rate": 3.4841052245286325e-06, "loss": 0.0013, "step": 22884 }, { "epoch": 4.66, "learning_rate": 3.479952582876605e-06, "loss": 0.0113, "step": 22885 }, { "epoch": 4.66, "learning_rate": 3.4758023883859675e-06, "loss": 0.0001, "step": 22886 }, { "epoch": 4.66, "learning_rate": 3.471654641125998e-06, "loss": 0.0021, "step": 22887 }, { "epoch": 4.66, "learning_rate": 3.4675093411659915e-06, "loss": 0.0005, "step": 22888 }, { "epoch": 4.66, "learning_rate": 3.4633664885751753e-06, "loss": 0.0001, "step": 22889 }, { "epoch": 4.66, "learning_rate": 3.459226083422745e-06, "loss": 0.0019, "step": 22890 }, { "epoch": 4.66, "learning_rate": 3.4550881257778606e-06, "loss": 0.0028, "step": 22891 }, { "epoch": 4.66, "learning_rate": 3.4509526157096347e-06, "loss": 0.0009, "step": 22892 }, { "epoch": 4.66, "learning_rate": 3.4468195532871114e-06, "loss": 0.0015, "step": 22893 }, { "epoch": 4.66, "learning_rate": 3.4426889385793523e-06, "loss": 0.0018, "step": 22894 }, { "epoch": 4.66, "learning_rate": 3.438560771655352e-06, "loss": 0.0031, "step": 22895 }, { "epoch": 4.66, "learning_rate": 3.4344350525840057e-06, "loss": 0.0006, "step": 22896 }, { "epoch": 4.66, "learning_rate": 3.430311781434292e-06, "loss": 0.0002, "step": 22897 }, { "epoch": 4.66, "learning_rate": 3.426190958275005e-06, "loss": 0.0005, "step": 22898 }, { "epoch": 4.66, "learning_rate": 3.4220725831750393e-06, "loss": 0.0001, "step": 22899 }, { "epoch": 4.66, "learning_rate": 3.4179566562031245e-06, "loss": 0.0002, "step": 22900 }, { "epoch": 4.66, "learning_rate": 3.4138431774280384e-06, "loss": 0.0009, "step": 22901 }, { "epoch": 4.66, "learning_rate": 3.409732146918459e-06, "loss": 0.0002, "step": 22902 }, { "epoch": 4.66, "learning_rate": 3.405623564743065e-06, "loss": 0.0002, "step": 22903 }, { "epoch": 4.66, "learning_rate": 3.4015174309704853e-06, "loss": 0.0036, "step": 22904 }, { "epoch": 4.66, "learning_rate": 3.3974137456692806e-06, "loss": 0.0006, "step": 22905 }, { "epoch": 4.66, "learning_rate": 3.393312508907997e-06, "loss": 0.0008, "step": 22906 }, { "epoch": 4.66, "learning_rate": 3.3892137207551463e-06, "loss": 0.0017, "step": 22907 }, { "epoch": 4.66, "learning_rate": 3.3851173812791565e-06, "loss": 0.0035, "step": 22908 }, { "epoch": 4.66, "learning_rate": 3.3810234905484735e-06, "loss": 0.0002, "step": 22909 }, { "epoch": 4.66, "learning_rate": 3.3769320486314754e-06, "loss": 0.0007, "step": 22910 }, { "epoch": 4.67, "learning_rate": 3.3728430555964414e-06, "loss": 0.0035, "step": 22911 }, { "epoch": 4.67, "learning_rate": 3.3687565115117334e-06, "loss": 0.0025, "step": 22912 }, { "epoch": 4.67, "learning_rate": 3.3646724164455796e-06, "loss": 0.0001, "step": 22913 }, { "epoch": 4.67, "learning_rate": 3.3605907704661763e-06, "loss": 0.0028, "step": 22914 }, { "epoch": 4.67, "learning_rate": 3.3565115736417345e-06, "loss": 0.0002, "step": 22915 }, { "epoch": 4.67, "learning_rate": 3.3524348260403177e-06, "loss": 0.0003, "step": 22916 }, { "epoch": 4.67, "learning_rate": 3.348360527730104e-06, "loss": 0.0003, "step": 22917 }, { "epoch": 4.67, "learning_rate": 3.3442886787790722e-06, "loss": 0.0021, "step": 22918 }, { "epoch": 4.67, "learning_rate": 3.3402192792552516e-06, "loss": 0.0045, "step": 22919 }, { "epoch": 4.67, "learning_rate": 3.3361523292266047e-06, "loss": 0.0012, "step": 22920 }, { "epoch": 4.67, "learning_rate": 3.3320878287610597e-06, "loss": 0.0004, "step": 22921 }, { "epoch": 4.67, "learning_rate": 3.328025777926513e-06, "loss": 0.0018, "step": 22922 }, { "epoch": 4.67, "learning_rate": 3.3239661767907764e-06, "loss": 0.0003, "step": 22923 }, { "epoch": 4.67, "learning_rate": 3.3199090254216964e-06, "loss": 0.0003, "step": 22924 }, { "epoch": 4.67, "learning_rate": 3.3158543238870183e-06, "loss": 0.0001, "step": 22925 }, { "epoch": 4.67, "learning_rate": 3.311802072254438e-06, "loss": 0.0009, "step": 22926 }, { "epoch": 4.67, "learning_rate": 3.307752270591668e-06, "loss": 0.0001, "step": 22927 }, { "epoch": 4.67, "learning_rate": 3.3037049189663546e-06, "loss": 0.0012, "step": 22928 }, { "epoch": 4.67, "learning_rate": 3.299660017446043e-06, "loss": 0.0031, "step": 22929 }, { "epoch": 4.67, "learning_rate": 3.2956175660983632e-06, "loss": 0.0001, "step": 22930 }, { "epoch": 4.67, "learning_rate": 3.2915775649907604e-06, "loss": 0.0048, "step": 22931 }, { "epoch": 4.67, "learning_rate": 3.287540014190765e-06, "loss": 0.0042, "step": 22932 }, { "epoch": 4.67, "learning_rate": 3.283504913765789e-06, "loss": 0.0043, "step": 22933 }, { "epoch": 4.67, "learning_rate": 3.2794722637832115e-06, "loss": 0.0027, "step": 22934 }, { "epoch": 4.67, "learning_rate": 3.2754420643104297e-06, "loss": 0.0002, "step": 22935 }, { "epoch": 4.67, "learning_rate": 3.2714143154147053e-06, "loss": 0.0006, "step": 22936 }, { "epoch": 4.67, "learning_rate": 3.2673890171633356e-06, "loss": 0.0048, "step": 22937 }, { "epoch": 4.67, "learning_rate": 3.263366169623549e-06, "loss": 0.0028, "step": 22938 }, { "epoch": 4.67, "learning_rate": 3.259345772862526e-06, "loss": 0.0001, "step": 22939 }, { "epoch": 4.67, "learning_rate": 3.255327826947429e-06, "loss": 0.0008, "step": 22940 }, { "epoch": 4.67, "learning_rate": 3.251312331945355e-06, "loss": 0.009, "step": 22941 }, { "epoch": 4.67, "learning_rate": 3.2472992879233827e-06, "loss": 0.0026, "step": 22942 }, { "epoch": 4.67, "learning_rate": 3.2432886949485094e-06, "loss": 0.0015, "step": 22943 }, { "epoch": 4.67, "learning_rate": 3.2392805530877477e-06, "loss": 0.001, "step": 22944 }, { "epoch": 4.67, "learning_rate": 3.235274862408027e-06, "loss": 0.0001, "step": 22945 }, { "epoch": 4.67, "learning_rate": 3.231271622976278e-06, "loss": 0.0042, "step": 22946 }, { "epoch": 4.67, "learning_rate": 3.227270834859297e-06, "loss": 0.0009, "step": 22947 }, { "epoch": 4.67, "learning_rate": 3.22327249812398e-06, "loss": 0.0001, "step": 22948 }, { "epoch": 4.67, "learning_rate": 3.219276612837057e-06, "loss": 0.0005, "step": 22949 }, { "epoch": 4.67, "learning_rate": 3.2152831790652923e-06, "loss": 0.0001, "step": 22950 }, { "epoch": 4.67, "learning_rate": 3.2112921968753646e-06, "loss": 0.0012, "step": 22951 }, { "epoch": 4.67, "learning_rate": 3.207303666333938e-06, "loss": 0.0001, "step": 22952 }, { "epoch": 4.67, "learning_rate": 3.2033175875076424e-06, "loss": 0.0003, "step": 22953 }, { "epoch": 4.67, "learning_rate": 3.1993339604630407e-06, "loss": 0.0014, "step": 22954 }, { "epoch": 4.67, "learning_rate": 3.195352785266664e-06, "loss": 0.003, "step": 22955 }, { "epoch": 4.67, "learning_rate": 3.191374061985008e-06, "loss": 0.0068, "step": 22956 }, { "epoch": 4.67, "learning_rate": 3.1873977906845204e-06, "loss": 0.0024, "step": 22957 }, { "epoch": 4.67, "learning_rate": 3.183423971431631e-06, "loss": 0.0003, "step": 22958 }, { "epoch": 4.67, "learning_rate": 3.179452604292687e-06, "loss": 0.0007, "step": 22959 }, { "epoch": 4.68, "learning_rate": 3.1754836893340185e-06, "loss": 0.0047, "step": 22960 }, { "epoch": 4.68, "learning_rate": 3.1715172266219556e-06, "loss": 0.004, "step": 22961 }, { "epoch": 4.68, "learning_rate": 3.167553216222679e-06, "loss": 0.0001, "step": 22962 }, { "epoch": 4.68, "learning_rate": 3.1635916582024524e-06, "loss": 0.0014, "step": 22963 }, { "epoch": 4.68, "learning_rate": 3.1596325526274224e-06, "loss": 0.0021, "step": 22964 }, { "epoch": 4.68, "learning_rate": 3.15567589956367e-06, "loss": 0.0027, "step": 22965 }, { "epoch": 4.68, "learning_rate": 3.1517216990773585e-06, "loss": 0.0027, "step": 22966 }, { "epoch": 4.68, "learning_rate": 3.147769951234469e-06, "loss": 0.0015, "step": 22967 }, { "epoch": 4.68, "learning_rate": 3.1438206561010483e-06, "loss": 0.0005, "step": 22968 }, { "epoch": 4.68, "learning_rate": 3.139873813743027e-06, "loss": 0.0003, "step": 22969 }, { "epoch": 4.68, "learning_rate": 3.135929424226319e-06, "loss": 0.0035, "step": 22970 }, { "epoch": 4.68, "learning_rate": 3.1319874876168215e-06, "loss": 0.0013, "step": 22971 }, { "epoch": 4.68, "learning_rate": 3.128048003980349e-06, "loss": 0.0002, "step": 22972 }, { "epoch": 4.68, "learning_rate": 3.124110973382732e-06, "loss": 0.0002, "step": 22973 }, { "epoch": 4.68, "learning_rate": 3.1201763958897173e-06, "loss": 0.0003, "step": 22974 }, { "epoch": 4.68, "learning_rate": 3.1162442715669866e-06, "loss": 0.001, "step": 22975 }, { "epoch": 4.68, "learning_rate": 3.1123146004802536e-06, "loss": 0.0001, "step": 22976 }, { "epoch": 4.68, "learning_rate": 3.108387382695149e-06, "loss": 0.0022, "step": 22977 }, { "epoch": 4.68, "learning_rate": 3.104462618277237e-06, "loss": 0.0029, "step": 22978 }, { "epoch": 4.68, "learning_rate": 3.100540307292099e-06, "loss": 0.0001, "step": 22979 }, { "epoch": 4.68, "learning_rate": 3.096620449805215e-06, "loss": 0.0007, "step": 22980 }, { "epoch": 4.68, "learning_rate": 3.0927030458820836e-06, "loss": 0.001, "step": 22981 }, { "epoch": 4.68, "learning_rate": 3.088788095588102e-06, "loss": 0.0014, "step": 22982 }, { "epoch": 4.68, "learning_rate": 3.084875598988684e-06, "loss": 0.0019, "step": 22983 }, { "epoch": 4.68, "learning_rate": 3.080965556149162e-06, "loss": 0.0006, "step": 22984 }, { "epoch": 4.68, "learning_rate": 3.0770579671348496e-06, "loss": 0.0002, "step": 22985 }, { "epoch": 4.68, "learning_rate": 3.0731528320109946e-06, "loss": 0.0009, "step": 22986 }, { "epoch": 4.68, "learning_rate": 3.0692501508428446e-06, "loss": 0.0017, "step": 22987 }, { "epoch": 4.68, "learning_rate": 3.065349923695565e-06, "loss": 0.0002, "step": 22988 }, { "epoch": 4.68, "learning_rate": 3.061452150634286e-06, "loss": 0.0054, "step": 22989 }, { "epoch": 4.68, "learning_rate": 3.0575568317241394e-06, "loss": 0.0051, "step": 22990 }, { "epoch": 4.68, "learning_rate": 3.0536639670301564e-06, "loss": 0.0006, "step": 22991 }, { "epoch": 4.68, "learning_rate": 3.049773556617385e-06, "loss": 0.0048, "step": 22992 }, { "epoch": 4.68, "learning_rate": 3.045885600550757e-06, "loss": 0.0, "step": 22993 }, { "epoch": 4.68, "learning_rate": 3.0420000988952532e-06, "loss": 0.0019, "step": 22994 }, { "epoch": 4.68, "learning_rate": 3.038117051715738e-06, "loss": 0.0052, "step": 22995 }, { "epoch": 4.68, "learning_rate": 3.0342364590770774e-06, "loss": 0.0004, "step": 22996 }, { "epoch": 4.68, "learning_rate": 3.0303583210441183e-06, "loss": 0.0036, "step": 22997 }, { "epoch": 4.68, "learning_rate": 3.0264826376815597e-06, "loss": 0.0022, "step": 22998 }, { "epoch": 4.68, "learning_rate": 3.0226094090541997e-06, "loss": 0.0005, "step": 22999 }, { "epoch": 4.68, "learning_rate": 3.0187386352266695e-06, "loss": 0.0042, "step": 23000 }, { "epoch": 4.68, "learning_rate": 3.0148703162636844e-06, "loss": 0.0001, "step": 23001 }, { "epoch": 4.68, "learning_rate": 3.0110044522298095e-06, "loss": 0.0041, "step": 23002 }, { "epoch": 4.68, "learning_rate": 3.007141043189626e-06, "loss": 0.0028, "step": 23003 }, { "epoch": 4.68, "learning_rate": 3.003280089207649e-06, "loss": 0.0017, "step": 23004 }, { "epoch": 4.68, "learning_rate": 2.999421590348361e-06, "loss": 0.0013, "step": 23005 }, { "epoch": 4.68, "learning_rate": 2.995565546676226e-06, "loss": 0.0003, "step": 23006 }, { "epoch": 4.68, "learning_rate": 2.9917119582556435e-06, "loss": 0.0007, "step": 23007 }, { "epoch": 4.68, "learning_rate": 2.9878608251509615e-06, "loss": 0.0006, "step": 23008 }, { "epoch": 4.69, "learning_rate": 2.9840121474265123e-06, "loss": 0.0001, "step": 23009 }, { "epoch": 4.69, "learning_rate": 2.980165925146577e-06, "loss": 0.0006, "step": 23010 }, { "epoch": 4.69, "learning_rate": 2.9763221583753714e-06, "loss": 0.004, "step": 23011 }, { "epoch": 4.69, "learning_rate": 2.9724808471771277e-06, "loss": 0.0001, "step": 23012 }, { "epoch": 4.69, "learning_rate": 2.9686419916159774e-06, "loss": 0.0005, "step": 23013 }, { "epoch": 4.69, "learning_rate": 2.9648055917560697e-06, "loss": 0.0001, "step": 23014 }, { "epoch": 4.69, "learning_rate": 2.9609716476614365e-06, "loss": 0.0015, "step": 23015 }, { "epoch": 4.69, "learning_rate": 2.957140159396143e-06, "loss": 0.0043, "step": 23016 }, { "epoch": 4.69, "learning_rate": 2.953311127024155e-06, "loss": 0.0006, "step": 23017 }, { "epoch": 4.69, "learning_rate": 2.9494845506094376e-06, "loss": 0.0001, "step": 23018 }, { "epoch": 4.69, "learning_rate": 2.9456604302159403e-06, "loss": 0.0029, "step": 23019 }, { "epoch": 4.69, "learning_rate": 2.9418387659074783e-06, "loss": 0.0024, "step": 23020 }, { "epoch": 4.69, "learning_rate": 2.9380195577479006e-06, "loss": 0.0009, "step": 23021 }, { "epoch": 4.69, "learning_rate": 2.934202805800989e-06, "loss": 0.0007, "step": 23022 }, { "epoch": 4.69, "learning_rate": 2.9303885101305104e-06, "loss": 0.0001, "step": 23023 }, { "epoch": 4.69, "learning_rate": 2.926576670800146e-06, "loss": 0.0001, "step": 23024 }, { "epoch": 4.69, "learning_rate": 2.9227672878735788e-06, "loss": 0.0002, "step": 23025 }, { "epoch": 4.69, "learning_rate": 2.918960361414424e-06, "loss": 0.0006, "step": 23026 }, { "epoch": 4.69, "learning_rate": 2.915155891486265e-06, "loss": 0.0013, "step": 23027 }, { "epoch": 4.69, "learning_rate": 2.91135387815265e-06, "loss": 0.0007, "step": 23028 }, { "epoch": 4.69, "learning_rate": 2.907554321477079e-06, "loss": 0.0028, "step": 23029 }, { "epoch": 4.69, "learning_rate": 2.903757221523001e-06, "loss": 0.0013, "step": 23030 }, { "epoch": 4.69, "learning_rate": 2.8999625783538317e-06, "loss": 0.0105, "step": 23031 }, { "epoch": 4.69, "learning_rate": 2.8961703920329704e-06, "loss": 0.0031, "step": 23032 }, { "epoch": 4.69, "learning_rate": 2.8923806626237334e-06, "loss": 0.002, "step": 23033 }, { "epoch": 4.69, "learning_rate": 2.8885933901894365e-06, "loss": 0.0029, "step": 23034 }, { "epoch": 4.69, "learning_rate": 2.8848085747933127e-06, "loss": 0.0065, "step": 23035 }, { "epoch": 4.69, "learning_rate": 2.8810262164985943e-06, "loss": 0.0003, "step": 23036 }, { "epoch": 4.69, "learning_rate": 2.877246315368431e-06, "loss": 0.0011, "step": 23037 }, { "epoch": 4.69, "learning_rate": 2.873468871465989e-06, "loss": 0.0005, "step": 23038 }, { "epoch": 4.69, "learning_rate": 2.8696938848543184e-06, "loss": 0.0004, "step": 23039 }, { "epoch": 4.69, "learning_rate": 2.8659213555964844e-06, "loss": 0.0008, "step": 23040 }, { "epoch": 4.69, "learning_rate": 2.8621512837555207e-06, "loss": 0.0063, "step": 23041 }, { "epoch": 4.69, "learning_rate": 2.8583836693943595e-06, "loss": 0.0, "step": 23042 }, { "epoch": 4.69, "learning_rate": 2.8546185125759515e-06, "loss": 0.0004, "step": 23043 }, { "epoch": 4.69, "learning_rate": 2.8508558133631453e-06, "loss": 0.0025, "step": 23044 }, { "epoch": 4.69, "learning_rate": 2.8470955718188415e-06, "loss": 0.0013, "step": 23045 }, { "epoch": 4.69, "learning_rate": 2.8433377880057893e-06, "loss": 0.0036, "step": 23046 }, { "epoch": 4.69, "learning_rate": 2.8395824619867723e-06, "loss": 0.0001, "step": 23047 }, { "epoch": 4.69, "learning_rate": 2.83582959382454e-06, "loss": 0.0045, "step": 23048 }, { "epoch": 4.69, "learning_rate": 2.832079183581709e-06, "loss": 0.0001, "step": 23049 }, { "epoch": 4.69, "learning_rate": 2.828331231320996e-06, "loss": 0.0001, "step": 23050 }, { "epoch": 4.69, "learning_rate": 2.8245857371049176e-06, "loss": 0.0022, "step": 23051 }, { "epoch": 4.69, "learning_rate": 2.8208427009961066e-06, "loss": 0.001, "step": 23052 }, { "epoch": 4.69, "learning_rate": 2.8171021230570136e-06, "loss": 0.0034, "step": 23053 }, { "epoch": 4.69, "learning_rate": 2.813364003350155e-06, "loss": 0.0003, "step": 23054 }, { "epoch": 4.69, "learning_rate": 2.8096283419379475e-06, "loss": 0.004, "step": 23055 }, { "epoch": 4.69, "learning_rate": 2.805895138882791e-06, "loss": 0.0002, "step": 23056 }, { "epoch": 4.69, "learning_rate": 2.802164394247036e-06, "loss": 0.0005, "step": 23057 }, { "epoch": 4.7, "learning_rate": 2.7984361080929994e-06, "loss": 0.0026, "step": 23058 }, { "epoch": 4.7, "learning_rate": 2.7947102804829313e-06, "loss": 0.0081, "step": 23059 }, { "epoch": 4.7, "learning_rate": 2.790986911479065e-06, "loss": 0.0017, "step": 23060 }, { "epoch": 4.7, "learning_rate": 2.7872660011436176e-06, "loss": 0.002, "step": 23061 }, { "epoch": 4.7, "learning_rate": 2.7835475495386894e-06, "loss": 0.0004, "step": 23062 }, { "epoch": 4.7, "learning_rate": 2.7798315567264304e-06, "loss": 0.0022, "step": 23063 }, { "epoch": 4.7, "learning_rate": 2.7761180227688416e-06, "loss": 0.0026, "step": 23064 }, { "epoch": 4.7, "learning_rate": 2.772406947728023e-06, "loss": 0.0014, "step": 23065 }, { "epoch": 4.7, "learning_rate": 2.7686983316659083e-06, "loss": 0.0004, "step": 23066 }, { "epoch": 4.7, "learning_rate": 2.7649921746444646e-06, "loss": 0.0003, "step": 23067 }, { "epoch": 4.7, "learning_rate": 2.7612884767255594e-06, "loss": 0.0022, "step": 23068 }, { "epoch": 4.7, "learning_rate": 2.757587237971076e-06, "loss": 0.0001, "step": 23069 }, { "epoch": 4.7, "learning_rate": 2.7538884584428156e-06, "loss": 0.0007, "step": 23070 }, { "epoch": 4.7, "learning_rate": 2.750192138202578e-06, "loss": 0.0003, "step": 23071 }, { "epoch": 4.7, "learning_rate": 2.7464982773120646e-06, "loss": 0.0001, "step": 23072 }, { "epoch": 4.7, "learning_rate": 2.742806875833009e-06, "loss": 0.0013, "step": 23073 }, { "epoch": 4.7, "learning_rate": 2.7391179338270454e-06, "loss": 0.0017, "step": 23074 }, { "epoch": 4.7, "learning_rate": 2.7354314513557906e-06, "loss": 0.0035, "step": 23075 }, { "epoch": 4.7, "learning_rate": 2.731747428480813e-06, "loss": 0.0004, "step": 23076 }, { "epoch": 4.7, "learning_rate": 2.7280658652636122e-06, "loss": 0.0001, "step": 23077 }, { "epoch": 4.7, "learning_rate": 2.72438676176574e-06, "loss": 0.0006, "step": 23078 }, { "epoch": 4.7, "learning_rate": 2.720710118048597e-06, "loss": 0.0019, "step": 23079 }, { "epoch": 4.7, "learning_rate": 2.7170359341736004e-06, "loss": 0.0001, "step": 23080 }, { "epoch": 4.7, "learning_rate": 2.7133642102021513e-06, "loss": 0.0001, "step": 23081 }, { "epoch": 4.7, "learning_rate": 2.709694946195501e-06, "loss": 0.0007, "step": 23082 }, { "epoch": 4.7, "learning_rate": 2.706028142215e-06, "loss": 0.0003, "step": 23083 }, { "epoch": 4.7, "learning_rate": 2.702363798321866e-06, "loss": 0.0002, "step": 23084 }, { "epoch": 4.7, "learning_rate": 2.6987019145773004e-06, "loss": 0.007, "step": 23085 }, { "epoch": 4.7, "learning_rate": 2.695042491042454e-06, "loss": 0.0004, "step": 23086 }, { "epoch": 4.7, "learning_rate": 2.6913855277784613e-06, "loss": 0.002, "step": 23087 }, { "epoch": 4.7, "learning_rate": 2.68773102484639e-06, "loss": 0.0018, "step": 23088 }, { "epoch": 4.7, "learning_rate": 2.6840789823072752e-06, "loss": 0.001, "step": 23089 }, { "epoch": 4.7, "learning_rate": 2.6804294002221337e-06, "loss": 0.0027, "step": 23090 }, { "epoch": 4.7, "learning_rate": 2.676782278651901e-06, "loss": 0.0021, "step": 23091 }, { "epoch": 4.7, "learning_rate": 2.6731376176574948e-06, "loss": 0.0002, "step": 23092 }, { "epoch": 4.7, "learning_rate": 2.6694954172997995e-06, "loss": 0.0004, "step": 23093 }, { "epoch": 4.7, "learning_rate": 2.6658556776396333e-06, "loss": 0.0001, "step": 23094 }, { "epoch": 4.7, "learning_rate": 2.662218398737781e-06, "loss": 0.002, "step": 23095 }, { "epoch": 4.7, "learning_rate": 2.658583580655027e-06, "loss": 0.0001, "step": 23096 }, { "epoch": 4.7, "learning_rate": 2.654951223452023e-06, "loss": 0.0019, "step": 23097 }, { "epoch": 4.7, "learning_rate": 2.6513213271894875e-06, "loss": 0.0003, "step": 23098 }, { "epoch": 4.7, "learning_rate": 2.6476938919280043e-06, "loss": 0.0006, "step": 23099 }, { "epoch": 4.7, "learning_rate": 2.6440689177281926e-06, "loss": 0.0001, "step": 23100 }, { "epoch": 4.7, "learning_rate": 2.640446404650587e-06, "loss": 0.0001, "step": 23101 }, { "epoch": 4.7, "learning_rate": 2.636826352755672e-06, "loss": 0.0003, "step": 23102 }, { "epoch": 4.7, "learning_rate": 2.63320876210395e-06, "loss": 0.0012, "step": 23103 }, { "epoch": 4.7, "learning_rate": 2.6295936327558054e-06, "loss": 0.0008, "step": 23104 }, { "epoch": 4.7, "learning_rate": 2.6259809647716236e-06, "loss": 0.0032, "step": 23105 }, { "epoch": 4.7, "learning_rate": 2.622370758211756e-06, "loss": 0.0002, "step": 23106 }, { "epoch": 4.71, "learning_rate": 2.6187630131364877e-06, "loss": 0.0003, "step": 23107 }, { "epoch": 4.71, "learning_rate": 2.615157729606071e-06, "loss": 0.0004, "step": 23108 }, { "epoch": 4.71, "learning_rate": 2.6115549076807406e-06, "loss": 0.0005, "step": 23109 }, { "epoch": 4.71, "learning_rate": 2.6079545474206487e-06, "loss": 0.005, "step": 23110 }, { "epoch": 4.71, "learning_rate": 2.6043566488859468e-06, "loss": 0.0037, "step": 23111 }, { "epoch": 4.71, "learning_rate": 2.6007612121367205e-06, "loss": 0.0023, "step": 23112 }, { "epoch": 4.71, "learning_rate": 2.597168237233005e-06, "loss": 0.0003, "step": 23113 }, { "epoch": 4.71, "learning_rate": 2.5935777242348353e-06, "loss": 0.004, "step": 23114 }, { "epoch": 4.71, "learning_rate": 2.5899896732021473e-06, "loss": 0.0021, "step": 23115 }, { "epoch": 4.71, "learning_rate": 2.58640408419491e-06, "loss": 0.0012, "step": 23116 }, { "epoch": 4.71, "learning_rate": 2.582820957272991e-06, "loss": 0.001, "step": 23117 }, { "epoch": 4.71, "learning_rate": 2.5792402924962095e-06, "loss": 0.0011, "step": 23118 }, { "epoch": 4.71, "learning_rate": 2.575662089924402e-06, "loss": 0.0046, "step": 23119 }, { "epoch": 4.71, "learning_rate": 2.5720863496173196e-06, "loss": 0.006, "step": 23120 }, { "epoch": 4.71, "learning_rate": 2.5685130716346815e-06, "loss": 0.0006, "step": 23121 }, { "epoch": 4.71, "learning_rate": 2.564942256036173e-06, "loss": 0.0005, "step": 23122 }, { "epoch": 4.71, "learning_rate": 2.561373902881447e-06, "loss": 0.0002, "step": 23123 }, { "epoch": 4.71, "learning_rate": 2.5578080122300725e-06, "loss": 0.0009, "step": 23124 }, { "epoch": 4.71, "learning_rate": 2.554244584141618e-06, "loss": 0.0033, "step": 23125 }, { "epoch": 4.71, "learning_rate": 2.550683618675603e-06, "loss": 0.0013, "step": 23126 }, { "epoch": 4.71, "learning_rate": 2.5471251158915296e-06, "loss": 0.0001, "step": 23127 }, { "epoch": 4.71, "learning_rate": 2.543569075848767e-06, "loss": 0.0002, "step": 23128 }, { "epoch": 4.71, "learning_rate": 2.5400154986067677e-06, "loss": 0.0002, "step": 23129 }, { "epoch": 4.71, "learning_rate": 2.5364643842248345e-06, "loss": 0.0052, "step": 23130 }, { "epoch": 4.71, "learning_rate": 2.5329157327623197e-06, "loss": 0.0008, "step": 23131 }, { "epoch": 4.71, "learning_rate": 2.529369544278492e-06, "loss": 0.0003, "step": 23132 }, { "epoch": 4.71, "learning_rate": 2.525825818832539e-06, "loss": 0.0039, "step": 23133 }, { "epoch": 4.71, "learning_rate": 2.522284556483678e-06, "loss": 0.0041, "step": 23134 }, { "epoch": 4.71, "learning_rate": 2.518745757291063e-06, "loss": 0.0009, "step": 23135 }, { "epoch": 4.71, "learning_rate": 2.515209421313763e-06, "loss": 0.0001, "step": 23136 }, { "epoch": 4.71, "learning_rate": 2.511675548610881e-06, "loss": 0.0215, "step": 23137 }, { "epoch": 4.71, "learning_rate": 2.5081441392414026e-06, "loss": 0.006, "step": 23138 }, { "epoch": 4.71, "learning_rate": 2.5046151932643476e-06, "loss": 0.0005, "step": 23139 }, { "epoch": 4.71, "learning_rate": 2.501088710738619e-06, "loss": 0.0008, "step": 23140 }, { "epoch": 4.71, "learning_rate": 2.497564691723136e-06, "loss": 0.0014, "step": 23141 }, { "epoch": 4.71, "learning_rate": 2.494043136276769e-06, "loss": 0.0017, "step": 23142 }, { "epoch": 4.71, "learning_rate": 2.490524044458303e-06, "loss": 0.0056, "step": 23143 }, { "epoch": 4.71, "learning_rate": 2.487007416326525e-06, "loss": 0.0002, "step": 23144 }, { "epoch": 4.71, "learning_rate": 2.483493251940205e-06, "loss": 0.0002, "step": 23145 }, { "epoch": 4.71, "learning_rate": 2.4799815513579625e-06, "loss": 0.0029, "step": 23146 }, { "epoch": 4.71, "learning_rate": 2.476472314638517e-06, "loss": 0.0001, "step": 23147 }, { "epoch": 4.71, "learning_rate": 2.472965541840438e-06, "loss": 0.001, "step": 23148 }, { "epoch": 4.71, "learning_rate": 2.469461233022346e-06, "loss": 0.0031, "step": 23149 }, { "epoch": 4.71, "learning_rate": 2.4659593882427108e-06, "loss": 0.0001, "step": 23150 }, { "epoch": 4.71, "learning_rate": 2.4624600075600353e-06, "loss": 0.0011, "step": 23151 }, { "epoch": 4.71, "learning_rate": 2.4589630910327896e-06, "loss": 0.0042, "step": 23152 }, { "epoch": 4.71, "learning_rate": 2.4554686387193436e-06, "loss": 0.0064, "step": 23153 }, { "epoch": 4.71, "learning_rate": 2.4519766506781e-06, "loss": 0.0019, "step": 23154 }, { "epoch": 4.71, "learning_rate": 2.4484871269673633e-06, "loss": 0.0037, "step": 23155 }, { "epoch": 4.72, "learning_rate": 2.445000067645403e-06, "loss": 0.0002, "step": 23156 }, { "epoch": 4.72, "learning_rate": 2.4415154727704888e-06, "loss": 0.0076, "step": 23157 }, { "epoch": 4.72, "learning_rate": 2.4380333424007912e-06, "loss": 0.0006, "step": 23158 }, { "epoch": 4.72, "learning_rate": 2.434553676594481e-06, "loss": 0.0, "step": 23159 }, { "epoch": 4.72, "learning_rate": 2.43107647540966e-06, "loss": 0.0005, "step": 23160 }, { "epoch": 4.72, "learning_rate": 2.4276017389044334e-06, "loss": 0.0034, "step": 23161 }, { "epoch": 4.72, "learning_rate": 2.4241294671368205e-06, "loss": 0.0004, "step": 23162 }, { "epoch": 4.72, "learning_rate": 2.4206596601648256e-06, "loss": 0.0043, "step": 23163 }, { "epoch": 4.72, "learning_rate": 2.417192318046368e-06, "loss": 0.0004, "step": 23164 }, { "epoch": 4.72, "learning_rate": 2.4137274408394023e-06, "loss": 0.0015, "step": 23165 }, { "epoch": 4.72, "learning_rate": 2.410265028601749e-06, "loss": 0.0008, "step": 23166 }, { "epoch": 4.72, "learning_rate": 2.406805081391294e-06, "loss": 0.0007, "step": 23167 }, { "epoch": 4.72, "learning_rate": 2.403347599265776e-06, "loss": 0.0007, "step": 23168 }, { "epoch": 4.72, "learning_rate": 2.3998925822829807e-06, "loss": 0.0002, "step": 23169 }, { "epoch": 4.72, "learning_rate": 2.3964400305005793e-06, "loss": 0.0014, "step": 23170 }, { "epoch": 4.72, "learning_rate": 2.392989943976242e-06, "loss": 0.0001, "step": 23171 }, { "epoch": 4.72, "learning_rate": 2.3895423227676238e-06, "loss": 0.0015, "step": 23172 }, { "epoch": 4.72, "learning_rate": 2.3860971669322606e-06, "loss": 0.002, "step": 23173 }, { "epoch": 4.72, "learning_rate": 2.38265447652774e-06, "loss": 0.0009, "step": 23174 }, { "epoch": 4.72, "learning_rate": 2.3792142516115164e-06, "loss": 0.0055, "step": 23175 }, { "epoch": 4.72, "learning_rate": 2.375776492241077e-06, "loss": 0.0, "step": 23176 }, { "epoch": 4.72, "learning_rate": 2.3723411984738263e-06, "loss": 0.0021, "step": 23177 }, { "epoch": 4.72, "learning_rate": 2.3689083703671676e-06, "loss": 0.0049, "step": 23178 }, { "epoch": 4.72, "learning_rate": 2.3654780079783718e-06, "loss": 0.0052, "step": 23179 }, { "epoch": 4.72, "learning_rate": 2.3620501113648105e-06, "loss": 0.0012, "step": 23180 }, { "epoch": 4.72, "learning_rate": 2.3586246805836704e-06, "loss": 0.0029, "step": 23181 }, { "epoch": 4.72, "learning_rate": 2.3552017156922066e-06, "loss": 0.0045, "step": 23182 }, { "epoch": 4.72, "learning_rate": 2.3517812167475724e-06, "loss": 0.0058, "step": 23183 }, { "epoch": 4.72, "learning_rate": 2.3483631838068893e-06, "loss": 0.0028, "step": 23184 }, { "epoch": 4.72, "learning_rate": 2.3449476169272784e-06, "loss": 0.0021, "step": 23185 }, { "epoch": 4.72, "learning_rate": 2.3415345161657273e-06, "loss": 0.0036, "step": 23186 }, { "epoch": 4.72, "learning_rate": 2.3381238815792903e-06, "loss": 0.0027, "step": 23187 }, { "epoch": 4.72, "learning_rate": 2.3347157132249215e-06, "loss": 0.0017, "step": 23188 }, { "epoch": 4.72, "learning_rate": 2.3313100111595264e-06, "loss": 0.0001, "step": 23189 }, { "epoch": 4.72, "learning_rate": 2.327906775440008e-06, "loss": 0.0002, "step": 23190 }, { "epoch": 4.72, "learning_rate": 2.324506006123189e-06, "loss": 0.0009, "step": 23191 }, { "epoch": 4.72, "learning_rate": 2.3211077032658898e-06, "loss": 0.0016, "step": 23192 }, { "epoch": 4.72, "learning_rate": 2.3177118669248485e-06, "loss": 0.0008, "step": 23193 }, { "epoch": 4.72, "learning_rate": 2.3143184971567863e-06, "loss": 0.0056, "step": 23194 }, { "epoch": 4.72, "learning_rate": 2.310927594018375e-06, "loss": 0.0029, "step": 23195 }, { "epoch": 4.72, "learning_rate": 2.307539157566285e-06, "loss": 0.0001, "step": 23196 }, { "epoch": 4.72, "learning_rate": 2.3041531878570385e-06, "loss": 0.0011, "step": 23197 }, { "epoch": 4.72, "learning_rate": 2.3007696849472566e-06, "loss": 0.0001, "step": 23198 }, { "epoch": 4.72, "learning_rate": 2.297388648893411e-06, "loss": 0.0071, "step": 23199 }, { "epoch": 4.72, "learning_rate": 2.2940100797520067e-06, "loss": 0.0003, "step": 23200 }, { "epoch": 4.72, "learning_rate": 2.290633977579431e-06, "loss": 0.0019, "step": 23201 }, { "epoch": 4.72, "learning_rate": 2.28726034243209e-06, "loss": 0.002, "step": 23202 }, { "epoch": 4.72, "learning_rate": 2.283889174366321e-06, "loss": 0.0001, "step": 23203 }, { "epoch": 4.72, "learning_rate": 2.2805204734384463e-06, "loss": 0.0002, "step": 23204 }, { "epoch": 4.72, "learning_rate": 2.2771542397047205e-06, "loss": 0.0048, "step": 23205 }, { "epoch": 4.73, "learning_rate": 2.2737904732213486e-06, "loss": 0.0042, "step": 23206 }, { "epoch": 4.73, "learning_rate": 2.2704291740445523e-06, "loss": 0.0016, "step": 23207 }, { "epoch": 4.73, "learning_rate": 2.267070342230437e-06, "loss": 0.0019, "step": 23208 }, { "epoch": 4.73, "learning_rate": 2.2637139778351243e-06, "loss": 0.0023, "step": 23209 }, { "epoch": 4.73, "learning_rate": 2.260360080914636e-06, "loss": 0.0004, "step": 23210 }, { "epoch": 4.73, "learning_rate": 2.2570086515250443e-06, "loss": 0.0019, "step": 23211 }, { "epoch": 4.73, "learning_rate": 2.2536596897222535e-06, "loss": 0.0018, "step": 23212 }, { "epoch": 4.73, "learning_rate": 2.2503131955622698e-06, "loss": 0.0003, "step": 23213 }, { "epoch": 4.73, "learning_rate": 2.2469691691009482e-06, "loss": 0.0004, "step": 23214 }, { "epoch": 4.73, "learning_rate": 2.2436276103941274e-06, "loss": 0.0004, "step": 23215 }, { "epoch": 4.73, "learning_rate": 2.240288519497646e-06, "loss": 0.0009, "step": 23216 }, { "epoch": 4.73, "learning_rate": 2.2369518964672593e-06, "loss": 0.0068, "step": 23217 }, { "epoch": 4.73, "learning_rate": 2.2336177413587066e-06, "loss": 0.0015, "step": 23218 }, { "epoch": 4.73, "learning_rate": 2.2302860542276758e-06, "loss": 0.0009, "step": 23219 }, { "epoch": 4.73, "learning_rate": 2.2269568351297894e-06, "loss": 0.0095, "step": 23220 }, { "epoch": 4.73, "learning_rate": 2.2236300841206535e-06, "loss": 0.0058, "step": 23221 }, { "epoch": 4.73, "learning_rate": 2.220305801255856e-06, "loss": 0.0005, "step": 23222 }, { "epoch": 4.73, "learning_rate": 2.2169839865909036e-06, "loss": 0.0007, "step": 23223 }, { "epoch": 4.73, "learning_rate": 2.2136646401812842e-06, "loss": 0.0057, "step": 23224 }, { "epoch": 4.73, "learning_rate": 2.2103477620824206e-06, "loss": 0.0001, "step": 23225 }, { "epoch": 4.73, "learning_rate": 2.2070333523497353e-06, "loss": 0.0004, "step": 23226 }, { "epoch": 4.73, "learning_rate": 2.203721411038567e-06, "loss": 0.0004, "step": 23227 }, { "epoch": 4.73, "learning_rate": 2.200411938204222e-06, "loss": 0.0014, "step": 23228 }, { "epoch": 4.73, "learning_rate": 2.197104933902022e-06, "loss": 0.0008, "step": 23229 }, { "epoch": 4.73, "learning_rate": 2.193800398187123e-06, "loss": 0.0016, "step": 23230 }, { "epoch": 4.73, "learning_rate": 2.1904983311147984e-06, "loss": 0.0006, "step": 23231 }, { "epoch": 4.73, "learning_rate": 2.187198732740153e-06, "loss": 0.0005, "step": 23232 }, { "epoch": 4.73, "learning_rate": 2.1839016031183097e-06, "loss": 0.0103, "step": 23233 }, { "epoch": 4.73, "learning_rate": 2.1806069423043084e-06, "loss": 0.0002, "step": 23234 }, { "epoch": 4.73, "learning_rate": 2.1773147503532206e-06, "loss": 0.0083, "step": 23235 }, { "epoch": 4.73, "learning_rate": 2.1740250273200032e-06, "loss": 0.0002, "step": 23236 }, { "epoch": 4.73, "learning_rate": 2.170737773259612e-06, "loss": 0.0015, "step": 23237 }, { "epoch": 4.73, "learning_rate": 2.1674529882269533e-06, "loss": 0.0007, "step": 23238 }, { "epoch": 4.73, "learning_rate": 2.1641706722768827e-06, "loss": 0.0042, "step": 23239 }, { "epoch": 4.73, "learning_rate": 2.1608908254642067e-06, "loss": 0.0003, "step": 23240 }, { "epoch": 4.73, "learning_rate": 2.1576134478437313e-06, "loss": 0.0004, "step": 23241 }, { "epoch": 4.73, "learning_rate": 2.154338539470196e-06, "loss": 0.0007, "step": 23242 }, { "epoch": 4.73, "learning_rate": 2.151066100398258e-06, "loss": 0.0014, "step": 23243 }, { "epoch": 4.73, "learning_rate": 2.147796130682622e-06, "loss": 0.0007, "step": 23244 }, { "epoch": 4.73, "learning_rate": 2.144528630377862e-06, "loss": 0.0002, "step": 23245 }, { "epoch": 4.73, "learning_rate": 2.141263599538584e-06, "loss": 0.0004, "step": 23246 }, { "epoch": 4.73, "learning_rate": 2.1380010382193115e-06, "loss": 0.0014, "step": 23247 }, { "epoch": 4.73, "learning_rate": 2.134740946474517e-06, "loss": 0.0097, "step": 23248 }, { "epoch": 4.73, "learning_rate": 2.1314833243586904e-06, "loss": 0.0001, "step": 23249 }, { "epoch": 4.73, "learning_rate": 2.1282281719261886e-06, "loss": 0.0043, "step": 23250 }, { "epoch": 4.73, "learning_rate": 2.1249754892314174e-06, "loss": 0.0004, "step": 23251 }, { "epoch": 4.73, "learning_rate": 2.121725276328684e-06, "loss": 0.0002, "step": 23252 }, { "epoch": 4.73, "learning_rate": 2.118477533272278e-06, "loss": 0.0001, "step": 23253 }, { "epoch": 4.73, "learning_rate": 2.1152322601164397e-06, "loss": 0.0003, "step": 23254 }, { "epoch": 4.74, "learning_rate": 2.111989456915375e-06, "loss": 0.0002, "step": 23255 }, { "epoch": 4.74, "learning_rate": 2.108749123723258e-06, "loss": 0.0004, "step": 23256 }, { "epoch": 4.74, "learning_rate": 2.105511260594178e-06, "loss": 0.001, "step": 23257 }, { "epoch": 4.74, "learning_rate": 2.102275867582243e-06, "loss": 0.0008, "step": 23258 }, { "epoch": 4.74, "learning_rate": 2.099042944741475e-06, "loss": 0.0005, "step": 23259 }, { "epoch": 4.74, "learning_rate": 2.0958124921258813e-06, "loss": 0.0001, "step": 23260 }, { "epoch": 4.74, "learning_rate": 2.0925845097893857e-06, "loss": 0.0007, "step": 23261 }, { "epoch": 4.74, "learning_rate": 2.089358997785945e-06, "loss": 0.0018, "step": 23262 }, { "epoch": 4.74, "learning_rate": 2.0861359561693822e-06, "loss": 0.0, "step": 23263 }, { "epoch": 4.74, "learning_rate": 2.0829153849935886e-06, "loss": 0.005, "step": 23264 }, { "epoch": 4.74, "learning_rate": 2.0796972843123037e-06, "loss": 0.0011, "step": 23265 }, { "epoch": 4.74, "learning_rate": 2.076481654179285e-06, "loss": 0.001, "step": 23266 }, { "epoch": 4.74, "learning_rate": 2.0732684946482724e-06, "loss": 0.0037, "step": 23267 }, { "epoch": 4.74, "learning_rate": 2.07005780577289e-06, "loss": 0.0012, "step": 23268 }, { "epoch": 4.74, "learning_rate": 2.0668495876067948e-06, "loss": 0.0001, "step": 23269 }, { "epoch": 4.74, "learning_rate": 2.063643840203544e-06, "loss": 0.0011, "step": 23270 }, { "epoch": 4.74, "learning_rate": 2.0604405636166943e-06, "loss": 0.0014, "step": 23271 }, { "epoch": 4.74, "learning_rate": 2.0572397578997367e-06, "loss": 0.0003, "step": 23272 }, { "epoch": 4.74, "learning_rate": 2.0540414231061287e-06, "loss": 0.0012, "step": 23273 }, { "epoch": 4.74, "learning_rate": 2.05084555928931e-06, "loss": 0.0004, "step": 23274 }, { "epoch": 4.74, "learning_rate": 2.047652166502656e-06, "loss": 0.0093, "step": 23275 }, { "epoch": 4.74, "learning_rate": 2.0444612447994726e-06, "loss": 0.0001, "step": 23276 }, { "epoch": 4.74, "learning_rate": 2.0412727942330675e-06, "loss": 0.0013, "step": 23277 }, { "epoch": 4.74, "learning_rate": 2.0380868148567152e-06, "loss": 0.0011, "step": 23278 }, { "epoch": 4.74, "learning_rate": 2.0349033067236064e-06, "loss": 0.0008, "step": 23279 }, { "epoch": 4.74, "learning_rate": 2.0317222698869152e-06, "loss": 0.0011, "step": 23280 }, { "epoch": 4.74, "learning_rate": 2.0285437043997655e-06, "loss": 0.0025, "step": 23281 }, { "epoch": 4.74, "learning_rate": 2.025367610315265e-06, "loss": 0.0008, "step": 23282 }, { "epoch": 4.74, "learning_rate": 2.022193987686438e-06, "loss": 0.0002, "step": 23283 }, { "epoch": 4.74, "learning_rate": 2.0190228365663088e-06, "loss": 0.0032, "step": 23284 }, { "epoch": 4.74, "learning_rate": 2.0158541570078178e-06, "loss": 0.0001, "step": 23285 }, { "epoch": 4.74, "learning_rate": 2.012687949063907e-06, "loss": 0.0002, "step": 23286 }, { "epoch": 4.74, "learning_rate": 2.00952421278745e-06, "loss": 0.0059, "step": 23287 }, { "epoch": 4.74, "learning_rate": 2.006362948231305e-06, "loss": 0.002, "step": 23288 }, { "epoch": 4.74, "learning_rate": 2.0032041554482457e-06, "loss": 0.0017, "step": 23289 }, { "epoch": 4.74, "learning_rate": 2.0000478344910474e-06, "loss": 0.0011, "step": 23290 }, { "epoch": 4.74, "learning_rate": 1.9968939854124013e-06, "loss": 0.0003, "step": 23291 }, { "epoch": 4.74, "learning_rate": 1.993742608265014e-06, "loss": 0.0001, "step": 23292 }, { "epoch": 4.74, "learning_rate": 1.9905937031015285e-06, "loss": 0.0016, "step": 23293 }, { "epoch": 4.74, "learning_rate": 1.987447269974485e-06, "loss": 0.0001, "step": 23294 }, { "epoch": 4.74, "learning_rate": 1.9843033089364745e-06, "loss": 0.0004, "step": 23295 }, { "epoch": 4.74, "learning_rate": 1.9811618200399895e-06, "loss": 0.0007, "step": 23296 }, { "epoch": 4.74, "learning_rate": 1.97802280333752e-06, "loss": 0.0001, "step": 23297 }, { "epoch": 4.74, "learning_rate": 1.9748862588814918e-06, "loss": 0.0002, "step": 23298 }, { "epoch": 4.74, "learning_rate": 1.9717521867242457e-06, "loss": 0.005, "step": 23299 }, { "epoch": 4.74, "learning_rate": 1.9686205869181905e-06, "loss": 0.0003, "step": 23300 }, { "epoch": 4.74, "learning_rate": 1.9654914595155836e-06, "loss": 0.0031, "step": 23301 }, { "epoch": 4.74, "learning_rate": 1.9623648045687334e-06, "loss": 0.0068, "step": 23302 }, { "epoch": 4.74, "learning_rate": 1.9592406221297985e-06, "loss": 0.0011, "step": 23303 }, { "epoch": 4.75, "learning_rate": 1.9561189122510036e-06, "loss": 0.0003, "step": 23304 }, { "epoch": 4.75, "learning_rate": 1.9529996749844734e-06, "loss": 0.0031, "step": 23305 }, { "epoch": 4.75, "learning_rate": 1.9498829103823166e-06, "loss": 0.0021, "step": 23306 }, { "epoch": 4.75, "learning_rate": 1.9467686184965748e-06, "loss": 0.0022, "step": 23307 }, { "epoch": 4.75, "learning_rate": 1.9436567993792563e-06, "loss": 0.0018, "step": 23308 }, { "epoch": 4.75, "learning_rate": 1.9405474530823527e-06, "loss": 0.014, "step": 23309 }, { "epoch": 4.75, "learning_rate": 1.9374405796577895e-06, "loss": 0.0001, "step": 23310 }, { "epoch": 4.75, "learning_rate": 1.934336179157475e-06, "loss": 0.0031, "step": 23311 }, { "epoch": 4.75, "learning_rate": 1.931234251633218e-06, "loss": 0.0001, "step": 23312 }, { "epoch": 4.75, "learning_rate": 1.92813479713686e-06, "loss": 0.0008, "step": 23313 }, { "epoch": 4.75, "learning_rate": 1.925037815720143e-06, "loss": 0.0005, "step": 23314 }, { "epoch": 4.75, "learning_rate": 1.921943307434809e-06, "loss": 0.0001, "step": 23315 }, { "epoch": 4.75, "learning_rate": 1.91885127233255e-06, "loss": 0.0041, "step": 23316 }, { "epoch": 4.75, "learning_rate": 1.915761710464991e-06, "loss": 0.0058, "step": 23317 }, { "epoch": 4.75, "learning_rate": 1.9126746218837417e-06, "loss": 0.0001, "step": 23318 }, { "epoch": 4.75, "learning_rate": 1.9095900066403436e-06, "loss": 0.0106, "step": 23319 }, { "epoch": 4.75, "learning_rate": 1.9065078647863551e-06, "loss": 0.0019, "step": 23320 }, { "epoch": 4.75, "learning_rate": 1.9034281963732189e-06, "loss": 0.0001, "step": 23321 }, { "epoch": 4.75, "learning_rate": 1.9003510014523938e-06, "loss": 0.0001, "step": 23322 }, { "epoch": 4.75, "learning_rate": 1.897276280075255e-06, "loss": 0.0005, "step": 23323 }, { "epoch": 4.75, "learning_rate": 1.8942040322931785e-06, "loss": 0.0045, "step": 23324 }, { "epoch": 4.75, "learning_rate": 1.8911342581574562e-06, "loss": 0.0092, "step": 23325 }, { "epoch": 4.75, "learning_rate": 1.8880669577193807e-06, "loss": 0.0017, "step": 23326 }, { "epoch": 4.75, "learning_rate": 1.8850021310301444e-06, "loss": 0.0018, "step": 23327 }, { "epoch": 4.75, "learning_rate": 1.8819397781409563e-06, "loss": 0.0029, "step": 23328 }, { "epoch": 4.75, "learning_rate": 1.878879899102992e-06, "loss": 0.0055, "step": 23329 }, { "epoch": 4.75, "learning_rate": 1.8758224939673106e-06, "loss": 0.0083, "step": 23330 }, { "epoch": 4.75, "learning_rate": 1.8727675627850214e-06, "loss": 0.0006, "step": 23331 }, { "epoch": 4.75, "learning_rate": 1.8697151056071002e-06, "loss": 0.0004, "step": 23332 }, { "epoch": 4.75, "learning_rate": 1.8666651224845731e-06, "loss": 0.0014, "step": 23333 }, { "epoch": 4.75, "learning_rate": 1.863617613468349e-06, "loss": 0.0002, "step": 23334 }, { "epoch": 4.75, "learning_rate": 1.8605725786093374e-06, "loss": 0.0015, "step": 23335 }, { "epoch": 4.75, "learning_rate": 1.8575300179583974e-06, "loss": 0.0003, "step": 23336 }, { "epoch": 4.75, "learning_rate": 1.8544899315663387e-06, "loss": 0.0001, "step": 23337 }, { "epoch": 4.75, "learning_rate": 1.8514523194839537e-06, "loss": 0.0118, "step": 23338 }, { "epoch": 4.75, "learning_rate": 1.848417181761952e-06, "loss": 0.0007, "step": 23339 }, { "epoch": 4.75, "learning_rate": 1.845384518451043e-06, "loss": 0.0007, "step": 23340 }, { "epoch": 4.75, "learning_rate": 1.8423543296018861e-06, "loss": 0.0024, "step": 23341 }, { "epoch": 4.75, "learning_rate": 1.8393266152650743e-06, "loss": 0.0005, "step": 23342 }, { "epoch": 4.75, "learning_rate": 1.836301375491167e-06, "loss": 0.0009, "step": 23343 }, { "epoch": 4.75, "learning_rate": 1.833278610330724e-06, "loss": 0.0002, "step": 23344 }, { "epoch": 4.75, "learning_rate": 1.8302583198342046e-06, "loss": 0.0013, "step": 23345 }, { "epoch": 4.75, "learning_rate": 1.8272405040520688e-06, "loss": 0.0002, "step": 23346 }, { "epoch": 4.75, "learning_rate": 1.8242251630346927e-06, "loss": 0.0026, "step": 23347 }, { "epoch": 4.75, "learning_rate": 1.821212296832486e-06, "loss": 0.004, "step": 23348 }, { "epoch": 4.75, "learning_rate": 1.8182019054957252e-06, "loss": 0.002, "step": 23349 }, { "epoch": 4.75, "learning_rate": 1.815193989074687e-06, "loss": 0.0018, "step": 23350 }, { "epoch": 4.75, "learning_rate": 1.812188547619664e-06, "loss": 0.0009, "step": 23351 }, { "epoch": 4.75, "learning_rate": 1.8091855811807832e-06, "loss": 0.0001, "step": 23352 }, { "epoch": 4.76, "learning_rate": 1.8061850898082708e-06, "loss": 0.0007, "step": 23353 }, { "epoch": 4.76, "learning_rate": 1.8031870735521869e-06, "loss": 0.0017, "step": 23354 }, { "epoch": 4.76, "learning_rate": 1.8001915324626082e-06, "loss": 0.0011, "step": 23355 }, { "epoch": 4.76, "learning_rate": 1.7971984665895778e-06, "loss": 0.003, "step": 23356 }, { "epoch": 4.76, "learning_rate": 1.7942078759831058e-06, "loss": 0.0003, "step": 23357 }, { "epoch": 4.76, "learning_rate": 1.7912197606931023e-06, "loss": 0.0017, "step": 23358 }, { "epoch": 4.76, "learning_rate": 1.7882341207694938e-06, "loss": 0.0021, "step": 23359 }, { "epoch": 4.76, "learning_rate": 1.7852509562621576e-06, "loss": 0.0001, "step": 23360 }, { "epoch": 4.76, "learning_rate": 1.7822702672208866e-06, "loss": 0.0021, "step": 23361 }, { "epoch": 4.76, "learning_rate": 1.779292053695508e-06, "loss": 0.0004, "step": 23362 }, { "epoch": 4.76, "learning_rate": 1.7763163157357153e-06, "loss": 0.0016, "step": 23363 }, { "epoch": 4.76, "learning_rate": 1.7733430533912518e-06, "loss": 0.0002, "step": 23364 }, { "epoch": 4.76, "learning_rate": 1.7703722667117281e-06, "loss": 0.0037, "step": 23365 }, { "epoch": 4.76, "learning_rate": 1.7674039557468212e-06, "loss": 0.0024, "step": 23366 }, { "epoch": 4.76, "learning_rate": 1.7644381205460745e-06, "loss": 0.0007, "step": 23367 }, { "epoch": 4.76, "learning_rate": 1.7614747611590152e-06, "loss": 0.0038, "step": 23368 }, { "epoch": 4.76, "learning_rate": 1.758513877635137e-06, "loss": 0.0016, "step": 23369 }, { "epoch": 4.76, "learning_rate": 1.7555554700239173e-06, "loss": 0.0002, "step": 23370 }, { "epoch": 4.76, "learning_rate": 1.7525995383747494e-06, "loss": 0.0007, "step": 23371 }, { "epoch": 4.76, "learning_rate": 1.7496460827370106e-06, "loss": 0.0006, "step": 23372 }, { "epoch": 4.76, "learning_rate": 1.7466951031600118e-06, "loss": 0.0009, "step": 23373 }, { "epoch": 4.76, "learning_rate": 1.7437465996930632e-06, "loss": 0.0019, "step": 23374 }, { "epoch": 4.76, "learning_rate": 1.7408005723853925e-06, "loss": 0.0017, "step": 23375 }, { "epoch": 4.76, "learning_rate": 1.7378570212862264e-06, "loss": 0.0046, "step": 23376 }, { "epoch": 4.76, "learning_rate": 1.7349159464447094e-06, "loss": 0.0009, "step": 23377 }, { "epoch": 4.76, "learning_rate": 1.7319773479099518e-06, "loss": 0.0023, "step": 23378 }, { "epoch": 4.76, "learning_rate": 1.7290412257310648e-06, "loss": 0.0039, "step": 23379 }, { "epoch": 4.76, "learning_rate": 1.7261075799570424e-06, "loss": 0.0078, "step": 23380 }, { "epoch": 4.76, "learning_rate": 1.7231764106369284e-06, "loss": 0.0003, "step": 23381 }, { "epoch": 4.76, "learning_rate": 1.7202477178196838e-06, "loss": 0.0, "step": 23382 }, { "epoch": 4.76, "learning_rate": 1.7173215015541531e-06, "loss": 0.0017, "step": 23383 }, { "epoch": 4.76, "learning_rate": 1.7143977618892968e-06, "loss": 0.0035, "step": 23384 }, { "epoch": 4.76, "learning_rate": 1.7114764988738927e-06, "loss": 0.0003, "step": 23385 }, { "epoch": 4.76, "learning_rate": 1.7085577125567517e-06, "loss": 0.0001, "step": 23386 }, { "epoch": 4.76, "learning_rate": 1.7056414029866016e-06, "loss": 0.0034, "step": 23387 }, { "epoch": 4.76, "learning_rate": 1.7027275702121702e-06, "loss": 0.0013, "step": 23388 }, { "epoch": 4.76, "learning_rate": 1.699816214282118e-06, "loss": 0.0002, "step": 23389 }, { "epoch": 4.76, "learning_rate": 1.69690733524509e-06, "loss": 0.0015, "step": 23390 }, { "epoch": 4.76, "learning_rate": 1.6940009331496308e-06, "loss": 0.0033, "step": 23391 }, { "epoch": 4.76, "learning_rate": 1.6910970080443008e-06, "loss": 0.0001, "step": 23392 }, { "epoch": 4.76, "learning_rate": 1.6881955599776288e-06, "loss": 0.0114, "step": 23393 }, { "epoch": 4.76, "learning_rate": 1.6852965889980251e-06, "loss": 0.0001, "step": 23394 }, { "epoch": 4.76, "learning_rate": 1.6824000951539518e-06, "loss": 0.0001, "step": 23395 }, { "epoch": 4.76, "learning_rate": 1.6795060784937363e-06, "loss": 0.0001, "step": 23396 }, { "epoch": 4.76, "learning_rate": 1.6766145390657737e-06, "loss": 0.0019, "step": 23397 }, { "epoch": 4.76, "learning_rate": 1.6737254769183085e-06, "loss": 0.0019, "step": 23398 }, { "epoch": 4.76, "learning_rate": 1.6708388920996352e-06, "loss": 0.0024, "step": 23399 }, { "epoch": 4.76, "learning_rate": 1.6679547846579323e-06, "loss": 0.0015, "step": 23400 }, { "epoch": 4.76, "learning_rate": 1.6650731546413776e-06, "loss": 0.0054, "step": 23401 }, { "epoch": 4.77, "learning_rate": 1.6621940020980995e-06, "loss": 0.0019, "step": 23402 }, { "epoch": 4.77, "learning_rate": 1.6593173270761927e-06, "loss": 0.0012, "step": 23403 }, { "epoch": 4.77, "learning_rate": 1.6564431296237023e-06, "loss": 0.0019, "step": 23404 }, { "epoch": 4.77, "learning_rate": 1.6535714097886399e-06, "loss": 0.003, "step": 23405 }, { "epoch": 4.77, "learning_rate": 1.6507021676189503e-06, "loss": 0.0026, "step": 23406 }, { "epoch": 4.77, "learning_rate": 1.6478354031625451e-06, "loss": 0.001, "step": 23407 }, { "epoch": 4.77, "learning_rate": 1.644971116467353e-06, "loss": 0.0006, "step": 23408 }, { "epoch": 4.77, "learning_rate": 1.6421093075811687e-06, "loss": 0.0021, "step": 23409 }, { "epoch": 4.77, "learning_rate": 1.6392499765518042e-06, "loss": 0.0004, "step": 23410 }, { "epoch": 4.77, "learning_rate": 1.6363931234270044e-06, "loss": 0.0003, "step": 23411 }, { "epoch": 4.77, "learning_rate": 1.6335387482545148e-06, "loss": 0.0001, "step": 23412 }, { "epoch": 4.77, "learning_rate": 1.630686851081997e-06, "loss": 0.0003, "step": 23413 }, { "epoch": 4.77, "learning_rate": 1.6278374319570465e-06, "loss": 0.0015, "step": 23414 }, { "epoch": 4.77, "learning_rate": 1.624990490927308e-06, "loss": 0.0003, "step": 23415 }, { "epoch": 4.77, "learning_rate": 1.6221460280402942e-06, "loss": 0.0003, "step": 23416 }, { "epoch": 4.77, "learning_rate": 1.6193040433435333e-06, "loss": 0.0007, "step": 23417 }, { "epoch": 4.77, "learning_rate": 1.616464536884471e-06, "loss": 0.0023, "step": 23418 }, { "epoch": 4.77, "learning_rate": 1.6136275087105522e-06, "loss": 0.0014, "step": 23419 }, { "epoch": 4.77, "learning_rate": 1.610792958869156e-06, "loss": 0.0001, "step": 23420 }, { "epoch": 4.77, "learning_rate": 1.607960887407611e-06, "loss": 0.0007, "step": 23421 }, { "epoch": 4.77, "learning_rate": 1.6051312943732297e-06, "loss": 0.0006, "step": 23422 }, { "epoch": 4.77, "learning_rate": 1.6023041798132741e-06, "loss": 0.0001, "step": 23423 }, { "epoch": 4.77, "learning_rate": 1.599479543774973e-06, "loss": 0.0003, "step": 23424 }, { "epoch": 4.77, "learning_rate": 1.5966573863054722e-06, "loss": 0.0004, "step": 23425 }, { "epoch": 4.77, "learning_rate": 1.5938377074519338e-06, "loss": 0.0037, "step": 23426 }, { "epoch": 4.77, "learning_rate": 1.5910205072614368e-06, "loss": 0.0008, "step": 23427 }, { "epoch": 4.77, "learning_rate": 1.5882057857810438e-06, "loss": 0.0002, "step": 23428 }, { "epoch": 4.77, "learning_rate": 1.5853935430577501e-06, "loss": 0.0044, "step": 23429 }, { "epoch": 4.77, "learning_rate": 1.582583779138552e-06, "loss": 0.0007, "step": 23430 }, { "epoch": 4.77, "learning_rate": 1.5797764940703617e-06, "loss": 0.0064, "step": 23431 }, { "epoch": 4.77, "learning_rate": 1.5769716879000583e-06, "loss": 0.0004, "step": 23432 }, { "epoch": 4.77, "learning_rate": 1.5741693606745043e-06, "loss": 0.0005, "step": 23433 }, { "epoch": 4.77, "learning_rate": 1.571369512440479e-06, "loss": 0.0022, "step": 23434 }, { "epoch": 4.77, "learning_rate": 1.5685721432447785e-06, "loss": 0.0019, "step": 23435 }, { "epoch": 4.77, "learning_rate": 1.5657772531340983e-06, "loss": 0.0016, "step": 23436 }, { "epoch": 4.77, "learning_rate": 1.562984842155135e-06, "loss": 0.0003, "step": 23437 }, { "epoch": 4.77, "learning_rate": 1.560194910354501e-06, "loss": 0.0001, "step": 23438 }, { "epoch": 4.77, "learning_rate": 1.5574074577788254e-06, "loss": 0.0009, "step": 23439 }, { "epoch": 4.77, "learning_rate": 1.5546224844746548e-06, "loss": 0.0001, "step": 23440 }, { "epoch": 4.77, "learning_rate": 1.5518399904885014e-06, "loss": 0.0014, "step": 23441 }, { "epoch": 4.77, "learning_rate": 1.5490599758668286e-06, "loss": 0.0001, "step": 23442 }, { "epoch": 4.77, "learning_rate": 1.546282440656066e-06, "loss": 0.0002, "step": 23443 }, { "epoch": 4.77, "learning_rate": 1.5435073849026259e-06, "loss": 0.0004, "step": 23444 }, { "epoch": 4.77, "learning_rate": 1.5407348086528381e-06, "loss": 0.0003, "step": 23445 }, { "epoch": 4.77, "learning_rate": 1.5379647119530325e-06, "loss": 0.0012, "step": 23446 }, { "epoch": 4.77, "learning_rate": 1.5351970948494385e-06, "loss": 0.0022, "step": 23447 }, { "epoch": 4.77, "learning_rate": 1.5324319573883192e-06, "loss": 0.0001, "step": 23448 }, { "epoch": 4.77, "learning_rate": 1.5296692996158045e-06, "loss": 0.0008, "step": 23449 }, { "epoch": 4.77, "learning_rate": 1.526909121578107e-06, "loss": 0.0006, "step": 23450 }, { "epoch": 4.78, "learning_rate": 1.5241514233212737e-06, "loss": 0.0031, "step": 23451 }, { "epoch": 4.78, "learning_rate": 1.5213962048913842e-06, "loss": 0.0013, "step": 23452 }, { "epoch": 4.78, "learning_rate": 1.5186434663344515e-06, "loss": 0.0014, "step": 23453 }, { "epoch": 4.78, "learning_rate": 1.5158932076964392e-06, "loss": 0.0011, "step": 23454 }, { "epoch": 4.78, "learning_rate": 1.5131454290233102e-06, "loss": 0.0006, "step": 23455 }, { "epoch": 4.78, "learning_rate": 1.5104001303609282e-06, "loss": 0.0013, "step": 23456 }, { "epoch": 4.78, "learning_rate": 1.507657311755156e-06, "loss": 0.0006, "step": 23457 }, { "epoch": 4.78, "learning_rate": 1.5049169732518075e-06, "loss": 0.0043, "step": 23458 }, { "epoch": 4.78, "learning_rate": 1.5021791148966789e-06, "loss": 0.0002, "step": 23459 }, { "epoch": 4.78, "learning_rate": 1.4994437367354339e-06, "loss": 0.0014, "step": 23460 }, { "epoch": 4.78, "learning_rate": 1.4967108388138027e-06, "loss": 0.0002, "step": 23461 }, { "epoch": 4.78, "learning_rate": 1.4939804211774153e-06, "loss": 0.0001, "step": 23462 }, { "epoch": 4.78, "learning_rate": 1.4912524838718852e-06, "loss": 0.0023, "step": 23463 }, { "epoch": 4.78, "learning_rate": 1.4885270269427763e-06, "loss": 0.0018, "step": 23464 }, { "epoch": 4.78, "learning_rate": 1.4858040504355851e-06, "loss": 0.0004, "step": 23465 }, { "epoch": 4.78, "learning_rate": 1.4830835543958254e-06, "loss": 0.0009, "step": 23466 }, { "epoch": 4.78, "learning_rate": 1.480365538868894e-06, "loss": 0.0028, "step": 23467 }, { "epoch": 4.78, "learning_rate": 1.4776500039002381e-06, "loss": 0.0022, "step": 23468 }, { "epoch": 4.78, "learning_rate": 1.4749369495351715e-06, "loss": 0.0007, "step": 23469 }, { "epoch": 4.78, "learning_rate": 1.4722263758190077e-06, "loss": 0.001, "step": 23470 }, { "epoch": 4.78, "learning_rate": 1.4695182827970276e-06, "loss": 0.0006, "step": 23471 }, { "epoch": 4.78, "learning_rate": 1.4668126705144777e-06, "loss": 0.0014, "step": 23472 }, { "epoch": 4.78, "learning_rate": 1.4641095390165225e-06, "loss": 0.0036, "step": 23473 }, { "epoch": 4.78, "learning_rate": 1.4614088883483255e-06, "loss": 0.0004, "step": 23474 }, { "epoch": 4.78, "learning_rate": 1.458710718554984e-06, "loss": 0.0003, "step": 23475 }, { "epoch": 4.78, "learning_rate": 1.456015029681562e-06, "loss": 0.0005, "step": 23476 }, { "epoch": 4.78, "learning_rate": 1.4533218217730901e-06, "loss": 0.001, "step": 23477 }, { "epoch": 4.78, "learning_rate": 1.4506310948745493e-06, "loss": 0.0005, "step": 23478 }, { "epoch": 4.78, "learning_rate": 1.4479428490308697e-06, "loss": 0.0005, "step": 23479 }, { "epoch": 4.78, "learning_rate": 1.4452570842869493e-06, "loss": 0.001, "step": 23480 }, { "epoch": 4.78, "learning_rate": 1.4425738006876686e-06, "loss": 0.0026, "step": 23481 }, { "epoch": 4.78, "learning_rate": 1.439892998277825e-06, "loss": 0.0016, "step": 23482 }, { "epoch": 4.78, "learning_rate": 1.437214677102183e-06, "loss": 0.0055, "step": 23483 }, { "epoch": 4.78, "learning_rate": 1.4345388372055067e-06, "loss": 0.0, "step": 23484 }, { "epoch": 4.78, "learning_rate": 1.4318654786324434e-06, "loss": 0.0012, "step": 23485 }, { "epoch": 4.78, "learning_rate": 1.429194601427691e-06, "loss": 0.0005, "step": 23486 }, { "epoch": 4.78, "learning_rate": 1.4265262056358307e-06, "loss": 0.0049, "step": 23487 }, { "epoch": 4.78, "learning_rate": 1.4238602913014263e-06, "loss": 0.0006, "step": 23488 }, { "epoch": 4.78, "learning_rate": 1.4211968584690092e-06, "loss": 0.0015, "step": 23489 }, { "epoch": 4.78, "learning_rate": 1.418535907183077e-06, "loss": 0.0024, "step": 23490 }, { "epoch": 4.78, "learning_rate": 1.415877437488061e-06, "loss": 0.0005, "step": 23491 }, { "epoch": 4.78, "learning_rate": 1.4132214494283755e-06, "loss": 0.001, "step": 23492 }, { "epoch": 4.78, "learning_rate": 1.4105679430483518e-06, "loss": 0.0003, "step": 23493 }, { "epoch": 4.78, "learning_rate": 1.4079169183923377e-06, "loss": 0.0018, "step": 23494 }, { "epoch": 4.78, "learning_rate": 1.4052683755045812e-06, "loss": 0.0002, "step": 23495 }, { "epoch": 4.78, "learning_rate": 1.402622314429347e-06, "loss": 0.0011, "step": 23496 }, { "epoch": 4.78, "learning_rate": 1.3999787352108326e-06, "loss": 0.0001, "step": 23497 }, { "epoch": 4.78, "learning_rate": 1.3973376378931533e-06, "loss": 0.0052, "step": 23498 }, { "epoch": 4.78, "learning_rate": 1.3946990225204569e-06, "loss": 0.0001, "step": 23499 }, { "epoch": 4.79, "learning_rate": 1.3920628891367913e-06, "loss": 0.0027, "step": 23500 }, { "epoch": 4.79, "learning_rate": 1.3894292377861883e-06, "loss": 0.001, "step": 23501 }, { "epoch": 4.79, "learning_rate": 1.3867980685126457e-06, "loss": 0.0003, "step": 23502 }, { "epoch": 4.79, "learning_rate": 1.3841693813601118e-06, "loss": 0.001, "step": 23503 }, { "epoch": 4.79, "learning_rate": 1.3815431763724683e-06, "loss": 0.0002, "step": 23504 }, { "epoch": 4.79, "learning_rate": 1.3789194535935967e-06, "loss": 0.0008, "step": 23505 }, { "epoch": 4.79, "learning_rate": 1.3762982130673116e-06, "loss": 0.0078, "step": 23506 }, { "epoch": 4.79, "learning_rate": 1.3736794548373953e-06, "loss": 0.0002, "step": 23507 }, { "epoch": 4.79, "learning_rate": 1.371063178947579e-06, "loss": 0.0005, "step": 23508 }, { "epoch": 4.79, "learning_rate": 1.3684493854415612e-06, "loss": 0.0012, "step": 23509 }, { "epoch": 4.79, "learning_rate": 1.3658380743630071e-06, "loss": 0.0017, "step": 23510 }, { "epoch": 4.79, "learning_rate": 1.3632292457555149e-06, "loss": 0.0023, "step": 23511 }, { "epoch": 4.79, "learning_rate": 1.3606228996626833e-06, "loss": 0.0038, "step": 23512 }, { "epoch": 4.79, "learning_rate": 1.3580190361280108e-06, "loss": 0.0001, "step": 23513 }, { "epoch": 4.79, "learning_rate": 1.3554176551950124e-06, "loss": 0.0009, "step": 23514 }, { "epoch": 4.79, "learning_rate": 1.3528187569071202e-06, "loss": 0.0001, "step": 23515 }, { "epoch": 4.79, "learning_rate": 1.3502223413077496e-06, "loss": 0.0002, "step": 23516 }, { "epoch": 4.79, "learning_rate": 1.3476284084402654e-06, "loss": 0.0067, "step": 23517 }, { "epoch": 4.79, "learning_rate": 1.345036958347967e-06, "loss": 0.0019, "step": 23518 }, { "epoch": 4.79, "learning_rate": 1.3424479910741859e-06, "loss": 0.0001, "step": 23519 }, { "epoch": 4.79, "learning_rate": 1.339861506662121e-06, "loss": 0.0011, "step": 23520 }, { "epoch": 4.79, "learning_rate": 1.3372775051549877e-06, "loss": 0.0004, "step": 23521 }, { "epoch": 4.79, "learning_rate": 1.334695986595935e-06, "loss": 0.0007, "step": 23522 }, { "epoch": 4.79, "learning_rate": 1.332116951028095e-06, "loss": 0.0002, "step": 23523 }, { "epoch": 4.79, "learning_rate": 1.3295403984945164e-06, "loss": 0.0009, "step": 23524 }, { "epoch": 4.79, "learning_rate": 1.3269663290382648e-06, "loss": 0.0053, "step": 23525 }, { "epoch": 4.79, "learning_rate": 1.324394742702306e-06, "loss": 0.0016, "step": 23526 }, { "epoch": 4.79, "learning_rate": 1.3218256395296056e-06, "loss": 0.0002, "step": 23527 }, { "epoch": 4.79, "learning_rate": 1.3192590195630625e-06, "loss": 0.0034, "step": 23528 }, { "epoch": 4.79, "learning_rate": 1.3166948828455425e-06, "loss": 0.0015, "step": 23529 }, { "epoch": 4.79, "learning_rate": 1.3141332294198948e-06, "loss": 0.002, "step": 23530 }, { "epoch": 4.79, "learning_rate": 1.3115740593288683e-06, "loss": 0.0025, "step": 23531 }, { "epoch": 4.79, "learning_rate": 1.3090173726152453e-06, "loss": 0.0003, "step": 23532 }, { "epoch": 4.79, "learning_rate": 1.3064631693216921e-06, "loss": 0.0002, "step": 23533 }, { "epoch": 4.79, "learning_rate": 1.3039114494908908e-06, "loss": 0.0022, "step": 23534 }, { "epoch": 4.79, "learning_rate": 1.3013622131654412e-06, "loss": 0.0038, "step": 23535 }, { "epoch": 4.79, "learning_rate": 1.2988154603879419e-06, "loss": 0.0025, "step": 23536 }, { "epoch": 4.79, "learning_rate": 1.2962711912009094e-06, "loss": 0.0023, "step": 23537 }, { "epoch": 4.79, "learning_rate": 1.293729405646843e-06, "loss": 0.0002, "step": 23538 }, { "epoch": 4.79, "learning_rate": 1.2911901037682083e-06, "loss": 0.0035, "step": 23539 }, { "epoch": 4.79, "learning_rate": 1.288653285607405e-06, "loss": 0.0004, "step": 23540 }, { "epoch": 4.79, "learning_rate": 1.2861189512067994e-06, "loss": 0.0037, "step": 23541 }, { "epoch": 4.79, "learning_rate": 1.283587100608724e-06, "loss": 0.005, "step": 23542 }, { "epoch": 4.79, "learning_rate": 1.2810577338554783e-06, "loss": 0.0001, "step": 23543 }, { "epoch": 4.79, "learning_rate": 1.2785308509892788e-06, "loss": 0.0003, "step": 23544 }, { "epoch": 4.79, "learning_rate": 1.2760064520523583e-06, "loss": 0.0008, "step": 23545 }, { "epoch": 4.79, "learning_rate": 1.2734845370868496e-06, "loss": 0.0025, "step": 23546 }, { "epoch": 4.79, "learning_rate": 1.2709651061349025e-06, "loss": 0.0009, "step": 23547 }, { "epoch": 4.79, "learning_rate": 1.2684481592385998e-06, "loss": 0.0005, "step": 23548 }, { "epoch": 4.8, "learning_rate": 1.2659336964399414e-06, "loss": 0.0045, "step": 23549 }, { "epoch": 4.8, "learning_rate": 1.2634217177809603e-06, "loss": 0.0004, "step": 23550 }, { "epoch": 4.8, "learning_rate": 1.2609122233035728e-06, "loss": 0.0001, "step": 23551 }, { "epoch": 4.8, "learning_rate": 1.2584052130497457e-06, "loss": 0.0004, "step": 23552 }, { "epoch": 4.8, "learning_rate": 1.255900687061312e-06, "loss": 0.0014, "step": 23553 }, { "epoch": 4.8, "learning_rate": 1.2533986453801048e-06, "loss": 0.0003, "step": 23554 }, { "epoch": 4.8, "learning_rate": 1.2508990880479076e-06, "loss": 0.0049, "step": 23555 }, { "epoch": 4.8, "learning_rate": 1.2484020151065034e-06, "loss": 0.0036, "step": 23556 }, { "epoch": 4.8, "learning_rate": 1.245907426597559e-06, "loss": 0.0007, "step": 23557 }, { "epoch": 4.8, "learning_rate": 1.2434153225627574e-06, "loss": 0.0041, "step": 23558 }, { "epoch": 4.8, "learning_rate": 1.2409257030437158e-06, "loss": 0.0035, "step": 23559 }, { "epoch": 4.8, "learning_rate": 1.2384385680820174e-06, "loss": 0.0002, "step": 23560 }, { "epoch": 4.8, "learning_rate": 1.235953917719229e-06, "loss": 0.0003, "step": 23561 }, { "epoch": 4.8, "learning_rate": 1.233471751996784e-06, "loss": 0.0054, "step": 23562 }, { "epoch": 4.8, "learning_rate": 1.2309920709561994e-06, "loss": 0.0022, "step": 23563 }, { "epoch": 4.8, "learning_rate": 1.2285148746388584e-06, "loss": 0.0008, "step": 23564 }, { "epoch": 4.8, "learning_rate": 1.226040163086145e-06, "loss": 0.0002, "step": 23565 }, { "epoch": 4.8, "learning_rate": 1.2235679363393925e-06, "loss": 0.0002, "step": 23566 }, { "epoch": 4.8, "learning_rate": 1.2210981944399011e-06, "loss": 0.0001, "step": 23567 }, { "epoch": 4.8, "learning_rate": 1.218630937428905e-06, "loss": 0.0008, "step": 23568 }, { "epoch": 4.8, "learning_rate": 1.216166165347604e-06, "loss": 0.0001, "step": 23569 }, { "epoch": 4.8, "learning_rate": 1.2137038782371989e-06, "loss": 0.0019, "step": 23570 }, { "epoch": 4.8, "learning_rate": 1.2112440761387732e-06, "loss": 0.0055, "step": 23571 }, { "epoch": 4.8, "learning_rate": 1.2087867590934442e-06, "loss": 0.0003, "step": 23572 }, { "epoch": 4.8, "learning_rate": 1.206331927142229e-06, "loss": 0.002, "step": 23573 }, { "epoch": 4.8, "learning_rate": 1.2038795803261448e-06, "loss": 0.0011, "step": 23574 }, { "epoch": 4.8, "learning_rate": 1.201429718686142e-06, "loss": 0.0001, "step": 23575 }, { "epoch": 4.8, "learning_rate": 1.1989823422631384e-06, "loss": 0.0025, "step": 23576 }, { "epoch": 4.8, "learning_rate": 1.1965374510980175e-06, "loss": 0.0006, "step": 23577 }, { "epoch": 4.8, "learning_rate": 1.1940950452315967e-06, "loss": 0.0019, "step": 23578 }, { "epoch": 4.8, "learning_rate": 1.1916551247046935e-06, "loss": 0.0001, "step": 23579 }, { "epoch": 4.8, "learning_rate": 1.189217689558042e-06, "loss": 0.0025, "step": 23580 }, { "epoch": 4.8, "learning_rate": 1.1867827398323593e-06, "loss": 0.0004, "step": 23581 }, { "epoch": 4.8, "learning_rate": 1.1843502755682966e-06, "loss": 0.0015, "step": 23582 }, { "epoch": 4.8, "learning_rate": 1.1819202968065045e-06, "loss": 0.0043, "step": 23583 }, { "epoch": 4.8, "learning_rate": 1.1794928035875507e-06, "loss": 0.0029, "step": 23584 }, { "epoch": 4.8, "learning_rate": 1.177067795951986e-06, "loss": 0.0002, "step": 23585 }, { "epoch": 4.8, "learning_rate": 1.1746452739403111e-06, "loss": 0.0022, "step": 23586 }, { "epoch": 4.8, "learning_rate": 1.1722252375929942e-06, "loss": 0.0002, "step": 23587 }, { "epoch": 4.8, "learning_rate": 1.169807686950436e-06, "loss": 0.0006, "step": 23588 }, { "epoch": 4.8, "learning_rate": 1.1673926220530371e-06, "loss": 0.0014, "step": 23589 }, { "epoch": 4.8, "learning_rate": 1.1649800429411327e-06, "loss": 0.0003, "step": 23590 }, { "epoch": 4.8, "learning_rate": 1.16256994965499e-06, "loss": 0.0013, "step": 23591 }, { "epoch": 4.8, "learning_rate": 1.160162342234877e-06, "loss": 0.0001, "step": 23592 }, { "epoch": 4.8, "learning_rate": 1.1577572207210283e-06, "loss": 0.0031, "step": 23593 }, { "epoch": 4.8, "learning_rate": 1.1553545851535784e-06, "loss": 0.0004, "step": 23594 }, { "epoch": 4.8, "learning_rate": 1.1529544355726783e-06, "loss": 0.0005, "step": 23595 }, { "epoch": 4.8, "learning_rate": 1.1505567720184127e-06, "loss": 0.0039, "step": 23596 }, { "epoch": 4.8, "learning_rate": 1.1481615945307999e-06, "loss": 0.0033, "step": 23597 }, { "epoch": 4.81, "learning_rate": 1.1457689031498906e-06, "loss": 0.0007, "step": 23598 }, { "epoch": 4.81, "learning_rate": 1.1433786979156035e-06, "loss": 0.0001, "step": 23599 }, { "epoch": 4.81, "learning_rate": 1.1409909788678895e-06, "loss": 0.0001, "step": 23600 }, { "epoch": 4.81, "learning_rate": 1.138605746046617e-06, "loss": 0.0005, "step": 23601 }, { "epoch": 4.81, "learning_rate": 1.1362229994916206e-06, "loss": 0.001, "step": 23602 }, { "epoch": 4.81, "learning_rate": 1.1338427392427018e-06, "loss": 0.0028, "step": 23603 }, { "epoch": 4.81, "learning_rate": 1.1314649653396123e-06, "loss": 0.0053, "step": 23604 }, { "epoch": 4.81, "learning_rate": 1.1290896778220703e-06, "loss": 0.0052, "step": 23605 }, { "epoch": 4.81, "learning_rate": 1.126716876729744e-06, "loss": 0.0045, "step": 23606 }, { "epoch": 4.81, "learning_rate": 1.1243465621022685e-06, "loss": 0.0023, "step": 23607 }, { "epoch": 4.81, "learning_rate": 1.1219787339792286e-06, "loss": 0.0003, "step": 23608 }, { "epoch": 4.81, "learning_rate": 1.1196133924001592e-06, "loss": 0.0022, "step": 23609 }, { "epoch": 4.81, "learning_rate": 1.1172505374045793e-06, "loss": 0.0019, "step": 23610 }, { "epoch": 4.81, "learning_rate": 1.1148901690319568e-06, "loss": 0.0017, "step": 23611 }, { "epoch": 4.81, "learning_rate": 1.1125322873217269e-06, "loss": 0.0048, "step": 23612 }, { "epoch": 4.81, "learning_rate": 1.1101768923132247e-06, "loss": 0.0003, "step": 23613 }, { "epoch": 4.81, "learning_rate": 1.1078239840458359e-06, "loss": 0.0011, "step": 23614 }, { "epoch": 4.81, "learning_rate": 1.1054735625588284e-06, "loss": 0.0021, "step": 23615 }, { "epoch": 4.81, "learning_rate": 1.1031256278914712e-06, "loss": 0.0027, "step": 23616 }, { "epoch": 4.81, "learning_rate": 1.100780180082983e-06, "loss": 0.0001, "step": 23617 }, { "epoch": 4.81, "learning_rate": 1.098437219172532e-06, "loss": 0.0001, "step": 23618 }, { "epoch": 4.81, "learning_rate": 1.0960967451992543e-06, "loss": 0.0012, "step": 23619 }, { "epoch": 4.81, "learning_rate": 1.0937587582022345e-06, "loss": 0.0005, "step": 23620 }, { "epoch": 4.81, "learning_rate": 1.0914232582205252e-06, "loss": 0.0004, "step": 23621 }, { "epoch": 4.81, "learning_rate": 1.0890902452931282e-06, "loss": 0.0001, "step": 23622 }, { "epoch": 4.81, "learning_rate": 1.0867597194590127e-06, "loss": 0.0027, "step": 23623 }, { "epoch": 4.81, "learning_rate": 1.0844316807571141e-06, "loss": 0.0003, "step": 23624 }, { "epoch": 4.81, "learning_rate": 1.082106129226301e-06, "loss": 0.0031, "step": 23625 }, { "epoch": 4.81, "learning_rate": 1.0797830649054096e-06, "loss": 0.0001, "step": 23626 }, { "epoch": 4.81, "learning_rate": 1.0774624878332583e-06, "loss": 0.0014, "step": 23627 }, { "epoch": 4.81, "learning_rate": 1.075144398048583e-06, "loss": 0.0011, "step": 23628 }, { "epoch": 4.81, "learning_rate": 1.0728287955901195e-06, "loss": 0.0002, "step": 23629 }, { "epoch": 4.81, "learning_rate": 1.0705156804965365e-06, "loss": 0.001, "step": 23630 }, { "epoch": 4.81, "learning_rate": 1.0682050528064534e-06, "loss": 0.0015, "step": 23631 }, { "epoch": 4.81, "learning_rate": 1.0658969125584893e-06, "loss": 0.0038, "step": 23632 }, { "epoch": 4.81, "learning_rate": 1.0635912597911633e-06, "loss": 0.0023, "step": 23633 }, { "epoch": 4.81, "learning_rate": 1.061288094543028e-06, "loss": 0.0024, "step": 23634 }, { "epoch": 4.81, "learning_rate": 1.0589874168525025e-06, "loss": 0.0013, "step": 23635 }, { "epoch": 4.81, "learning_rate": 1.0566892267580395e-06, "loss": 0.0005, "step": 23636 }, { "epoch": 4.81, "learning_rate": 1.0543935242980085e-06, "loss": 0.001, "step": 23637 }, { "epoch": 4.81, "learning_rate": 1.0521003095107782e-06, "loss": 0.0068, "step": 23638 }, { "epoch": 4.81, "learning_rate": 1.0498095824346187e-06, "loss": 0.0013, "step": 23639 }, { "epoch": 4.81, "learning_rate": 1.0475213431077989e-06, "loss": 0.0033, "step": 23640 }, { "epoch": 4.81, "learning_rate": 1.045235591568555e-06, "loss": 0.0009, "step": 23641 }, { "epoch": 4.81, "learning_rate": 1.04295232785504e-06, "loss": 0.0013, "step": 23642 }, { "epoch": 4.81, "learning_rate": 1.0406715520053899e-06, "loss": 0.0025, "step": 23643 }, { "epoch": 4.81, "learning_rate": 1.0383932640577075e-06, "loss": 0.0, "step": 23644 }, { "epoch": 4.81, "learning_rate": 1.0361174640500626e-06, "loss": 0.0001, "step": 23645 }, { "epoch": 4.81, "learning_rate": 1.0338441520204243e-06, "loss": 0.0077, "step": 23646 }, { "epoch": 4.81, "learning_rate": 1.0315733280067962e-06, "loss": 0.0035, "step": 23647 }, { "epoch": 4.82, "learning_rate": 1.0293049920470643e-06, "loss": 0.0, "step": 23648 }, { "epoch": 4.82, "learning_rate": 1.0270391441791813e-06, "loss": 0.0022, "step": 23649 }, { "epoch": 4.82, "learning_rate": 1.0247757844409177e-06, "loss": 0.0017, "step": 23650 }, { "epoch": 4.82, "learning_rate": 1.022514912870126e-06, "loss": 0.0009, "step": 23651 }, { "epoch": 4.82, "learning_rate": 1.0202565295045428e-06, "loss": 0.0008, "step": 23652 }, { "epoch": 4.82, "learning_rate": 1.0180006343819047e-06, "loss": 0.0022, "step": 23653 }, { "epoch": 4.82, "learning_rate": 1.0157472275398649e-06, "loss": 0.0012, "step": 23654 }, { "epoch": 4.82, "learning_rate": 1.013496309016093e-06, "loss": 0.0006, "step": 23655 }, { "epoch": 4.82, "learning_rate": 1.0112478788481425e-06, "loss": 0.0007, "step": 23656 }, { "epoch": 4.82, "learning_rate": 1.0090019370736003e-06, "loss": 0.0032, "step": 23657 }, { "epoch": 4.82, "learning_rate": 1.006758483729969e-06, "loss": 0.0011, "step": 23658 }, { "epoch": 4.82, "learning_rate": 1.0045175188547194e-06, "loss": 0.0002, "step": 23659 }, { "epoch": 4.82, "learning_rate": 1.0022790424852545e-06, "loss": 0.0014, "step": 23660 }, { "epoch": 4.82, "learning_rate": 1.000043054659011e-06, "loss": 0.0004, "step": 23661 }, { "epoch": 4.82, "learning_rate": 9.978095554132759e-07, "loss": 0.0025, "step": 23662 }, { "epoch": 4.82, "learning_rate": 9.955785447854193e-07, "loss": 0.0015, "step": 23663 }, { "epoch": 4.82, "learning_rate": 9.933500228126278e-07, "loss": 0.0036, "step": 23664 }, { "epoch": 4.82, "learning_rate": 9.911239895321887e-07, "loss": 0.0012, "step": 23665 }, { "epoch": 4.82, "learning_rate": 9.889004449812388e-07, "loss": 0.0019, "step": 23666 }, { "epoch": 4.82, "learning_rate": 9.866793891969482e-07, "loss": 0.0007, "step": 23667 }, { "epoch": 4.82, "learning_rate": 9.844608222163708e-07, "loss": 0.0001, "step": 23668 }, { "epoch": 4.82, "learning_rate": 9.822447440765936e-07, "loss": 0.0009, "step": 23669 }, { "epoch": 4.82, "learning_rate": 9.8003115481462e-07, "loss": 0.0004, "step": 23670 }, { "epoch": 4.82, "learning_rate": 9.778200544674208e-07, "loss": 0.0031, "step": 23671 }, { "epoch": 4.82, "learning_rate": 9.756114430719331e-07, "loss": 0.0, "step": 23672 }, { "epoch": 4.82, "learning_rate": 9.734053206650273e-07, "loss": 0.0007, "step": 23673 }, { "epoch": 4.82, "learning_rate": 9.712016872835737e-07, "loss": 0.0007, "step": 23674 }, { "epoch": 4.82, "learning_rate": 9.6900054296436e-07, "loss": 0.0001, "step": 23675 }, { "epoch": 4.82, "learning_rate": 9.668018877441398e-07, "loss": 0.0004, "step": 23676 }, { "epoch": 4.82, "learning_rate": 9.646057216596504e-07, "loss": 0.0001, "step": 23677 }, { "epoch": 4.82, "learning_rate": 9.624120447475959e-07, "loss": 0.0145, "step": 23678 }, { "epoch": 4.82, "learning_rate": 9.602208570445636e-07, "loss": 0.009, "step": 23679 }, { "epoch": 4.82, "learning_rate": 9.580321585871742e-07, "loss": 0.0016, "step": 23680 }, { "epoch": 4.82, "learning_rate": 9.558459494119985e-07, "loss": 0.0008, "step": 23681 }, { "epoch": 4.82, "learning_rate": 9.536622295555241e-07, "loss": 0.002, "step": 23682 }, { "epoch": 4.82, "learning_rate": 9.514809990542383e-07, "loss": 0.0075, "step": 23683 }, { "epoch": 4.82, "learning_rate": 9.493022579445619e-07, "loss": 0.0016, "step": 23684 }, { "epoch": 4.82, "learning_rate": 9.471260062629161e-07, "loss": 0.0001, "step": 23685 }, { "epoch": 4.82, "learning_rate": 9.449522440456047e-07, "loss": 0.0008, "step": 23686 }, { "epoch": 4.82, "learning_rate": 9.427809713289492e-07, "loss": 0.0006, "step": 23687 }, { "epoch": 4.82, "learning_rate": 9.406121881492201e-07, "loss": 0.0013, "step": 23688 }, { "epoch": 4.82, "learning_rate": 9.384458945426388e-07, "loss": 0.0032, "step": 23689 }, { "epoch": 4.82, "learning_rate": 9.362820905453927e-07, "loss": 0.0017, "step": 23690 }, { "epoch": 4.82, "learning_rate": 9.341207761936031e-07, "loss": 0.0046, "step": 23691 }, { "epoch": 4.82, "learning_rate": 9.319619515233745e-07, "loss": 0.0015, "step": 23692 }, { "epoch": 4.82, "learning_rate": 9.298056165707779e-07, "loss": 0.0005, "step": 23693 }, { "epoch": 4.82, "learning_rate": 9.276517713718013e-07, "loss": 0.0036, "step": 23694 }, { "epoch": 4.82, "learning_rate": 9.25500415962449e-07, "loss": 0.0061, "step": 23695 }, { "epoch": 4.82, "learning_rate": 9.233515503786426e-07, "loss": 0.0009, "step": 23696 }, { "epoch": 4.83, "learning_rate": 9.212051746562532e-07, "loss": 0.0021, "step": 23697 }, { "epoch": 4.83, "learning_rate": 9.190612888311521e-07, "loss": 0.0006, "step": 23698 }, { "epoch": 4.83, "learning_rate": 9.169198929391275e-07, "loss": 0.0, "step": 23699 }, { "epoch": 4.83, "learning_rate": 9.147809870159673e-07, "loss": 0.0027, "step": 23700 }, { "epoch": 4.83, "learning_rate": 9.126445710973929e-07, "loss": 0.0005, "step": 23701 }, { "epoch": 4.83, "learning_rate": 9.105106452190591e-07, "loss": 0.0038, "step": 23702 }, { "epoch": 4.83, "learning_rate": 9.083792094166209e-07, "loss": 0.0006, "step": 23703 }, { "epoch": 4.83, "learning_rate": 9.06250263725683e-07, "loss": 0.0004, "step": 23704 }, { "epoch": 4.83, "learning_rate": 9.041238081818003e-07, "loss": 0.0001, "step": 23705 }, { "epoch": 4.83, "learning_rate": 9.019998428204944e-07, "loss": 0.0001, "step": 23706 }, { "epoch": 4.83, "learning_rate": 8.99878367677237e-07, "loss": 0.0003, "step": 23707 }, { "epoch": 4.83, "learning_rate": 8.977593827874496e-07, "loss": 0.0031, "step": 23708 }, { "epoch": 4.83, "learning_rate": 8.956428881865374e-07, "loss": 0.0, "step": 23709 }, { "epoch": 4.83, "learning_rate": 8.935288839098221e-07, "loss": 0.0025, "step": 23710 }, { "epoch": 4.83, "learning_rate": 8.914173699926585e-07, "loss": 0.0031, "step": 23711 }, { "epoch": 4.83, "learning_rate": 8.893083464702689e-07, "loss": 0.0041, "step": 23712 }, { "epoch": 4.83, "learning_rate": 8.87201813377908e-07, "loss": 0.0005, "step": 23713 }, { "epoch": 4.83, "learning_rate": 8.850977707507478e-07, "loss": 0.0002, "step": 23714 }, { "epoch": 4.83, "learning_rate": 8.82996218623927e-07, "loss": 0.0005, "step": 23715 }, { "epoch": 4.83, "learning_rate": 8.808971570325507e-07, "loss": 0.0032, "step": 23716 }, { "epoch": 4.83, "learning_rate": 8.788005860116576e-07, "loss": 0.0011, "step": 23717 }, { "epoch": 4.83, "learning_rate": 8.767065055963029e-07, "loss": 0.0107, "step": 23718 }, { "epoch": 4.83, "learning_rate": 8.746149158214255e-07, "loss": 0.0044, "step": 23719 }, { "epoch": 4.83, "learning_rate": 8.725258167219807e-07, "loss": 0.0009, "step": 23720 }, { "epoch": 4.83, "learning_rate": 8.704392083328404e-07, "loss": 0.0, "step": 23721 }, { "epoch": 4.83, "learning_rate": 8.68355090688877e-07, "loss": 0.0021, "step": 23722 }, { "epoch": 4.83, "learning_rate": 8.662734638248958e-07, "loss": 0.0028, "step": 23723 }, { "epoch": 4.83, "learning_rate": 8.641943277756524e-07, "loss": 0.0009, "step": 23724 }, { "epoch": 4.83, "learning_rate": 8.621176825758691e-07, "loss": 0.0011, "step": 23725 }, { "epoch": 4.83, "learning_rate": 8.600435282602347e-07, "loss": 0.0001, "step": 23726 }, { "epoch": 4.83, "learning_rate": 8.579718648634215e-07, "loss": 0.0002, "step": 23727 }, { "epoch": 4.83, "learning_rate": 8.559026924199853e-07, "loss": 0.0001, "step": 23728 }, { "epoch": 4.83, "learning_rate": 8.538360109644982e-07, "loss": 0.0026, "step": 23729 }, { "epoch": 4.83, "learning_rate": 8.517718205314828e-07, "loss": 0.0001, "step": 23730 }, { "epoch": 4.83, "learning_rate": 8.497101211554281e-07, "loss": 0.0045, "step": 23731 }, { "epoch": 4.83, "learning_rate": 8.476509128707565e-07, "loss": 0.0003, "step": 23732 }, { "epoch": 4.83, "learning_rate": 8.455941957118573e-07, "loss": 0.0008, "step": 23733 }, { "epoch": 4.83, "learning_rate": 8.435399697130696e-07, "loss": 0.0028, "step": 23734 }, { "epoch": 4.83, "learning_rate": 8.414882349087326e-07, "loss": 0.001, "step": 23735 }, { "epoch": 4.83, "learning_rate": 8.394389913330857e-07, "loss": 0.0004, "step": 23736 }, { "epoch": 4.83, "learning_rate": 8.373922390203846e-07, "loss": 0.0021, "step": 23737 }, { "epoch": 4.83, "learning_rate": 8.353479780047856e-07, "loss": 0.0003, "step": 23738 }, { "epoch": 4.83, "learning_rate": 8.333062083204445e-07, "loss": 0.0015, "step": 23739 }, { "epoch": 4.83, "learning_rate": 8.312669300014674e-07, "loss": 0.0017, "step": 23740 }, { "epoch": 4.83, "learning_rate": 8.292301430819104e-07, "loss": 0.0012, "step": 23741 }, { "epoch": 4.83, "learning_rate": 8.271958475957796e-07, "loss": 0.0003, "step": 23742 }, { "epoch": 4.83, "learning_rate": 8.251640435770646e-07, "loss": 0.0024, "step": 23743 }, { "epoch": 4.83, "learning_rate": 8.231347310597047e-07, "loss": 0.0006, "step": 23744 }, { "epoch": 4.83, "learning_rate": 8.21107910077573e-07, "loss": 0.0012, "step": 23745 }, { "epoch": 4.84, "learning_rate": 8.190835806645424e-07, "loss": 0.0063, "step": 23746 }, { "epoch": 4.84, "learning_rate": 8.170617428544191e-07, "loss": 0.0006, "step": 23747 }, { "epoch": 4.84, "learning_rate": 8.150423966809594e-07, "loss": 0.006, "step": 23748 }, { "epoch": 4.84, "learning_rate": 8.130255421779031e-07, "loss": 0.0018, "step": 23749 }, { "epoch": 4.84, "learning_rate": 8.110111793789231e-07, "loss": 0.0012, "step": 23750 }, { "epoch": 4.84, "learning_rate": 8.089993083176927e-07, "loss": 0.0015, "step": 23751 }, { "epoch": 4.84, "learning_rate": 8.069899290277681e-07, "loss": 0.0073, "step": 23752 }, { "epoch": 4.84, "learning_rate": 8.049830415427395e-07, "loss": 0.0002, "step": 23753 }, { "epoch": 4.84, "learning_rate": 8.029786458961296e-07, "loss": 0.0028, "step": 23754 }, { "epoch": 4.84, "learning_rate": 8.009767421213953e-07, "loss": 0.0009, "step": 23755 }, { "epoch": 4.84, "learning_rate": 7.989773302519931e-07, "loss": 0.002, "step": 23756 }, { "epoch": 4.84, "learning_rate": 7.969804103212963e-07, "loss": 0.0001, "step": 23757 }, { "epoch": 4.84, "learning_rate": 7.949859823626614e-07, "loss": 0.0038, "step": 23758 }, { "epoch": 4.84, "learning_rate": 7.92994046409412e-07, "loss": 0.002, "step": 23759 }, { "epoch": 4.84, "learning_rate": 7.910046024948213e-07, "loss": 0.0002, "step": 23760 }, { "epoch": 4.84, "learning_rate": 7.890176506520796e-07, "loss": 0.0009, "step": 23761 }, { "epoch": 4.84, "learning_rate": 7.870331909144268e-07, "loss": 0.0005, "step": 23762 }, { "epoch": 4.84, "learning_rate": 7.850512233149697e-07, "loss": 0.0001, "step": 23763 }, { "epoch": 4.84, "learning_rate": 7.830717478868154e-07, "loss": 0.0035, "step": 23764 }, { "epoch": 4.84, "learning_rate": 7.810947646630373e-07, "loss": 0.0004, "step": 23765 }, { "epoch": 4.84, "learning_rate": 7.791202736766255e-07, "loss": 0.0032, "step": 23766 }, { "epoch": 4.84, "learning_rate": 7.771482749606039e-07, "loss": 0.0035, "step": 23767 }, { "epoch": 4.84, "learning_rate": 7.751787685478794e-07, "loss": 0.0018, "step": 23768 }, { "epoch": 4.84, "learning_rate": 7.732117544713423e-07, "loss": 0.0019, "step": 23769 }, { "epoch": 4.84, "learning_rate": 7.712472327638663e-07, "loss": 0.0002, "step": 23770 }, { "epoch": 4.84, "learning_rate": 7.69285203458242e-07, "loss": 0.0009, "step": 23771 }, { "epoch": 4.84, "learning_rate": 7.673256665872596e-07, "loss": 0.0003, "step": 23772 }, { "epoch": 4.84, "learning_rate": 7.653686221836264e-07, "loss": 0.0002, "step": 23773 }, { "epoch": 4.84, "learning_rate": 7.634140702800329e-07, "loss": 0.0001, "step": 23774 }, { "epoch": 4.84, "learning_rate": 7.614620109091363e-07, "loss": 0.0009, "step": 23775 }, { "epoch": 4.84, "learning_rate": 7.595124441035271e-07, "loss": 0.0066, "step": 23776 }, { "epoch": 4.84, "learning_rate": 7.575653698957629e-07, "loss": 0.0027, "step": 23777 }, { "epoch": 4.84, "learning_rate": 7.556207883183841e-07, "loss": 0.0019, "step": 23778 }, { "epoch": 4.84, "learning_rate": 7.536786994038479e-07, "loss": 0.0006, "step": 23779 }, { "epoch": 4.84, "learning_rate": 7.51739103184612e-07, "loss": 0.0003, "step": 23780 }, { "epoch": 4.84, "learning_rate": 7.498019996930505e-07, "loss": 0.0006, "step": 23781 }, { "epoch": 4.84, "learning_rate": 7.478673889615372e-07, "loss": 0.0009, "step": 23782 }, { "epoch": 4.84, "learning_rate": 7.459352710223631e-07, "loss": 0.0009, "step": 23783 }, { "epoch": 4.84, "learning_rate": 7.440056459078025e-07, "loss": 0.0088, "step": 23784 }, { "epoch": 4.84, "learning_rate": 7.420785136500961e-07, "loss": 0.0096, "step": 23785 }, { "epoch": 4.84, "learning_rate": 7.401538742814183e-07, "loss": 0.0005, "step": 23786 }, { "epoch": 4.84, "learning_rate": 7.382317278339267e-07, "loss": 0.0011, "step": 23787 }, { "epoch": 4.84, "learning_rate": 7.363120743397122e-07, "loss": 0.0009, "step": 23788 }, { "epoch": 4.84, "learning_rate": 7.343949138308325e-07, "loss": 0.0, "step": 23789 }, { "epoch": 4.84, "learning_rate": 7.324802463393287e-07, "loss": 0.0009, "step": 23790 }, { "epoch": 4.84, "learning_rate": 7.305680718971585e-07, "loss": 0.0023, "step": 23791 }, { "epoch": 4.84, "learning_rate": 7.286583905362631e-07, "loss": 0.0032, "step": 23792 }, { "epoch": 4.84, "learning_rate": 7.267512022885502e-07, "loss": 0.0045, "step": 23793 }, { "epoch": 4.84, "learning_rate": 7.248465071858611e-07, "loss": 0.0012, "step": 23794 }, { "epoch": 4.85, "learning_rate": 7.229443052600204e-07, "loss": 0.0047, "step": 23795 }, { "epoch": 4.85, "learning_rate": 7.210445965427858e-07, "loss": 0.0037, "step": 23796 }, { "epoch": 4.85, "learning_rate": 7.191473810658821e-07, "loss": 0.0003, "step": 23797 }, { "epoch": 4.85, "learning_rate": 7.172526588610339e-07, "loss": 0.0, "step": 23798 }, { "epoch": 4.85, "learning_rate": 7.153604299598159e-07, "loss": 0.0006, "step": 23799 }, { "epoch": 4.85, "learning_rate": 7.134706943939029e-07, "loss": 0.0001, "step": 23800 }, { "epoch": 4.85, "learning_rate": 7.115834521948194e-07, "loss": 0.0018, "step": 23801 }, { "epoch": 4.85, "learning_rate": 7.096987033940905e-07, "loss": 0.0001, "step": 23802 }, { "epoch": 4.85, "learning_rate": 7.078164480232074e-07, "loss": 0.0021, "step": 23803 }, { "epoch": 4.85, "learning_rate": 7.059366861135951e-07, "loss": 0.0013, "step": 23804 }, { "epoch": 4.85, "learning_rate": 7.040594176966452e-07, "loss": 0.0019, "step": 23805 }, { "epoch": 4.85, "learning_rate": 7.021846428037325e-07, "loss": 0.0002, "step": 23806 }, { "epoch": 4.85, "learning_rate": 7.003123614661487e-07, "loss": 0.0001, "step": 23807 }, { "epoch": 4.85, "learning_rate": 6.984425737151689e-07, "loss": 0.0003, "step": 23808 }, { "epoch": 4.85, "learning_rate": 6.965752795820179e-07, "loss": 0.0027, "step": 23809 }, { "epoch": 4.85, "learning_rate": 6.947104790979041e-07, "loss": 0.0009, "step": 23810 }, { "epoch": 4.85, "learning_rate": 6.928481722939527e-07, "loss": 0.0006, "step": 23811 }, { "epoch": 4.85, "learning_rate": 6.909883592012721e-07, "loss": 0.0002, "step": 23812 }, { "epoch": 4.85, "learning_rate": 6.891310398509375e-07, "loss": 0.0001, "step": 23813 }, { "epoch": 4.85, "learning_rate": 6.872762142739407e-07, "loss": 0.0002, "step": 23814 }, { "epoch": 4.85, "learning_rate": 6.854238825012904e-07, "loss": 0.0016, "step": 23815 }, { "epoch": 4.85, "learning_rate": 6.835740445639115e-07, "loss": 0.0013, "step": 23816 }, { "epoch": 4.85, "learning_rate": 6.817267004926962e-07, "loss": 0.0005, "step": 23817 }, { "epoch": 4.85, "learning_rate": 6.798818503185199e-07, "loss": 0.0006, "step": 23818 }, { "epoch": 4.85, "learning_rate": 6.780394940721578e-07, "loss": 0.0003, "step": 23819 }, { "epoch": 4.85, "learning_rate": 6.761996317844021e-07, "loss": 0.0016, "step": 23820 }, { "epoch": 4.85, "learning_rate": 6.743622634859946e-07, "loss": 0.0042, "step": 23821 }, { "epoch": 4.85, "learning_rate": 6.725273892075944e-07, "loss": 0.0001, "step": 23822 }, { "epoch": 4.85, "learning_rate": 6.706950089798768e-07, "loss": 0.0004, "step": 23823 }, { "epoch": 4.85, "learning_rate": 6.688651228334341e-07, "loss": 0.0013, "step": 23824 }, { "epoch": 4.85, "learning_rate": 6.670377307988084e-07, "loss": 0.0011, "step": 23825 }, { "epoch": 4.85, "learning_rate": 6.652128329065421e-07, "loss": 0.0026, "step": 23826 }, { "epoch": 4.85, "learning_rate": 6.633904291871272e-07, "loss": 0.0005, "step": 23827 }, { "epoch": 4.85, "learning_rate": 6.615705196709731e-07, "loss": 0.0018, "step": 23828 }, { "epoch": 4.85, "learning_rate": 6.597531043884885e-07, "loss": 0.0008, "step": 23829 }, { "epoch": 4.85, "learning_rate": 6.579381833700326e-07, "loss": 0.0036, "step": 23830 }, { "epoch": 4.85, "learning_rate": 6.561257566458978e-07, "loss": 0.0003, "step": 23831 }, { "epoch": 4.85, "learning_rate": 6.543158242463764e-07, "loss": 0.0024, "step": 23832 }, { "epoch": 4.85, "learning_rate": 6.525083862016945e-07, "loss": 0.0028, "step": 23833 }, { "epoch": 4.85, "learning_rate": 6.507034425420443e-07, "loss": 0.0002, "step": 23834 }, { "epoch": 4.85, "learning_rate": 6.489009932975519e-07, "loss": 0.0007, "step": 23835 }, { "epoch": 4.85, "learning_rate": 6.471010384983266e-07, "loss": 0.0001, "step": 23836 }, { "epoch": 4.85, "learning_rate": 6.453035781744443e-07, "loss": 0.0021, "step": 23837 }, { "epoch": 4.85, "learning_rate": 6.435086123559307e-07, "loss": 0.0002, "step": 23838 }, { "epoch": 4.85, "learning_rate": 6.417161410727456e-07, "loss": 0.0041, "step": 23839 }, { "epoch": 4.85, "learning_rate": 6.399261643548315e-07, "loss": 0.0008, "step": 23840 }, { "epoch": 4.85, "learning_rate": 6.381386822320811e-07, "loss": 0.0014, "step": 23841 }, { "epoch": 4.85, "learning_rate": 6.363536947343706e-07, "loss": 0.0031, "step": 23842 }, { "epoch": 4.85, "learning_rate": 6.345712018914762e-07, "loss": 0.0002, "step": 23843 }, { "epoch": 4.86, "learning_rate": 6.327912037332072e-07, "loss": 0.0018, "step": 23844 }, { "epoch": 4.86, "learning_rate": 6.310137002892734e-07, "loss": 0.0001, "step": 23845 }, { "epoch": 4.86, "learning_rate": 6.292386915893676e-07, "loss": 0.0029, "step": 23846 }, { "epoch": 4.86, "learning_rate": 6.274661776631162e-07, "loss": 0.0006, "step": 23847 }, { "epoch": 4.86, "learning_rate": 6.256961585401621e-07, "loss": 0.0184, "step": 23848 }, { "epoch": 4.86, "learning_rate": 6.239286342500316e-07, "loss": 0.0005, "step": 23849 }, { "epoch": 4.86, "learning_rate": 6.221636048222678e-07, "loss": 0.0011, "step": 23850 }, { "epoch": 4.86, "learning_rate": 6.204010702863471e-07, "loss": 0.0003, "step": 23851 }, { "epoch": 4.86, "learning_rate": 6.186410306716794e-07, "loss": 0.0, "step": 23852 }, { "epoch": 4.86, "learning_rate": 6.168834860077077e-07, "loss": 0.0005, "step": 23853 }, { "epoch": 4.86, "learning_rate": 6.151284363237585e-07, "loss": 0.0047, "step": 23854 }, { "epoch": 4.86, "learning_rate": 6.133758816491419e-07, "loss": 0.0033, "step": 23855 }, { "epoch": 4.86, "learning_rate": 6.116258220131343e-07, "loss": 0.0017, "step": 23856 }, { "epoch": 4.86, "learning_rate": 6.098782574449624e-07, "loss": 0.0109, "step": 23857 }, { "epoch": 4.86, "learning_rate": 6.081331879738194e-07, "loss": 0.0011, "step": 23858 }, { "epoch": 4.86, "learning_rate": 6.063906136288654e-07, "loss": 0.0029, "step": 23859 }, { "epoch": 4.86, "learning_rate": 6.046505344391772e-07, "loss": 0.0005, "step": 23860 }, { "epoch": 4.86, "learning_rate": 6.029129504338315e-07, "loss": 0.0026, "step": 23861 }, { "epoch": 4.86, "learning_rate": 6.011778616418384e-07, "loss": 0.0021, "step": 23862 }, { "epoch": 4.86, "learning_rate": 5.994452680921913e-07, "loss": 0.0002, "step": 23863 }, { "epoch": 4.86, "learning_rate": 5.977151698138172e-07, "loss": 0.0054, "step": 23864 }, { "epoch": 4.86, "learning_rate": 5.959875668356262e-07, "loss": 0.0016, "step": 23865 }, { "epoch": 4.86, "learning_rate": 5.94262459186462e-07, "loss": 0.0003, "step": 23866 }, { "epoch": 4.86, "learning_rate": 5.925398468951181e-07, "loss": 0.0018, "step": 23867 }, { "epoch": 4.86, "learning_rate": 5.908197299904049e-07, "loss": 0.0003, "step": 23868 }, { "epoch": 4.86, "learning_rate": 5.891021085010328e-07, "loss": 0.0015, "step": 23869 }, { "epoch": 4.86, "learning_rate": 5.873869824556787e-07, "loss": 0.0004, "step": 23870 }, { "epoch": 4.86, "learning_rate": 5.856743518830031e-07, "loss": 0.0008, "step": 23871 }, { "epoch": 4.86, "learning_rate": 5.839642168115999e-07, "loss": 0.001, "step": 23872 }, { "epoch": 4.86, "learning_rate": 5.82256577270046e-07, "loss": 0.0078, "step": 23873 }, { "epoch": 4.86, "learning_rate": 5.805514332868522e-07, "loss": 0.0065, "step": 23874 }, { "epoch": 4.86, "learning_rate": 5.788487848904955e-07, "loss": 0.0012, "step": 23875 }, { "epoch": 4.86, "learning_rate": 5.771486321094199e-07, "loss": 0.0024, "step": 23876 }, { "epoch": 4.86, "learning_rate": 5.754509749720193e-07, "loss": 0.0006, "step": 23877 }, { "epoch": 4.86, "learning_rate": 5.737558135066378e-07, "loss": 0.005, "step": 23878 }, { "epoch": 4.86, "learning_rate": 5.720631477415861e-07, "loss": 0.007, "step": 23879 }, { "epoch": 4.86, "learning_rate": 5.703729777051746e-07, "loss": 0.0001, "step": 23880 }, { "epoch": 4.86, "learning_rate": 5.686853034255811e-07, "loss": 0.0018, "step": 23881 }, { "epoch": 4.86, "learning_rate": 5.670001249310163e-07, "loss": 0.0001, "step": 23882 }, { "epoch": 4.86, "learning_rate": 5.653174422496243e-07, "loss": 0.001, "step": 23883 }, { "epoch": 4.86, "learning_rate": 5.636372554095159e-07, "loss": 0.0005, "step": 23884 }, { "epoch": 4.86, "learning_rate": 5.61959564438752e-07, "loss": 0.0017, "step": 23885 }, { "epoch": 4.86, "learning_rate": 5.602843693653436e-07, "loss": 0.0005, "step": 23886 }, { "epoch": 4.86, "learning_rate": 5.586116702172683e-07, "loss": 0.0005, "step": 23887 }, { "epoch": 4.86, "learning_rate": 5.569414670224703e-07, "loss": 0.0002, "step": 23888 }, { "epoch": 4.86, "learning_rate": 5.552737598088275e-07, "loss": 0.0022, "step": 23889 }, { "epoch": 4.86, "learning_rate": 5.536085486042341e-07, "loss": 0.0005, "step": 23890 }, { "epoch": 4.86, "learning_rate": 5.519458334364679e-07, "loss": 0.0001, "step": 23891 }, { "epoch": 4.86, "learning_rate": 5.502856143333068e-07, "loss": 0.001, "step": 23892 }, { "epoch": 4.87, "learning_rate": 5.486278913224951e-07, "loss": 0.0129, "step": 23893 }, { "epoch": 4.87, "learning_rate": 5.469726644316941e-07, "loss": 0.0053, "step": 23894 }, { "epoch": 4.87, "learning_rate": 5.453199336885649e-07, "loss": 0.0006, "step": 23895 }, { "epoch": 4.87, "learning_rate": 5.436696991207024e-07, "loss": 0.0005, "step": 23896 }, { "epoch": 4.87, "learning_rate": 5.420219607557008e-07, "loss": 0.0001, "step": 23897 }, { "epoch": 4.87, "learning_rate": 5.403767186210218e-07, "loss": 0.0001, "step": 23898 }, { "epoch": 4.87, "learning_rate": 5.387339727441931e-07, "loss": 0.0022, "step": 23899 }, { "epoch": 4.87, "learning_rate": 5.370937231526429e-07, "loss": 0.0025, "step": 23900 }, { "epoch": 4.87, "learning_rate": 5.354559698737493e-07, "loss": 0.0035, "step": 23901 }, { "epoch": 4.87, "learning_rate": 5.338207129348737e-07, "loss": 0.0003, "step": 23902 }, { "epoch": 4.87, "learning_rate": 5.321879523633277e-07, "loss": 0.004, "step": 23903 }, { "epoch": 4.87, "learning_rate": 5.305576881863894e-07, "loss": 0.0025, "step": 23904 }, { "epoch": 4.87, "learning_rate": 5.289299204312703e-07, "loss": 0.0014, "step": 23905 }, { "epoch": 4.87, "learning_rate": 5.27304649125182e-07, "loss": 0.0046, "step": 23906 }, { "epoch": 4.87, "learning_rate": 5.256818742952362e-07, "loss": 0.0006, "step": 23907 }, { "epoch": 4.87, "learning_rate": 5.240615959685778e-07, "loss": 0.001, "step": 23908 }, { "epoch": 4.87, "learning_rate": 5.224438141722353e-07, "loss": 0.0009, "step": 23909 }, { "epoch": 4.87, "learning_rate": 5.20828528933237e-07, "loss": 0.0005, "step": 23910 }, { "epoch": 4.87, "learning_rate": 5.192157402785779e-07, "loss": 0.0002, "step": 23911 }, { "epoch": 4.87, "learning_rate": 5.176054482351699e-07, "loss": 0.0016, "step": 23912 }, { "epoch": 4.87, "learning_rate": 5.159976528299248e-07, "loss": 0.0045, "step": 23913 }, { "epoch": 4.87, "learning_rate": 5.143923540896877e-07, "loss": 0.0033, "step": 23914 }, { "epoch": 4.87, "learning_rate": 5.127895520412706e-07, "loss": 0.001, "step": 23915 }, { "epoch": 4.87, "learning_rate": 5.11189246711452e-07, "loss": 0.0015, "step": 23916 }, { "epoch": 4.87, "learning_rate": 5.095914381269439e-07, "loss": 0.0021, "step": 23917 }, { "epoch": 4.87, "learning_rate": 5.079961263144417e-07, "loss": 0.0091, "step": 23918 }, { "epoch": 4.87, "learning_rate": 5.064033113005906e-07, "loss": 0.0001, "step": 23919 }, { "epoch": 4.87, "learning_rate": 5.048129931120027e-07, "loss": 0.003, "step": 23920 }, { "epoch": 4.87, "learning_rate": 5.032251717752233e-07, "loss": 0.0013, "step": 23921 }, { "epoch": 4.87, "learning_rate": 5.016398473167815e-07, "loss": 0.0004, "step": 23922 }, { "epoch": 4.87, "learning_rate": 5.00057019763156e-07, "loss": 0.0022, "step": 23923 }, { "epoch": 4.87, "learning_rate": 4.984766891407754e-07, "loss": 0.0019, "step": 23924 }, { "epoch": 4.87, "learning_rate": 4.968988554760356e-07, "loss": 0.0002, "step": 23925 }, { "epoch": 4.87, "learning_rate": 4.953235187952986e-07, "loss": 0.0007, "step": 23926 }, { "epoch": 4.87, "learning_rate": 4.937506791248435e-07, "loss": 0.0007, "step": 23927 }, { "epoch": 4.87, "learning_rate": 4.921803364909993e-07, "loss": 0.0015, "step": 23928 }, { "epoch": 4.87, "learning_rate": 4.906124909199449e-07, "loss": 0.0001, "step": 23929 }, { "epoch": 4.87, "learning_rate": 4.890471424378761e-07, "loss": 0.001, "step": 23930 }, { "epoch": 4.87, "learning_rate": 4.874842910709553e-07, "loss": 0.0004, "step": 23931 }, { "epoch": 4.87, "learning_rate": 4.85923936845245e-07, "loss": 0.0005, "step": 23932 }, { "epoch": 4.87, "learning_rate": 4.843660797868576e-07, "loss": 0.0016, "step": 23933 }, { "epoch": 4.87, "learning_rate": 4.82810719921789e-07, "loss": 0.0001, "step": 23934 }, { "epoch": 4.87, "learning_rate": 4.812578572760017e-07, "loss": 0.0001, "step": 23935 }, { "epoch": 4.87, "learning_rate": 4.797074918754584e-07, "loss": 0.0001, "step": 23936 }, { "epoch": 4.87, "learning_rate": 4.781596237460217e-07, "loss": 0.0025, "step": 23937 }, { "epoch": 4.87, "learning_rate": 4.766142529135708e-07, "loss": 0.0012, "step": 23938 }, { "epoch": 4.87, "learning_rate": 4.7507137940391847e-07, "loss": 0.0001, "step": 23939 }, { "epoch": 4.87, "learning_rate": 4.735310032428108e-07, "loss": 0.0008, "step": 23940 }, { "epoch": 4.87, "learning_rate": 4.7199312445597714e-07, "loss": 0.0034, "step": 23941 }, { "epoch": 4.88, "learning_rate": 4.704577430691303e-07, "loss": 0.0001, "step": 23942 }, { "epoch": 4.88, "learning_rate": 4.6892485910788314e-07, "loss": 0.0031, "step": 23943 }, { "epoch": 4.88, "learning_rate": 4.673944725978651e-07, "loss": 0.0004, "step": 23944 }, { "epoch": 4.88, "learning_rate": 4.658665835646058e-07, "loss": 0.0004, "step": 23945 }, { "epoch": 4.88, "learning_rate": 4.643411920336515e-07, "loss": 0.0002, "step": 23946 }, { "epoch": 4.88, "learning_rate": 4.628182980304651e-07, "loss": 0.0003, "step": 23947 }, { "epoch": 4.88, "learning_rate": 4.6129790158047633e-07, "loss": 0.0011, "step": 23948 }, { "epoch": 4.88, "learning_rate": 4.597800027090981e-07, "loss": 0.0005, "step": 23949 }, { "epoch": 4.88, "learning_rate": 4.5826460144167685e-07, "loss": 0.0038, "step": 23950 }, { "epoch": 4.88, "learning_rate": 4.567516978034924e-07, "loss": 0.0006, "step": 23951 }, { "epoch": 4.88, "learning_rate": 4.552412918198578e-07, "loss": 0.0001, "step": 23952 }, { "epoch": 4.88, "learning_rate": 4.5373338351596955e-07, "loss": 0.002, "step": 23953 }, { "epoch": 4.88, "learning_rate": 4.5222797291702415e-07, "loss": 0.0028, "step": 23954 }, { "epoch": 4.88, "learning_rate": 4.507250600481682e-07, "loss": 0.0016, "step": 23955 }, { "epoch": 4.88, "learning_rate": 4.4922464493449826e-07, "loss": 0.0002, "step": 23956 }, { "epoch": 4.88, "learning_rate": 4.4772672760107765e-07, "loss": 0.0029, "step": 23957 }, { "epoch": 4.88, "learning_rate": 4.46231308072903e-07, "loss": 0.0006, "step": 23958 }, { "epoch": 4.88, "learning_rate": 4.447383863749876e-07, "loss": 0.0001, "step": 23959 }, { "epoch": 4.88, "learning_rate": 4.4324796253222825e-07, "loss": 0.0059, "step": 23960 }, { "epoch": 4.88, "learning_rate": 4.4176003656955504e-07, "loss": 0.0002, "step": 23961 }, { "epoch": 4.88, "learning_rate": 4.4027460851178143e-07, "loss": 0.0012, "step": 23962 }, { "epoch": 4.88, "learning_rate": 4.387916783837542e-07, "loss": 0.0006, "step": 23963 }, { "epoch": 4.88, "learning_rate": 4.373112462102202e-07, "loss": 0.0032, "step": 23964 }, { "epoch": 4.88, "learning_rate": 4.35833312015893e-07, "loss": 0.0015, "step": 23965 }, { "epoch": 4.88, "learning_rate": 4.343578758254862e-07, "loss": 0.0006, "step": 23966 }, { "epoch": 4.88, "learning_rate": 4.328849376636134e-07, "loss": 0.0028, "step": 23967 }, { "epoch": 4.88, "learning_rate": 4.3141449755490497e-07, "loss": 0.0088, "step": 23968 }, { "epoch": 4.88, "learning_rate": 4.2994655552389126e-07, "loss": 0.001, "step": 23969 }, { "epoch": 4.88, "learning_rate": 4.284811115951192e-07, "loss": 0.0037, "step": 23970 }, { "epoch": 4.88, "learning_rate": 4.2701816579303606e-07, "loss": 0.0005, "step": 23971 }, { "epoch": 4.88, "learning_rate": 4.255577181421055e-07, "loss": 0.0025, "step": 23972 }, { "epoch": 4.88, "learning_rate": 4.2409976866669137e-07, "loss": 0.0033, "step": 23973 }, { "epoch": 4.88, "learning_rate": 4.2264431739115756e-07, "loss": 0.0002, "step": 23974 }, { "epoch": 4.88, "learning_rate": 4.211913643398013e-07, "loss": 0.0006, "step": 23975 }, { "epoch": 4.88, "learning_rate": 4.197409095369031e-07, "loss": 0.003, "step": 23976 }, { "epoch": 4.88, "learning_rate": 4.182929530066936e-07, "loss": 0.0007, "step": 23977 }, { "epoch": 4.88, "learning_rate": 4.168474947733369e-07, "loss": 0.0022, "step": 23978 }, { "epoch": 4.88, "learning_rate": 4.154045348609969e-07, "loss": 0.0031, "step": 23979 }, { "epoch": 4.88, "learning_rate": 4.1396407329375435e-07, "loss": 0.0007, "step": 23980 }, { "epoch": 4.88, "learning_rate": 4.125261100956734e-07, "loss": 0.0008, "step": 23981 }, { "epoch": 4.88, "learning_rate": 4.1109064529078474e-07, "loss": 0.0033, "step": 23982 }, { "epoch": 4.88, "learning_rate": 4.0965767890303593e-07, "loss": 0.0034, "step": 23983 }, { "epoch": 4.88, "learning_rate": 4.082272109563911e-07, "loss": 0.0109, "step": 23984 }, { "epoch": 4.88, "learning_rate": 4.0679924147469787e-07, "loss": 0.0046, "step": 23985 }, { "epoch": 4.88, "learning_rate": 4.053737704818705e-07, "loss": 0.0019, "step": 23986 }, { "epoch": 4.88, "learning_rate": 4.0395079800165653e-07, "loss": 0.0033, "step": 23987 }, { "epoch": 4.88, "learning_rate": 4.025303240578537e-07, "loss": 0.002, "step": 23988 }, { "epoch": 4.88, "learning_rate": 4.011123486741763e-07, "loss": 0.0017, "step": 23989 }, { "epoch": 4.88, "learning_rate": 3.9969687187432206e-07, "loss": 0.0016, "step": 23990 }, { "epoch": 4.89, "learning_rate": 3.9828389368192217e-07, "loss": 0.0025, "step": 23991 }, { "epoch": 4.89, "learning_rate": 3.9687341412055765e-07, "loss": 0.0003, "step": 23992 }, { "epoch": 4.89, "learning_rate": 3.9546543321380963e-07, "loss": 0.0009, "step": 23993 }, { "epoch": 4.89, "learning_rate": 3.940599509851927e-07, "loss": 0.0017, "step": 23994 }, { "epoch": 4.89, "learning_rate": 3.9265696745817143e-07, "loss": 0.0008, "step": 23995 }, { "epoch": 4.89, "learning_rate": 3.91256482656177e-07, "loss": 0.0045, "step": 23996 }, { "epoch": 4.89, "learning_rate": 3.8985849660262415e-07, "loss": 0.0019, "step": 23997 }, { "epoch": 4.89, "learning_rate": 3.884630093208274e-07, "loss": 0.0001, "step": 23998 }, { "epoch": 4.89, "learning_rate": 3.870700208341182e-07, "loss": 0.0001, "step": 23999 }, { "epoch": 4.89, "learning_rate": 3.856795311657446e-07, "loss": 0.0073, "step": 24000 }, { "epoch": 4.89, "learning_rate": 3.842915403389546e-07, "loss": 0.0032, "step": 24001 }, { "epoch": 4.89, "learning_rate": 3.829060483768964e-07, "loss": 0.0031, "step": 24002 }, { "epoch": 4.89, "learning_rate": 3.815230553027515e-07, "loss": 0.005, "step": 24003 }, { "epoch": 4.89, "learning_rate": 3.8014256113958477e-07, "loss": 0.0016, "step": 24004 }, { "epoch": 4.89, "learning_rate": 3.78764565910461e-07, "loss": 0.0023, "step": 24005 }, { "epoch": 4.89, "learning_rate": 3.773890696383952e-07, "loss": 0.0002, "step": 24006 }, { "epoch": 4.89, "learning_rate": 3.7601607234636897e-07, "loss": 0.003, "step": 24007 }, { "epoch": 4.89, "learning_rate": 3.74645574057314e-07, "loss": 0.0039, "step": 24008 }, { "epoch": 4.89, "learning_rate": 3.732775747941119e-07, "loss": 0.004, "step": 24009 }, { "epoch": 4.89, "learning_rate": 3.719120745796278e-07, "loss": 0.0009, "step": 24010 }, { "epoch": 4.89, "learning_rate": 3.7054907343664344e-07, "loss": 0.0002, "step": 24011 }, { "epoch": 4.89, "learning_rate": 3.6918857138794055e-07, "loss": 0.0005, "step": 24012 }, { "epoch": 4.89, "learning_rate": 3.6783056845623437e-07, "loss": 0.0011, "step": 24013 }, { "epoch": 4.89, "learning_rate": 3.6647506466420673e-07, "loss": 0.0032, "step": 24014 }, { "epoch": 4.89, "learning_rate": 3.651220600344895e-07, "loss": 0.0009, "step": 24015 }, { "epoch": 4.89, "learning_rate": 3.63771554589698e-07, "loss": 0.0001, "step": 24016 }, { "epoch": 4.89, "learning_rate": 3.6242354835238073e-07, "loss": 0.0006, "step": 24017 }, { "epoch": 4.89, "learning_rate": 3.6107804134505315e-07, "loss": 0.0, "step": 24018 }, { "epoch": 4.89, "learning_rate": 3.5973503359018053e-07, "loss": 0.0003, "step": 24019 }, { "epoch": 4.89, "learning_rate": 3.583945251102116e-07, "loss": 0.0033, "step": 24020 }, { "epoch": 4.89, "learning_rate": 3.5705651592751183e-07, "loss": 0.0035, "step": 24021 }, { "epoch": 4.89, "learning_rate": 3.5572100606444667e-07, "loss": 0.0003, "step": 24022 }, { "epoch": 4.89, "learning_rate": 3.5438799554329823e-07, "loss": 0.0041, "step": 24023 }, { "epoch": 4.89, "learning_rate": 3.530574843863654e-07, "loss": 0.0014, "step": 24024 }, { "epoch": 4.89, "learning_rate": 3.517294726158304e-07, "loss": 0.0041, "step": 24025 }, { "epoch": 4.89, "learning_rate": 3.504039602539088e-07, "loss": 0.0005, "step": 24026 }, { "epoch": 4.89, "learning_rate": 3.4908094732273294e-07, "loss": 0.0007, "step": 24027 }, { "epoch": 4.89, "learning_rate": 3.4776043384438514e-07, "loss": 0.0006, "step": 24028 }, { "epoch": 4.89, "learning_rate": 3.4644241984091436e-07, "loss": 0.0003, "step": 24029 }, { "epoch": 4.89, "learning_rate": 3.4512690533435304e-07, "loss": 0.0004, "step": 24030 }, { "epoch": 4.89, "learning_rate": 3.4381389034666696e-07, "loss": 0.0014, "step": 24031 }, { "epoch": 4.89, "learning_rate": 3.425033748997885e-07, "loss": 0.0005, "step": 24032 }, { "epoch": 4.89, "learning_rate": 3.4119535901560024e-07, "loss": 0.0027, "step": 24033 }, { "epoch": 4.89, "learning_rate": 3.3988984271595133e-07, "loss": 0.0045, "step": 24034 }, { "epoch": 4.89, "learning_rate": 3.3858682602264097e-07, "loss": 0.0006, "step": 24035 }, { "epoch": 4.89, "learning_rate": 3.3728630895743514e-07, "loss": 0.0008, "step": 24036 }, { "epoch": 4.89, "learning_rate": 3.3598829154206644e-07, "loss": 0.0004, "step": 24037 }, { "epoch": 4.89, "learning_rate": 3.346927737981842e-07, "loss": 0.0005, "step": 24038 }, { "epoch": 4.89, "learning_rate": 3.33399755747471e-07, "loss": 0.0002, "step": 24039 }, { "epoch": 4.9, "learning_rate": 3.3210923741147644e-07, "loss": 0.0004, "step": 24040 }, { "epoch": 4.9, "learning_rate": 3.3082121881178316e-07, "loss": 0.0076, "step": 24041 }, { "epoch": 4.9, "learning_rate": 3.2953569996990724e-07, "loss": 0.0001, "step": 24042 }, { "epoch": 4.9, "learning_rate": 3.282526809072983e-07, "loss": 0.0002, "step": 24043 }, { "epoch": 4.9, "learning_rate": 3.269721616453891e-07, "loss": 0.001, "step": 24044 }, { "epoch": 4.9, "learning_rate": 3.2569414220557923e-07, "loss": 0.0003, "step": 24045 }, { "epoch": 4.9, "learning_rate": 3.2441862260921825e-07, "loss": 0.0016, "step": 24046 }, { "epoch": 4.9, "learning_rate": 3.231456028775725e-07, "loss": 0.0011, "step": 24047 }, { "epoch": 4.9, "learning_rate": 3.218750830319583e-07, "loss": 0.0016, "step": 24048 }, { "epoch": 4.9, "learning_rate": 3.2060706309355865e-07, "loss": 0.0032, "step": 24049 }, { "epoch": 4.9, "learning_rate": 3.1934154308355666e-07, "loss": 0.0003, "step": 24050 }, { "epoch": 4.9, "learning_rate": 3.1807852302308534e-07, "loss": 0.0027, "step": 24051 }, { "epoch": 4.9, "learning_rate": 3.168180029332612e-07, "loss": 0.0001, "step": 24052 }, { "epoch": 4.9, "learning_rate": 3.155599828351174e-07, "loss": 0.0015, "step": 24053 }, { "epoch": 4.9, "learning_rate": 3.1430446274967047e-07, "loss": 0.0012, "step": 24054 }, { "epoch": 4.9, "learning_rate": 3.130514426979036e-07, "loss": 0.0042, "step": 24055 }, { "epoch": 4.9, "learning_rate": 3.118009227007168e-07, "loss": 0.0004, "step": 24056 }, { "epoch": 4.9, "learning_rate": 3.105529027790099e-07, "loss": 0.0004, "step": 24057 }, { "epoch": 4.9, "learning_rate": 3.09307382953633e-07, "loss": 0.0014, "step": 24058 }, { "epoch": 4.9, "learning_rate": 3.080643632453861e-07, "loss": 0.0003, "step": 24059 }, { "epoch": 4.9, "learning_rate": 3.068238436750359e-07, "loss": 0.0031, "step": 24060 }, { "epoch": 4.9, "learning_rate": 3.055858242632825e-07, "loss": 0.0004, "step": 24061 }, { "epoch": 4.9, "learning_rate": 3.043503050308094e-07, "loss": 0.0047, "step": 24062 }, { "epoch": 4.9, "learning_rate": 3.031172859982667e-07, "loss": 0.0004, "step": 24063 }, { "epoch": 4.9, "learning_rate": 3.018867671862213e-07, "loss": 0.0004, "step": 24064 }, { "epoch": 4.9, "learning_rate": 3.006587486152734e-07, "loss": 0.0003, "step": 24065 }, { "epoch": 4.9, "learning_rate": 2.994332303058733e-07, "loss": 0.0018, "step": 24066 }, { "epoch": 4.9, "learning_rate": 2.9821021227853794e-07, "loss": 0.0001, "step": 24067 }, { "epoch": 4.9, "learning_rate": 2.969896945536676e-07, "loss": 0.0084, "step": 24068 }, { "epoch": 4.9, "learning_rate": 2.9577167715164606e-07, "loss": 0.0055, "step": 24069 }, { "epoch": 4.9, "learning_rate": 2.945561600928237e-07, "loss": 0.0011, "step": 24070 }, { "epoch": 4.9, "learning_rate": 2.933431433975175e-07, "loss": 0.0002, "step": 24071 }, { "epoch": 4.9, "learning_rate": 2.921326270859614e-07, "loss": 0.0001, "step": 24072 }, { "epoch": 4.9, "learning_rate": 2.909246111783725e-07, "loss": 0.0019, "step": 24073 }, { "epoch": 4.9, "learning_rate": 2.89719095694968e-07, "loss": 0.0001, "step": 24074 }, { "epoch": 4.9, "learning_rate": 2.8851608065583174e-07, "loss": 0.0011, "step": 24075 }, { "epoch": 4.9, "learning_rate": 2.873155660810811e-07, "loss": 0.0013, "step": 24076 }, { "epoch": 4.9, "learning_rate": 2.861175519907499e-07, "loss": 0.0018, "step": 24077 }, { "epoch": 4.9, "learning_rate": 2.849220384048889e-07, "loss": 0.0018, "step": 24078 }, { "epoch": 4.9, "learning_rate": 2.8372902534341545e-07, "loss": 0.0002, "step": 24079 }, { "epoch": 4.9, "learning_rate": 2.8253851282628026e-07, "loss": 0.0007, "step": 24080 }, { "epoch": 4.9, "learning_rate": 2.813505008733674e-07, "loss": 0.0033, "step": 24081 }, { "epoch": 4.9, "learning_rate": 2.8016498950451107e-07, "loss": 0.0027, "step": 24082 }, { "epoch": 4.9, "learning_rate": 2.7898197873952864e-07, "loss": 0.0002, "step": 24083 }, { "epoch": 4.9, "learning_rate": 2.7780146859815444e-07, "loss": 0.0011, "step": 24084 }, { "epoch": 4.9, "learning_rate": 2.7662345910012263e-07, "loss": 0.0045, "step": 24085 }, { "epoch": 4.9, "learning_rate": 2.754479502651008e-07, "loss": 0.0022, "step": 24086 }, { "epoch": 4.9, "learning_rate": 2.7427494211272326e-07, "loss": 0.004, "step": 24087 }, { "epoch": 4.9, "learning_rate": 2.731044346625744e-07, "loss": 0.0009, "step": 24088 }, { "epoch": 4.9, "learning_rate": 2.7193642793422175e-07, "loss": 0.0007, "step": 24089 }, { "epoch": 4.91, "learning_rate": 2.707709219471499e-07, "loss": 0.0043, "step": 24090 }, { "epoch": 4.91, "learning_rate": 2.6960791672084314e-07, "loss": 0.0021, "step": 24091 }, { "epoch": 4.91, "learning_rate": 2.6844741227471934e-07, "loss": 0.0026, "step": 24092 }, { "epoch": 4.91, "learning_rate": 2.6728940862816295e-07, "loss": 0.0003, "step": 24093 }, { "epoch": 4.91, "learning_rate": 2.6613390580052517e-07, "loss": 0.0009, "step": 24094 }, { "epoch": 4.91, "learning_rate": 2.6498090381107394e-07, "loss": 0.0003, "step": 24095 }, { "epoch": 4.91, "learning_rate": 2.638304026790938e-07, "loss": 0.0003, "step": 24096 }, { "epoch": 4.91, "learning_rate": 2.6268240242380277e-07, "loss": 0.0018, "step": 24097 }, { "epoch": 4.91, "learning_rate": 2.6153690306435215e-07, "loss": 0.001, "step": 24098 }, { "epoch": 4.91, "learning_rate": 2.6039390461989327e-07, "loss": 0.0061, "step": 24099 }, { "epoch": 4.91, "learning_rate": 2.5925340710951095e-07, "loss": 0.0001, "step": 24100 }, { "epoch": 4.91, "learning_rate": 2.581154105522398e-07, "loss": 0.0036, "step": 24101 }, { "epoch": 4.91, "learning_rate": 2.5697991496711476e-07, "loss": 0.0027, "step": 24102 }, { "epoch": 4.91, "learning_rate": 2.558469203730873e-07, "loss": 0.0026, "step": 24103 }, { "epoch": 4.91, "learning_rate": 2.547164267890589e-07, "loss": 0.004, "step": 24104 }, { "epoch": 4.91, "learning_rate": 2.535884342339478e-07, "loss": 0.0098, "step": 24105 }, { "epoch": 4.91, "learning_rate": 2.524629427265723e-07, "loss": 0.0005, "step": 24106 }, { "epoch": 4.91, "learning_rate": 2.5133995228573403e-07, "loss": 0.0006, "step": 24107 }, { "epoch": 4.91, "learning_rate": 2.5021946293018456e-07, "loss": 0.0039, "step": 24108 }, { "epoch": 4.91, "learning_rate": 2.491014746786424e-07, "loss": 0.0, "step": 24109 }, { "epoch": 4.91, "learning_rate": 2.4798598754977583e-07, "loss": 0.0004, "step": 24110 }, { "epoch": 4.91, "learning_rate": 2.4687300156223667e-07, "loss": 0.0001, "step": 24111 }, { "epoch": 4.91, "learning_rate": 2.4576251673459337e-07, "loss": 0.0009, "step": 24112 }, { "epoch": 4.91, "learning_rate": 2.4465453308538107e-07, "loss": 0.0004, "step": 24113 }, { "epoch": 4.91, "learning_rate": 2.4354905063313503e-07, "loss": 0.0094, "step": 24114 }, { "epoch": 4.91, "learning_rate": 2.4244606939630706e-07, "loss": 0.0001, "step": 24115 }, { "epoch": 4.91, "learning_rate": 2.4134558939331585e-07, "loss": 0.0003, "step": 24116 }, { "epoch": 4.91, "learning_rate": 2.402476106425466e-07, "loss": 0.0026, "step": 24117 }, { "epoch": 4.91, "learning_rate": 2.3915213316231806e-07, "loss": 0.0011, "step": 24118 }, { "epoch": 4.91, "learning_rate": 2.380591569709489e-07, "loss": 0.0002, "step": 24119 }, { "epoch": 4.91, "learning_rate": 2.3696868208669117e-07, "loss": 0.0021, "step": 24120 }, { "epoch": 4.91, "learning_rate": 2.3588070852776364e-07, "loss": 0.0006, "step": 24121 }, { "epoch": 4.91, "learning_rate": 2.3479523631231845e-07, "loss": 0.0025, "step": 24122 }, { "epoch": 4.91, "learning_rate": 2.3371226545849108e-07, "loss": 0.0001, "step": 24123 }, { "epoch": 4.91, "learning_rate": 2.326317959843671e-07, "loss": 0.0015, "step": 24124 }, { "epoch": 4.91, "learning_rate": 2.3155382790801537e-07, "loss": 0.0014, "step": 24125 }, { "epoch": 4.91, "learning_rate": 2.3047836124740482e-07, "loss": 0.0003, "step": 24126 }, { "epoch": 4.91, "learning_rate": 2.2940539602053776e-07, "loss": 0.0069, "step": 24127 }, { "epoch": 4.91, "learning_rate": 2.283349322452832e-07, "loss": 0.0037, "step": 24128 }, { "epoch": 4.91, "learning_rate": 2.2726696993957682e-07, "loss": 0.0083, "step": 24129 }, { "epoch": 4.91, "learning_rate": 2.2620150912122102e-07, "loss": 0.0025, "step": 24130 }, { "epoch": 4.91, "learning_rate": 2.251385498080016e-07, "loss": 0.0008, "step": 24131 }, { "epoch": 4.91, "learning_rate": 2.2407809201770433e-07, "loss": 0.0006, "step": 24132 }, { "epoch": 4.91, "learning_rate": 2.2302013576801502e-07, "loss": 0.0017, "step": 24133 }, { "epoch": 4.91, "learning_rate": 2.2196468107663623e-07, "loss": 0.0007, "step": 24134 }, { "epoch": 4.91, "learning_rate": 2.2091172796115386e-07, "loss": 0.0002, "step": 24135 }, { "epoch": 4.91, "learning_rate": 2.198612764391705e-07, "loss": 0.0004, "step": 24136 }, { "epoch": 4.91, "learning_rate": 2.188133265282388e-07, "loss": 0.0004, "step": 24137 }, { "epoch": 4.91, "learning_rate": 2.177678782458614e-07, "loss": 0.0021, "step": 24138 }, { "epoch": 4.92, "learning_rate": 2.16724931609491e-07, "loss": 0.0054, "step": 24139 }, { "epoch": 4.92, "learning_rate": 2.1568448663654704e-07, "loss": 0.0234, "step": 24140 }, { "epoch": 4.92, "learning_rate": 2.1464654334441555e-07, "loss": 0.0067, "step": 24141 }, { "epoch": 4.92, "learning_rate": 2.1361110175043272e-07, "loss": 0.0014, "step": 24142 }, { "epoch": 4.92, "learning_rate": 2.1257816187186805e-07, "loss": 0.0015, "step": 24143 }, { "epoch": 4.92, "learning_rate": 2.115477237260077e-07, "loss": 0.0002, "step": 24144 }, { "epoch": 4.92, "learning_rate": 2.1051978733003795e-07, "loss": 0.0006, "step": 24145 }, { "epoch": 4.92, "learning_rate": 2.09494352701145e-07, "loss": 0.0001, "step": 24146 }, { "epoch": 4.92, "learning_rate": 2.084714198564319e-07, "loss": 0.0001, "step": 24147 }, { "epoch": 4.92, "learning_rate": 2.0745098881301825e-07, "loss": 0.0003, "step": 24148 }, { "epoch": 4.92, "learning_rate": 2.0643305958790713e-07, "loss": 0.0008, "step": 24149 }, { "epoch": 4.92, "learning_rate": 2.0541763219811824e-07, "loss": 0.0005, "step": 24150 }, { "epoch": 4.92, "learning_rate": 2.0440470666062135e-07, "loss": 0.0006, "step": 24151 }, { "epoch": 4.92, "learning_rate": 2.0339428299231963e-07, "loss": 0.0006, "step": 24152 }, { "epoch": 4.92, "learning_rate": 2.0238636121009954e-07, "loss": 0.0003, "step": 24153 }, { "epoch": 4.92, "learning_rate": 2.0138094133079762e-07, "loss": 0.0012, "step": 24154 }, { "epoch": 4.92, "learning_rate": 2.0037802337118381e-07, "loss": 0.0001, "step": 24155 }, { "epoch": 4.92, "learning_rate": 1.99377607348028e-07, "loss": 0.0006, "step": 24156 }, { "epoch": 4.92, "learning_rate": 1.983796932780335e-07, "loss": 0.0007, "step": 24157 }, { "epoch": 4.92, "learning_rate": 1.973842811778703e-07, "loss": 0.0001, "step": 24158 }, { "epoch": 4.92, "learning_rate": 1.9639137106417513e-07, "loss": 0.0017, "step": 24159 }, { "epoch": 4.92, "learning_rate": 1.9540096295350137e-07, "loss": 0.005, "step": 24160 }, { "epoch": 4.92, "learning_rate": 1.9441305686241914e-07, "loss": 0.0005, "step": 24161 }, { "epoch": 4.92, "learning_rate": 1.934276528073986e-07, "loss": 0.0013, "step": 24162 }, { "epoch": 4.92, "learning_rate": 1.9244475080494316e-07, "loss": 0.001, "step": 24163 }, { "epoch": 4.92, "learning_rate": 1.914643508714231e-07, "loss": 0.0047, "step": 24164 }, { "epoch": 4.92, "learning_rate": 1.9048645302324195e-07, "loss": 0.0023, "step": 24165 }, { "epoch": 4.92, "learning_rate": 1.8951105727670335e-07, "loss": 0.0009, "step": 24166 }, { "epoch": 4.92, "learning_rate": 1.8853816364814424e-07, "loss": 0.0012, "step": 24167 }, { "epoch": 4.92, "learning_rate": 1.875677721537683e-07, "loss": 0.0004, "step": 24168 }, { "epoch": 4.92, "learning_rate": 1.8659988280981253e-07, "loss": 0.0015, "step": 24169 }, { "epoch": 4.92, "learning_rate": 1.8563449563241407e-07, "loss": 0.0164, "step": 24170 }, { "epoch": 4.92, "learning_rate": 1.8467161063772662e-07, "loss": 0.0024, "step": 24171 }, { "epoch": 4.92, "learning_rate": 1.8371122784182068e-07, "loss": 0.0028, "step": 24172 }, { "epoch": 4.92, "learning_rate": 1.8275334726073343e-07, "loss": 0.0024, "step": 24173 }, { "epoch": 4.92, "learning_rate": 1.8179796891046871e-07, "loss": 0.0008, "step": 24174 }, { "epoch": 4.92, "learning_rate": 1.8084509280698046e-07, "loss": 0.0001, "step": 24175 }, { "epoch": 4.92, "learning_rate": 1.7989471896618922e-07, "loss": 0.0024, "step": 24176 }, { "epoch": 4.92, "learning_rate": 1.7894684740394905e-07, "loss": 0.0075, "step": 24177 }, { "epoch": 4.92, "learning_rate": 1.7800147813609722e-07, "loss": 0.0016, "step": 24178 }, { "epoch": 4.92, "learning_rate": 1.7705861117843778e-07, "loss": 0.0009, "step": 24179 }, { "epoch": 4.92, "learning_rate": 1.7611824654672478e-07, "loss": 0.0014, "step": 24180 }, { "epoch": 4.92, "learning_rate": 1.7518038425662907e-07, "loss": 0.0002, "step": 24181 }, { "epoch": 4.92, "learning_rate": 1.7424502432383802e-07, "loss": 0.0009, "step": 24182 }, { "epoch": 4.92, "learning_rate": 1.7331216676398918e-07, "loss": 0.002, "step": 24183 }, { "epoch": 4.92, "learning_rate": 1.723818115926201e-07, "loss": 0.0074, "step": 24184 }, { "epoch": 4.92, "learning_rate": 1.714539588253183e-07, "loss": 0.0056, "step": 24185 }, { "epoch": 4.92, "learning_rate": 1.7052860847753813e-07, "loss": 0.0001, "step": 24186 }, { "epoch": 4.92, "learning_rate": 1.6960576056476715e-07, "loss": 0.0002, "step": 24187 }, { "epoch": 4.93, "learning_rate": 1.6868541510239308e-07, "loss": 0.0014, "step": 24188 }, { "epoch": 4.93, "learning_rate": 1.677675721058036e-07, "loss": 0.0007, "step": 24189 }, { "epoch": 4.93, "learning_rate": 1.668522315903198e-07, "loss": 0.0005, "step": 24190 }, { "epoch": 4.93, "learning_rate": 1.6593939357124607e-07, "loss": 0.0017, "step": 24191 }, { "epoch": 4.93, "learning_rate": 1.6502905806380362e-07, "loss": 0.0004, "step": 24192 }, { "epoch": 4.93, "learning_rate": 1.6412122508321356e-07, "loss": 0.0062, "step": 24193 }, { "epoch": 4.93, "learning_rate": 1.6321589464464714e-07, "loss": 0.0008, "step": 24194 }, { "epoch": 4.93, "learning_rate": 1.6231306676319223e-07, "loss": 0.0006, "step": 24195 }, { "epoch": 4.93, "learning_rate": 1.6141274145395344e-07, "loss": 0.0027, "step": 24196 }, { "epoch": 4.93, "learning_rate": 1.6051491873196876e-07, "loss": 0.0039, "step": 24197 }, { "epoch": 4.93, "learning_rate": 1.5961959861222617e-07, "loss": 0.0012, "step": 24198 }, { "epoch": 4.93, "learning_rate": 1.587267811096804e-07, "loss": 0.0005, "step": 24199 }, { "epoch": 4.93, "learning_rate": 1.5783646623923618e-07, "loss": 0.0013, "step": 24200 }, { "epoch": 4.93, "learning_rate": 1.5694865401576495e-07, "loss": 0.001, "step": 24201 }, { "epoch": 4.93, "learning_rate": 1.5606334445412148e-07, "loss": 0.0017, "step": 24202 }, { "epoch": 4.93, "learning_rate": 1.5518053756906067e-07, "loss": 0.0009, "step": 24203 }, { "epoch": 4.93, "learning_rate": 1.5430023337532072e-07, "loss": 0.0026, "step": 24204 }, { "epoch": 4.93, "learning_rate": 1.534224318876398e-07, "loss": 0.0001, "step": 24205 }, { "epoch": 4.93, "learning_rate": 1.5254713312065625e-07, "loss": 0.0002, "step": 24206 }, { "epoch": 4.93, "learning_rate": 1.5167433708899168e-07, "loss": 0.0025, "step": 24207 }, { "epoch": 4.93, "learning_rate": 1.5080404380721777e-07, "loss": 0.0008, "step": 24208 }, { "epoch": 4.93, "learning_rate": 1.4993625328988955e-07, "loss": 0.0001, "step": 24209 }, { "epoch": 4.93, "learning_rate": 1.490709655514788e-07, "loss": 0.0077, "step": 24210 }, { "epoch": 4.93, "learning_rate": 1.4820818060644056e-07, "loss": 0.0057, "step": 24211 }, { "epoch": 4.93, "learning_rate": 1.473478984691967e-07, "loss": 0.0029, "step": 24212 }, { "epoch": 4.93, "learning_rate": 1.46490119154119e-07, "loss": 0.002, "step": 24213 }, { "epoch": 4.93, "learning_rate": 1.4563484267551272e-07, "loss": 0.0002, "step": 24214 }, { "epoch": 4.93, "learning_rate": 1.4478206904768308e-07, "loss": 0.0001, "step": 24215 }, { "epoch": 4.93, "learning_rate": 1.4393179828486867e-07, "loss": 0.0002, "step": 24216 }, { "epoch": 4.93, "learning_rate": 1.430840304012415e-07, "loss": 0.0002, "step": 24217 }, { "epoch": 4.93, "learning_rate": 1.4223876541100688e-07, "loss": 0.003, "step": 24218 }, { "epoch": 4.93, "learning_rate": 1.4139600332827018e-07, "loss": 0.0006, "step": 24219 }, { "epoch": 4.93, "learning_rate": 1.405557441670868e-07, "loss": 0.0001, "step": 24220 }, { "epoch": 4.93, "learning_rate": 1.3971798794149558e-07, "loss": 0.0004, "step": 24221 }, { "epoch": 4.93, "learning_rate": 1.3888273466550193e-07, "loss": 0.0028, "step": 24222 }, { "epoch": 4.93, "learning_rate": 1.380499843530447e-07, "loss": 0.0011, "step": 24223 }, { "epoch": 4.93, "learning_rate": 1.3721973701804612e-07, "loss": 0.0002, "step": 24224 }, { "epoch": 4.93, "learning_rate": 1.3639199267436173e-07, "loss": 0.0009, "step": 24225 }, { "epoch": 4.93, "learning_rate": 1.3556675133581384e-07, "loss": 0.0001, "step": 24226 }, { "epoch": 4.93, "learning_rate": 1.3474401301619143e-07, "loss": 0.0017, "step": 24227 }, { "epoch": 4.93, "learning_rate": 1.3392377772923347e-07, "loss": 0.0007, "step": 24228 }, { "epoch": 4.93, "learning_rate": 1.3310604548864566e-07, "loss": 0.0003, "step": 24229 }, { "epoch": 4.93, "learning_rate": 1.322908163080838e-07, "loss": 0.0014, "step": 24230 }, { "epoch": 4.93, "learning_rate": 1.3147809020115364e-07, "loss": 0.0019, "step": 24231 }, { "epoch": 4.93, "learning_rate": 1.306678671814443e-07, "loss": 0.0003, "step": 24232 }, { "epoch": 4.93, "learning_rate": 1.2986014726246163e-07, "loss": 0.0009, "step": 24233 }, { "epoch": 4.93, "learning_rate": 1.2905493045772818e-07, "loss": 0.0015, "step": 24234 }, { "epoch": 4.93, "learning_rate": 1.282522167806832e-07, "loss": 0.0001, "step": 24235 }, { "epoch": 4.93, "learning_rate": 1.2745200624471596e-07, "loss": 0.0029, "step": 24236 }, { "epoch": 4.94, "learning_rate": 1.2665429886321576e-07, "loss": 0.002, "step": 24237 }, { "epoch": 4.94, "learning_rate": 1.2585909464948862e-07, "loss": 0.0065, "step": 24238 }, { "epoch": 4.94, "learning_rate": 1.250663936168239e-07, "loss": 0.0009, "step": 24239 }, { "epoch": 4.94, "learning_rate": 1.2427619577846104e-07, "loss": 0.0049, "step": 24240 }, { "epoch": 4.94, "learning_rate": 1.2348850114760612e-07, "loss": 0.0012, "step": 24241 }, { "epoch": 4.94, "learning_rate": 1.2270330973738196e-07, "loss": 0.0008, "step": 24242 }, { "epoch": 4.94, "learning_rate": 1.2192062156094474e-07, "loss": 0.0017, "step": 24243 }, { "epoch": 4.94, "learning_rate": 1.21140436631334e-07, "loss": 0.0029, "step": 24244 }, { "epoch": 4.94, "learning_rate": 1.2036275496160597e-07, "loss": 0.0057, "step": 24245 }, { "epoch": 4.94, "learning_rate": 1.1958757656473362e-07, "loss": 0.0036, "step": 24246 }, { "epoch": 4.94, "learning_rate": 1.1881490145367322e-07, "loss": 0.0001, "step": 24247 }, { "epoch": 4.94, "learning_rate": 1.1804472964131451e-07, "loss": 0.0016, "step": 24248 }, { "epoch": 4.94, "learning_rate": 1.1727706114053048e-07, "loss": 0.0038, "step": 24249 }, { "epoch": 4.94, "learning_rate": 1.1651189596416088e-07, "loss": 0.0001, "step": 24250 }, { "epoch": 4.94, "learning_rate": 1.1574923412494553e-07, "loss": 0.0016, "step": 24251 }, { "epoch": 4.94, "learning_rate": 1.1498907563565751e-07, "loss": 0.0018, "step": 24252 }, { "epoch": 4.94, "learning_rate": 1.142314205089867e-07, "loss": 0.001, "step": 24253 }, { "epoch": 4.94, "learning_rate": 1.1347626875755633e-07, "loss": 0.0003, "step": 24254 }, { "epoch": 4.94, "learning_rate": 1.1272362039402294e-07, "loss": 0.0001, "step": 24255 }, { "epoch": 4.94, "learning_rate": 1.119734754309265e-07, "loss": 0.0067, "step": 24256 }, { "epoch": 4.94, "learning_rate": 1.1122583388082363e-07, "loss": 0.0003, "step": 24257 }, { "epoch": 4.94, "learning_rate": 1.1048069575617102e-07, "loss": 0.0006, "step": 24258 }, { "epoch": 4.94, "learning_rate": 1.097380610694254e-07, "loss": 0.0002, "step": 24259 }, { "epoch": 4.94, "learning_rate": 1.089979298329935e-07, "loss": 0.0009, "step": 24260 }, { "epoch": 4.94, "learning_rate": 1.0826030205924874e-07, "loss": 0.0019, "step": 24261 }, { "epoch": 4.94, "learning_rate": 1.075251777604813e-07, "loss": 0.0004, "step": 24262 }, { "epoch": 4.94, "learning_rate": 1.0679255694899802e-07, "loss": 0.0025, "step": 24263 }, { "epoch": 4.94, "learning_rate": 1.0606243963700579e-07, "loss": 0.0001, "step": 24264 }, { "epoch": 4.94, "learning_rate": 1.0533482583672814e-07, "loss": 0.0025, "step": 24265 }, { "epoch": 4.94, "learning_rate": 1.0460971556030539e-07, "loss": 0.0028, "step": 24266 }, { "epoch": 4.94, "learning_rate": 1.0388710881984452e-07, "loss": 0.0002, "step": 24267 }, { "epoch": 4.94, "learning_rate": 1.031670056274192e-07, "loss": 0.0029, "step": 24268 }, { "epoch": 4.94, "learning_rate": 1.0244940599505314e-07, "loss": 0.0032, "step": 24269 }, { "epoch": 4.94, "learning_rate": 1.0173430993473675e-07, "loss": 0.0058, "step": 24270 }, { "epoch": 4.94, "learning_rate": 1.0102171745841048e-07, "loss": 0.0043, "step": 24271 }, { "epoch": 4.94, "learning_rate": 1.0031162857796482e-07, "loss": 0.0017, "step": 24272 }, { "epoch": 4.94, "learning_rate": 9.960404330529026e-08, "loss": 0.0027, "step": 24273 }, { "epoch": 4.94, "learning_rate": 9.889896165217737e-08, "loss": 0.0028, "step": 24274 }, { "epoch": 4.94, "learning_rate": 9.819638363040005e-08, "loss": 0.0011, "step": 24275 }, { "epoch": 4.94, "learning_rate": 9.749630925171558e-08, "loss": 0.0015, "step": 24276 }, { "epoch": 4.94, "learning_rate": 9.679873852779796e-08, "loss": 0.0, "step": 24277 }, { "epoch": 4.94, "learning_rate": 9.61036714703045e-08, "loss": 0.0027, "step": 24278 }, { "epoch": 4.94, "learning_rate": 9.541110809084263e-08, "loss": 0.0002, "step": 24279 }, { "epoch": 4.94, "learning_rate": 9.472104840098637e-08, "loss": 0.0034, "step": 24280 }, { "epoch": 4.94, "learning_rate": 9.403349241224322e-08, "loss": 0.0, "step": 24281 }, { "epoch": 4.94, "learning_rate": 9.334844013612063e-08, "loss": 0.0016, "step": 24282 }, { "epoch": 4.94, "learning_rate": 9.26658915840428e-08, "loss": 0.0001, "step": 24283 }, { "epoch": 4.94, "learning_rate": 9.198584676741727e-08, "loss": 0.0001, "step": 24284 }, { "epoch": 4.94, "learning_rate": 9.130830569758496e-08, "loss": 0.0005, "step": 24285 }, { "epoch": 4.95, "learning_rate": 9.06332683858868e-08, "loss": 0.0039, "step": 24286 }, { "epoch": 4.95, "learning_rate": 8.996073484359711e-08, "loss": 0.0083, "step": 24287 }, { "epoch": 4.95, "learning_rate": 8.92907050819236e-08, "loss": 0.0032, "step": 24288 }, { "epoch": 4.95, "learning_rate": 8.862317911207395e-08, "loss": 0.0024, "step": 24289 }, { "epoch": 4.95, "learning_rate": 8.795815694520591e-08, "loss": 0.0002, "step": 24290 }, { "epoch": 4.95, "learning_rate": 8.729563859241062e-08, "loss": 0.0035, "step": 24291 }, { "epoch": 4.95, "learning_rate": 8.66356240647459e-08, "loss": 0.0002, "step": 24292 }, { "epoch": 4.95, "learning_rate": 8.597811337326954e-08, "loss": 0.0027, "step": 24293 }, { "epoch": 4.95, "learning_rate": 8.532310652892282e-08, "loss": 0.0006, "step": 24294 }, { "epoch": 4.95, "learning_rate": 8.467060354268029e-08, "loss": 0.0009, "step": 24295 }, { "epoch": 4.95, "learning_rate": 8.402060442541658e-08, "loss": 0.0004, "step": 24296 }, { "epoch": 4.95, "learning_rate": 8.337310918798967e-08, "loss": 0.0001, "step": 24297 }, { "epoch": 4.95, "learning_rate": 8.272811784122425e-08, "loss": 0.0018, "step": 24298 }, { "epoch": 4.95, "learning_rate": 8.208563039587834e-08, "loss": 0.0018, "step": 24299 }, { "epoch": 4.95, "learning_rate": 8.144564686271004e-08, "loss": 0.0049, "step": 24300 }, { "epoch": 4.95, "learning_rate": 8.080816725237749e-08, "loss": 0.0003, "step": 24301 }, { "epoch": 4.95, "learning_rate": 8.017319157555546e-08, "loss": 0.0015, "step": 24302 }, { "epoch": 4.95, "learning_rate": 7.954071984281885e-08, "loss": 0.0002, "step": 24303 }, { "epoch": 4.95, "learning_rate": 7.891075206475916e-08, "loss": 0.0018, "step": 24304 }, { "epoch": 4.95, "learning_rate": 7.828328825186803e-08, "loss": 0.0045, "step": 24305 }, { "epoch": 4.95, "learning_rate": 7.76583284146537e-08, "loss": 0.0023, "step": 24306 }, { "epoch": 4.95, "learning_rate": 7.703587256355781e-08, "loss": 0.0029, "step": 24307 }, { "epoch": 4.95, "learning_rate": 7.641592070893876e-08, "loss": 0.0005, "step": 24308 }, { "epoch": 4.95, "learning_rate": 7.579847286118824e-08, "loss": 0.0029, "step": 24309 }, { "epoch": 4.95, "learning_rate": 7.518352903061465e-08, "loss": 0.0012, "step": 24310 }, { "epoch": 4.95, "learning_rate": 7.45710892274598e-08, "loss": 0.007, "step": 24311 }, { "epoch": 4.95, "learning_rate": 7.396115346198217e-08, "loss": 0.0008, "step": 24312 }, { "epoch": 4.95, "learning_rate": 7.335372174435694e-08, "loss": 0.001, "step": 24313 }, { "epoch": 4.95, "learning_rate": 7.2748794084726e-08, "loss": 0.0002, "step": 24314 }, { "epoch": 4.95, "learning_rate": 7.214637049321459e-08, "loss": 0.0004, "step": 24315 }, { "epoch": 4.95, "learning_rate": 7.154645097984802e-08, "loss": 0.0026, "step": 24316 }, { "epoch": 4.95, "learning_rate": 7.094903555466824e-08, "loss": 0.0005, "step": 24317 }, { "epoch": 4.95, "learning_rate": 7.035412422766728e-08, "loss": 0.0, "step": 24318 }, { "epoch": 4.95, "learning_rate": 6.976171700875388e-08, "loss": 0.0009, "step": 24319 }, { "epoch": 4.95, "learning_rate": 6.917181390783677e-08, "loss": 0.0021, "step": 24320 }, { "epoch": 4.95, "learning_rate": 6.858441493475808e-08, "loss": 0.0091, "step": 24321 }, { "epoch": 4.95, "learning_rate": 6.799952009932664e-08, "loss": 0.0003, "step": 24322 }, { "epoch": 4.95, "learning_rate": 6.74171294113346e-08, "loss": 0.0001, "step": 24323 }, { "epoch": 4.95, "learning_rate": 6.683724288049086e-08, "loss": 0.0003, "step": 24324 }, { "epoch": 4.95, "learning_rate": 6.625986051648768e-08, "loss": 0.001, "step": 24325 }, { "epoch": 4.95, "learning_rate": 6.568498232896736e-08, "loss": 0.0015, "step": 24326 }, { "epoch": 4.95, "learning_rate": 6.511260832752219e-08, "loss": 0.0004, "step": 24327 }, { "epoch": 4.95, "learning_rate": 6.454273852171122e-08, "loss": 0.0077, "step": 24328 }, { "epoch": 4.95, "learning_rate": 6.39753729210768e-08, "loss": 0.0058, "step": 24329 }, { "epoch": 4.95, "learning_rate": 6.341051153506138e-08, "loss": 0.003, "step": 24330 }, { "epoch": 4.95, "learning_rate": 6.284815437312407e-08, "loss": 0.002, "step": 24331 }, { "epoch": 4.95, "learning_rate": 6.228830144465735e-08, "loss": 0.0036, "step": 24332 }, { "epoch": 4.95, "learning_rate": 6.17309527589871e-08, "loss": 0.0002, "step": 24333 }, { "epoch": 4.95, "learning_rate": 6.117610832543918e-08, "loss": 0.0067, "step": 24334 }, { "epoch": 4.96, "learning_rate": 6.06237681532895e-08, "loss": 0.0001, "step": 24335 }, { "epoch": 4.96, "learning_rate": 6.007393225176404e-08, "loss": 0.0008, "step": 24336 }, { "epoch": 4.96, "learning_rate": 5.9526600630022126e-08, "loss": 0.0024, "step": 24337 }, { "epoch": 4.96, "learning_rate": 5.898177329720643e-08, "loss": 0.0032, "step": 24338 }, { "epoch": 4.96, "learning_rate": 5.843945026244301e-08, "loss": 0.0025, "step": 24339 }, { "epoch": 4.96, "learning_rate": 5.7899631534774616e-08, "loss": 0.0007, "step": 24340 }, { "epoch": 4.96, "learning_rate": 5.736231712321071e-08, "loss": 0.0006, "step": 24341 }, { "epoch": 4.96, "learning_rate": 5.68275070367441e-08, "loss": 0.0001, "step": 24342 }, { "epoch": 4.96, "learning_rate": 5.629520128430098e-08, "loss": 0.0029, "step": 24343 }, { "epoch": 4.96, "learning_rate": 5.576539987475759e-08, "loss": 0.0011, "step": 24344 }, { "epoch": 4.96, "learning_rate": 5.523810281695684e-08, "loss": 0.0007, "step": 24345 }, { "epoch": 4.96, "learning_rate": 5.4713310119741674e-08, "loss": 0.0001, "step": 24346 }, { "epoch": 4.96, "learning_rate": 5.4191021791855086e-08, "loss": 0.0001, "step": 24347 }, { "epoch": 4.96, "learning_rate": 5.367123784200678e-08, "loss": 0.0006, "step": 24348 }, { "epoch": 4.96, "learning_rate": 5.315395827890645e-08, "loss": 0.0004, "step": 24349 }, { "epoch": 4.96, "learning_rate": 5.2639183111163884e-08, "loss": 0.0007, "step": 24350 }, { "epoch": 4.96, "learning_rate": 5.2126912347405513e-08, "loss": 0.0004, "step": 24351 }, { "epoch": 4.96, "learning_rate": 5.16171459961745e-08, "loss": 0.0027, "step": 24352 }, { "epoch": 4.96, "learning_rate": 5.110988406598071e-08, "loss": 0.0103, "step": 24353 }, { "epoch": 4.96, "learning_rate": 5.060512656530069e-08, "loss": 0.0051, "step": 24354 }, { "epoch": 4.96, "learning_rate": 5.0102873502577686e-08, "loss": 0.0021, "step": 24355 }, { "epoch": 4.96, "learning_rate": 4.9603124886171684e-08, "loss": 0.0003, "step": 24356 }, { "epoch": 4.96, "learning_rate": 4.910588072444266e-08, "loss": 0.0032, "step": 24357 }, { "epoch": 4.96, "learning_rate": 4.861114102571728e-08, "loss": 0.0017, "step": 24358 }, { "epoch": 4.96, "learning_rate": 4.8118905798222305e-08, "loss": 0.0002, "step": 24359 }, { "epoch": 4.96, "learning_rate": 4.7629175050201143e-08, "loss": 0.0004, "step": 24360 }, { "epoch": 4.96, "learning_rate": 4.714194878981392e-08, "loss": 0.0055, "step": 24361 }, { "epoch": 4.96, "learning_rate": 4.665722702523744e-08, "loss": 0.0002, "step": 24362 }, { "epoch": 4.96, "learning_rate": 4.617500976451527e-08, "loss": 0.001, "step": 24363 }, { "epoch": 4.96, "learning_rate": 4.5695297015757584e-08, "loss": 0.0011, "step": 24364 }, { "epoch": 4.96, "learning_rate": 4.521808878692468e-08, "loss": 0.0018, "step": 24365 }, { "epoch": 4.96, "learning_rate": 4.4743385086010167e-08, "loss": 0.0017, "step": 24366 }, { "epoch": 4.96, "learning_rate": 4.4271185920957684e-08, "loss": 0.0027, "step": 24367 }, { "epoch": 4.96, "learning_rate": 4.3801491299627625e-08, "loss": 0.0003, "step": 24368 }, { "epoch": 4.96, "learning_rate": 4.333430122988035e-08, "loss": 0.0008, "step": 24369 }, { "epoch": 4.96, "learning_rate": 4.286961571950964e-08, "loss": 0.0015, "step": 24370 }, { "epoch": 4.96, "learning_rate": 4.240743477627595e-08, "loss": 0.0003, "step": 24371 }, { "epoch": 4.96, "learning_rate": 4.1947758407906426e-08, "loss": 0.0005, "step": 24372 }, { "epoch": 4.96, "learning_rate": 4.149058662207827e-08, "loss": 0.0035, "step": 24373 }, { "epoch": 4.96, "learning_rate": 4.103591942641871e-08, "loss": 0.0044, "step": 24374 }, { "epoch": 4.96, "learning_rate": 4.058375682852166e-08, "loss": 0.0001, "step": 24375 }, { "epoch": 4.96, "learning_rate": 4.013409883596441e-08, "loss": 0.0006, "step": 24376 }, { "epoch": 4.96, "learning_rate": 3.968694545622431e-08, "loss": 0.0002, "step": 24377 }, { "epoch": 4.96, "learning_rate": 3.9242296696778696e-08, "loss": 0.0061, "step": 24378 }, { "epoch": 4.96, "learning_rate": 3.8800152565054977e-08, "loss": 0.0003, "step": 24379 }, { "epoch": 4.96, "learning_rate": 3.836051306844723e-08, "loss": 0.0054, "step": 24380 }, { "epoch": 4.96, "learning_rate": 3.7923378214299583e-08, "loss": 0.0009, "step": 24381 }, { "epoch": 4.96, "learning_rate": 3.7488748009889545e-08, "loss": 0.0021, "step": 24382 }, { "epoch": 4.96, "learning_rate": 3.705662246251129e-08, "loss": 0.0002, "step": 24383 }, { "epoch": 4.97, "learning_rate": 3.6627001579342397e-08, "loss": 0.0018, "step": 24384 }, { "epoch": 4.97, "learning_rate": 3.619988536759377e-08, "loss": 0.0024, "step": 24385 }, { "epoch": 4.97, "learning_rate": 3.5775273834376394e-08, "loss": 0.0072, "step": 24386 }, { "epoch": 4.97, "learning_rate": 3.535316698678459e-08, "loss": 0.0, "step": 24387 }, { "epoch": 4.97, "learning_rate": 3.493356483187937e-08, "loss": 0.0014, "step": 24388 }, { "epoch": 4.97, "learning_rate": 3.4516467376655146e-08, "loss": 0.0001, "step": 24389 }, { "epoch": 4.97, "learning_rate": 3.410187462810632e-08, "loss": 0.0036, "step": 24390 }, { "epoch": 4.97, "learning_rate": 3.3689786593110724e-08, "loss": 0.0023, "step": 24391 }, { "epoch": 4.97, "learning_rate": 3.328020327859615e-08, "loss": 0.0012, "step": 24392 }, { "epoch": 4.97, "learning_rate": 3.287312469137382e-08, "loss": 0.0002, "step": 24393 }, { "epoch": 4.97, "learning_rate": 3.2468550838254946e-08, "loss": 0.0002, "step": 24394 }, { "epoch": 4.97, "learning_rate": 3.2066481726000795e-08, "loss": 0.0052, "step": 24395 }, { "epoch": 4.97, "learning_rate": 3.1666917361322654e-08, "loss": 0.0002, "step": 24396 }, { "epoch": 4.97, "learning_rate": 3.126985775088187e-08, "loss": 0.006, "step": 24397 }, { "epoch": 4.97, "learning_rate": 3.087530290132312e-08, "loss": 0.0014, "step": 24398 }, { "epoch": 4.97, "learning_rate": 3.048325281924113e-08, "loss": 0.0011, "step": 24399 }, { "epoch": 4.97, "learning_rate": 3.009370751118068e-08, "loss": 0.0017, "step": 24400 }, { "epoch": 4.97, "learning_rate": 2.9706666983619897e-08, "loss": 0.0003, "step": 24401 }, { "epoch": 4.97, "learning_rate": 2.9322131243070257e-08, "loss": 0.0124, "step": 24402 }, { "epoch": 4.97, "learning_rate": 2.894010029592664e-08, "loss": 0.0, "step": 24403 }, { "epoch": 4.97, "learning_rate": 2.8560574148567273e-08, "loss": 0.0007, "step": 24404 }, { "epoch": 4.97, "learning_rate": 2.8183552807337085e-08, "loss": 0.0001, "step": 24405 }, { "epoch": 4.97, "learning_rate": 2.7809036278531038e-08, "loss": 0.0044, "step": 24406 }, { "epoch": 4.97, "learning_rate": 2.7437024568410794e-08, "loss": 0.0001, "step": 24407 }, { "epoch": 4.97, "learning_rate": 2.7067517683188045e-08, "loss": 0.0002, "step": 24408 }, { "epoch": 4.97, "learning_rate": 2.6700515629024533e-08, "loss": 0.0001, "step": 24409 }, { "epoch": 4.97, "learning_rate": 2.633601841206534e-08, "loss": 0.0008, "step": 24410 }, { "epoch": 4.97, "learning_rate": 2.597402603838894e-08, "loss": 0.0012, "step": 24411 }, { "epoch": 4.97, "learning_rate": 2.5614538514040496e-08, "loss": 0.0038, "step": 24412 }, { "epoch": 4.97, "learning_rate": 2.5257555845031862e-08, "loss": 0.002, "step": 24413 }, { "epoch": 4.97, "learning_rate": 2.4903078037308287e-08, "loss": 0.003, "step": 24414 }, { "epoch": 4.97, "learning_rate": 2.4551105096798362e-08, "loss": 0.0024, "step": 24415 }, { "epoch": 4.97, "learning_rate": 2.420163702939737e-08, "loss": 0.0016, "step": 24416 }, { "epoch": 4.97, "learning_rate": 2.3854673840917326e-08, "loss": 0.0042, "step": 24417 }, { "epoch": 4.97, "learning_rate": 2.3510215537170252e-08, "loss": 0.0002, "step": 24418 }, { "epoch": 4.97, "learning_rate": 2.3168262123901548e-08, "loss": 0.0004, "step": 24419 }, { "epoch": 4.97, "learning_rate": 2.282881360683997e-08, "loss": 0.0023, "step": 24420 }, { "epoch": 4.97, "learning_rate": 2.2491869991614343e-08, "loss": 0.0003, "step": 24421 }, { "epoch": 4.97, "learning_rate": 2.2157431283886808e-08, "loss": 0.0042, "step": 24422 }, { "epoch": 4.97, "learning_rate": 2.1825497489236233e-08, "loss": 0.0001, "step": 24423 }, { "epoch": 4.97, "learning_rate": 2.1496068613208183e-08, "loss": 0.0024, "step": 24424 }, { "epoch": 4.97, "learning_rate": 2.1169144661281612e-08, "loss": 0.0007, "step": 24425 }, { "epoch": 4.97, "learning_rate": 2.084472563895212e-08, "loss": 0.0054, "step": 24426 }, { "epoch": 4.97, "learning_rate": 2.052281155161539e-08, "loss": 0.0001, "step": 24427 }, { "epoch": 4.97, "learning_rate": 2.020340240465046e-08, "loss": 0.0011, "step": 24428 }, { "epoch": 4.97, "learning_rate": 1.9886498203403044e-08, "loss": 0.0032, "step": 24429 }, { "epoch": 4.97, "learning_rate": 1.957209895315226e-08, "loss": 0.0001, "step": 24430 }, { "epoch": 4.97, "learning_rate": 1.926020465916056e-08, "loss": 0.003, "step": 24431 }, { "epoch": 4.97, "learning_rate": 1.8950815326640445e-08, "loss": 0.0037, "step": 24432 }, { "epoch": 4.98, "learning_rate": 1.8643930960737795e-08, "loss": 0.0004, "step": 24433 }, { "epoch": 4.98, "learning_rate": 1.8339551566598497e-08, "loss": 0.0013, "step": 24434 }, { "epoch": 4.98, "learning_rate": 1.8037677149285168e-08, "loss": 0.0005, "step": 24435 }, { "epoch": 4.98, "learning_rate": 1.7738307713877077e-08, "loss": 0.0014, "step": 24436 }, { "epoch": 4.98, "learning_rate": 1.7441443265336918e-08, "loss": 0.0021, "step": 24437 }, { "epoch": 4.98, "learning_rate": 1.7147083808627393e-08, "loss": 0.0003, "step": 24438 }, { "epoch": 4.98, "learning_rate": 1.6855229348694544e-08, "loss": 0.0001, "step": 24439 }, { "epoch": 4.98, "learning_rate": 1.6565879890384493e-08, "loss": 0.0003, "step": 24440 }, { "epoch": 4.98, "learning_rate": 1.6279035438526712e-08, "loss": 0.0021, "step": 24441 }, { "epoch": 4.98, "learning_rate": 1.5994695997934015e-08, "loss": 0.0015, "step": 24442 }, { "epoch": 4.98, "learning_rate": 1.5712861573335954e-08, "loss": 0.0069, "step": 24443 }, { "epoch": 4.98, "learning_rate": 1.543353216946208e-08, "loss": 0.0051, "step": 24444 }, { "epoch": 4.98, "learning_rate": 1.515670779095868e-08, "loss": 0.0008, "step": 24445 }, { "epoch": 4.98, "learning_rate": 1.4882388442455373e-08, "loss": 0.0002, "step": 24446 }, { "epoch": 4.98, "learning_rate": 1.4610574128531837e-08, "loss": 0.0061, "step": 24447 }, { "epoch": 4.98, "learning_rate": 1.4341264853734436e-08, "loss": 0.0033, "step": 24448 }, { "epoch": 4.98, "learning_rate": 1.4074460622542915e-08, "loss": 0.005, "step": 24449 }, { "epoch": 4.98, "learning_rate": 1.3810161439437028e-08, "loss": 0.0012, "step": 24450 }, { "epoch": 4.98, "learning_rate": 1.3548367308813257e-08, "loss": 0.0013, "step": 24451 }, { "epoch": 4.98, "learning_rate": 1.3289078235068085e-08, "loss": 0.0018, "step": 24452 }, { "epoch": 4.98, "learning_rate": 1.3032294222498074e-08, "loss": 0.0025, "step": 24453 }, { "epoch": 4.98, "learning_rate": 1.2778015275416442e-08, "loss": 0.001, "step": 24454 }, { "epoch": 4.98, "learning_rate": 1.2526241398053138e-08, "loss": 0.0018, "step": 24455 }, { "epoch": 4.98, "learning_rate": 1.2276972594638112e-08, "loss": 0.0005, "step": 24456 }, { "epoch": 4.98, "learning_rate": 1.2030208869301395e-08, "loss": 0.0065, "step": 24457 }, { "epoch": 4.98, "learning_rate": 1.1785950226189666e-08, "loss": 0.0005, "step": 24458 }, { "epoch": 4.98, "learning_rate": 1.1544196669382999e-08, "loss": 0.0037, "step": 24459 }, { "epoch": 4.98, "learning_rate": 1.1304948202911501e-08, "loss": 0.0046, "step": 24460 }, { "epoch": 4.98, "learning_rate": 1.1068204830771977e-08, "loss": 0.0023, "step": 24461 }, { "epoch": 4.98, "learning_rate": 1.0833966556911266e-08, "loss": 0.0005, "step": 24462 }, { "epoch": 4.98, "learning_rate": 1.0602233385242909e-08, "loss": 0.0001, "step": 24463 }, { "epoch": 4.98, "learning_rate": 1.0373005319647132e-08, "loss": 0.0015, "step": 24464 }, { "epoch": 4.98, "learning_rate": 1.0146282363954206e-08, "loss": 0.004, "step": 24465 }, { "epoch": 4.98, "learning_rate": 9.92206452194444e-09, "loss": 0.0001, "step": 24466 }, { "epoch": 4.98, "learning_rate": 9.700351797348182e-09, "loss": 0.0014, "step": 24467 }, { "epoch": 4.98, "learning_rate": 9.481144193895785e-09, "loss": 0.0001, "step": 24468 }, { "epoch": 4.98, "learning_rate": 9.264441715234327e-09, "loss": 0.003, "step": 24469 }, { "epoch": 4.98, "learning_rate": 9.050244364977588e-09, "loss": 0.001, "step": 24470 }, { "epoch": 4.98, "learning_rate": 8.838552146706035e-09, "loss": 0.0006, "step": 24471 }, { "epoch": 4.98, "learning_rate": 8.629365063966831e-09, "loss": 0.0001, "step": 24472 }, { "epoch": 4.98, "learning_rate": 8.422683120257179e-09, "loss": 0.0011, "step": 24473 }, { "epoch": 4.98, "learning_rate": 8.218506318991013e-09, "loss": 0.0004, "step": 24474 }, { "epoch": 4.98, "learning_rate": 8.016834663632232e-09, "loss": 0.0002, "step": 24475 }, { "epoch": 4.98, "learning_rate": 7.817668157511503e-09, "loss": 0.001, "step": 24476 }, { "epoch": 4.98, "learning_rate": 7.621006803959495e-09, "loss": 0.0004, "step": 24477 }, { "epoch": 4.98, "learning_rate": 7.4268506062735715e-09, "loss": 0.0004, "step": 24478 }, { "epoch": 4.98, "learning_rate": 7.2351995676844795e-09, "loss": 0.0006, "step": 24479 }, { "epoch": 4.98, "learning_rate": 7.046053691406317e-09, "loss": 0.0001, "step": 24480 }, { "epoch": 4.98, "learning_rate": 6.8594129805865646e-09, "loss": 0.0011, "step": 24481 }, { "epoch": 4.99, "learning_rate": 6.6752774383560525e-09, "loss": 0.0021, "step": 24482 }, { "epoch": 4.99, "learning_rate": 6.493647067778995e-09, "loss": 0.0024, "step": 24483 }, { "epoch": 4.99, "learning_rate": 6.314521871886302e-09, "loss": 0.0039, "step": 24484 }, { "epoch": 4.99, "learning_rate": 6.137901853658922e-09, "loss": 0.0072, "step": 24485 }, { "epoch": 4.99, "learning_rate": 5.963787016077803e-09, "loss": 0.0003, "step": 24486 }, { "epoch": 4.99, "learning_rate": 5.792177362040629e-09, "loss": 0.0001, "step": 24487 }, { "epoch": 4.99, "learning_rate": 5.6230728943951195e-09, "loss": 0.0004, "step": 24488 }, { "epoch": 4.99, "learning_rate": 5.456473615988999e-09, "loss": 0.0063, "step": 24489 }, { "epoch": 4.99, "learning_rate": 5.292379529586721e-09, "loss": 0.0003, "step": 24490 }, { "epoch": 4.99, "learning_rate": 5.130790637952742e-09, "loss": 0.0025, "step": 24491 }, { "epoch": 4.99, "learning_rate": 4.971706943751597e-09, "loss": 0.0025, "step": 24492 }, { "epoch": 4.99, "learning_rate": 4.815128449664474e-09, "loss": 0.0003, "step": 24493 }, { "epoch": 4.99, "learning_rate": 4.6610551583059486e-09, "loss": 0.0024, "step": 24494 }, { "epoch": 4.99, "learning_rate": 4.5094870722406365e-09, "loss": 0.0007, "step": 24495 }, { "epoch": 4.99, "learning_rate": 4.3604241939998455e-09, "loss": 0.0003, "step": 24496 }, { "epoch": 4.99, "learning_rate": 4.213866526081577e-09, "loss": 0.0034, "step": 24497 }, { "epoch": 4.99, "learning_rate": 4.069814070917221e-09, "loss": 0.0014, "step": 24498 }, { "epoch": 4.99, "learning_rate": 3.928266830938165e-09, "loss": 0.0001, "step": 24499 }, { "epoch": 4.99, "learning_rate": 3.78922480849253e-09, "loss": 0.0058, "step": 24500 }, { "epoch": 4.99, "learning_rate": 3.6526880058951325e-09, "loss": 0.0022, "step": 24501 }, { "epoch": 4.99, "learning_rate": 3.518656425444133e-09, "loss": 0.0011, "step": 24502 }, { "epoch": 4.99, "learning_rate": 3.3871300693710803e-09, "loss": 0.0003, "step": 24503 }, { "epoch": 4.99, "learning_rate": 3.2581089398742155e-09, "loss": 0.0013, "step": 24504 }, { "epoch": 4.99, "learning_rate": 3.1315930391018207e-09, "loss": 0.0002, "step": 24505 }, { "epoch": 4.99, "learning_rate": 3.0075823691688705e-09, "loss": 0.0005, "step": 24506 }, { "epoch": 4.99, "learning_rate": 2.8860769321403797e-09, "loss": 0.0014, "step": 24507 }, { "epoch": 4.99, "learning_rate": 2.76707673006471e-09, "loss": 0.0002, "step": 24508 }, { "epoch": 4.99, "learning_rate": 2.6505817649236095e-09, "loss": 0.0001, "step": 24509 }, { "epoch": 4.99, "learning_rate": 2.536592038648866e-09, "loss": 0.0058, "step": 24510 }, { "epoch": 4.99, "learning_rate": 2.425107553155614e-09, "loss": 0.001, "step": 24511 }, { "epoch": 4.99, "learning_rate": 2.316128310309029e-09, "loss": 0.0006, "step": 24512 }, { "epoch": 4.99, "learning_rate": 2.209654311924325e-09, "loss": 0.0002, "step": 24513 }, { "epoch": 4.99, "learning_rate": 2.1056855597667566e-09, "loss": 0.0008, "step": 24514 }, { "epoch": 4.99, "learning_rate": 2.0042220556015788e-09, "loss": 0.0002, "step": 24515 }, { "epoch": 4.99, "learning_rate": 1.9052638010941255e-09, "loss": 0.0007, "step": 24516 }, { "epoch": 4.99, "learning_rate": 1.808810797909732e-09, "loss": 0.0014, "step": 24517 }, { "epoch": 4.99, "learning_rate": 1.7148630476637727e-09, "loss": 0.0101, "step": 24518 }, { "epoch": 4.99, "learning_rate": 1.6234205519216615e-09, "loss": 0.0012, "step": 24519 }, { "epoch": 4.99, "learning_rate": 1.5344833122155064e-09, "loss": 0.001, "step": 24520 }, { "epoch": 4.99, "learning_rate": 1.448051330010802e-09, "loss": 0.0008, "step": 24521 }, { "epoch": 4.99, "learning_rate": 1.364124606789696e-09, "loss": 0.0002, "step": 24522 }, { "epoch": 4.99, "learning_rate": 1.2827031439177626e-09, "loss": 0.0008, "step": 24523 }, { "epoch": 4.99, "learning_rate": 1.2037869427605762e-09, "loss": 0.0039, "step": 24524 }, { "epoch": 4.99, "learning_rate": 1.1273760046504043e-09, "loss": 0.0054, "step": 24525 }, { "epoch": 4.99, "learning_rate": 1.0534703308529013e-09, "loss": 0.0021, "step": 24526 }, { "epoch": 4.99, "learning_rate": 9.820699226004147e-10, "loss": 0.0027, "step": 24527 }, { "epoch": 4.99, "learning_rate": 9.131747811086387e-10, "loss": 0.0003, "step": 24528 }, { "epoch": 4.99, "learning_rate": 8.467849074933474e-10, "loss": 0.0001, "step": 24529 }, { "epoch": 4.99, "learning_rate": 7.829003028869684e-10, "loss": 0.0032, "step": 24530 }, { "epoch": 4.99, "learning_rate": 7.215209683386624e-10, "loss": 0.001, "step": 24531 }, { "epoch": 5.0, "learning_rate": 6.626469048975902e-10, "loss": 0.001, "step": 24532 }, { "epoch": 5.0, "learning_rate": 6.062781135296457e-10, "loss": 0.0072, "step": 24533 }, { "epoch": 5.0, "learning_rate": 5.524145951840698e-10, "loss": 0.0001, "step": 24534 }, { "epoch": 5.0, "learning_rate": 5.010563507601428e-10, "loss": 0.0006, "step": 24535 }, { "epoch": 5.0, "learning_rate": 4.5220338110718566e-10, "loss": 0.0007, "step": 24536 }, { "epoch": 5.0, "learning_rate": 4.058556870412122e-10, "loss": 0.0055, "step": 24537 }, { "epoch": 5.0, "learning_rate": 3.620132693449296e-10, "loss": 0.0003, "step": 24538 }, { "epoch": 5.0, "learning_rate": 3.206761287510851e-10, "loss": 0.0002, "step": 24539 }, { "epoch": 5.0, "learning_rate": 2.8184426594246576e-10, "loss": 0.0051, "step": 24540 }, { "epoch": 5.0, "learning_rate": 2.4551768158520557e-10, "loss": 0.0038, "step": 24541 }, { "epoch": 5.0, "learning_rate": 2.1169637626217151e-10, "loss": 0.0026, "step": 24542 }, { "epoch": 5.0, "learning_rate": 1.8038035053957734e-10, "loss": 0.0, "step": 24543 }, { "epoch": 5.0, "learning_rate": 1.5156960496698345e-10, "loss": 0.0008, "step": 24544 }, { "epoch": 5.0, "learning_rate": 1.2526413999403019e-10, "loss": 0.0001, "step": 24545 }, { "epoch": 5.0, "learning_rate": 1.0146395607035784e-10, "loss": 0.0039, "step": 24546 }, { "epoch": 5.0, "learning_rate": 8.016905361230009e-11, "loss": 0.0028, "step": 24547 }, { "epoch": 5.0, "learning_rate": 6.13794329529238e-11, "loss": 0.0007, "step": 24548 }, { "epoch": 5.0, "learning_rate": 4.509509440864256e-11, "loss": 0.0009, "step": 24549 }, { "epoch": 5.0, "learning_rate": 3.131603826256324e-11, "loss": 0.0013, "step": 24550 }, { "epoch": 5.0, "learning_rate": 2.004226474783266e-11, "loss": 0.0001, "step": 24551 }, { "epoch": 5.0, "learning_rate": 1.1273774030984284e-11, "loss": 0.0021, "step": 24552 }, { "epoch": 5.0, "learning_rate": 5.010566261898219e-12, "loss": 0.0004, "step": 24553 }, { "epoch": 5.0, "learning_rate": 1.2526415738012274e-12, "loss": 0.0001, "step": 24554 }, { "epoch": 5.0, "learning_rate": 0.0, "loss": 0.0014, "step": 24555 }, { "epoch": 5.0, "step": 24555, "total_flos": 1.9137197607726612e+18, "train_loss": 0.013171266583756296, "train_runtime": 80458.8335, "train_samples_per_second": 4.883, "train_steps_per_second": 0.305 } ], "logging_steps": 1.0, "max_steps": 24555, "num_input_tokens_seen": 0, "num_train_epochs": 5, "save_steps": 1000, "total_flos": 1.9137197607726612e+18, "train_batch_size": 2, "trial_name": null, "trial_params": null }